xref: /qemu/tcg/tcg.c (revision b016486e7baddb43cfc1e51909b05cde9cf82e0c)
1c896fe29Sbellard /*
2c896fe29Sbellard  * Tiny Code Generator for QEMU
3c896fe29Sbellard  *
4c896fe29Sbellard  * Copyright (c) 2008 Fabrice Bellard
5c896fe29Sbellard  *
6c896fe29Sbellard  * Permission is hereby granted, free of charge, to any person obtaining a copy
7c896fe29Sbellard  * of this software and associated documentation files (the "Software"), to deal
8c896fe29Sbellard  * in the Software without restriction, including without limitation the rights
9c896fe29Sbellard  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10c896fe29Sbellard  * copies of the Software, and to permit persons to whom the Software is
11c896fe29Sbellard  * furnished to do so, subject to the following conditions:
12c896fe29Sbellard  *
13c896fe29Sbellard  * The above copyright notice and this permission notice shall be included in
14c896fe29Sbellard  * all copies or substantial portions of the Software.
15c896fe29Sbellard  *
16c896fe29Sbellard  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17c896fe29Sbellard  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18c896fe29Sbellard  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19c896fe29Sbellard  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20c896fe29Sbellard  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21c896fe29Sbellard  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22c896fe29Sbellard  * THE SOFTWARE.
23c896fe29Sbellard  */
24c896fe29Sbellard 
25c896fe29Sbellard /* define it to use liveness analysis (better code) */
268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS
27c896fe29Sbellard 
28757e725bSPeter Maydell #include "qemu/osdep.h"
29cca82982Saurel32 
/* Define to dump the ELF file used to communicate with GDB.  */
31813da627SRichard Henderson #undef DEBUG_JIT
32813da627SRichard Henderson 
3372fd2efbSEmilio G. Cota #include "qemu/error-report.h"
34f348b6d1SVeronia Bahaa #include "qemu/cutils.h"
351de7afc9SPaolo Bonzini #include "qemu/host-utils.h"
361de7afc9SPaolo Bonzini #include "qemu/timer.h"
37c896fe29Sbellard 
38c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU
39c896fe29Sbellard    CPU definitions. Currently they are used for qemu_ld/st
40c896fe29Sbellard    instructions */
41c896fe29Sbellard #define NO_CPU_IO_DEFS
42c896fe29Sbellard #include "cpu.h"
43c896fe29Sbellard 
4463c91552SPaolo Bonzini #include "exec/cpu-common.h"
4563c91552SPaolo Bonzini #include "exec/exec-all.h"
4663c91552SPaolo Bonzini 
47c896fe29Sbellard #include "tcg-op.h"
48813da627SRichard Henderson 
/*
 * ELF identification values for the host, selected before "elf.h" is
 * included: ELF_CLASS follows the width of uintptr_t and ELF_DATA follows
 * HOST_WORDS_BIGENDIAN.
 */
#if UINTPTR_MAX != UINT32_MAX
# define ELF_CLASS  ELFCLASS64
#else
# define ELF_CLASS  ELFCLASS32
#endif
#ifndef HOST_WORDS_BIGENDIAN
# define ELF_DATA   ELFDATA2LSB
#else
# define ELF_DATA   ELFDATA2MSB
#endif
59813da627SRichard Henderson 
60c896fe29Sbellard #include "elf.h"
61508127e2SPaolo Bonzini #include "exec/log.h"
623468b59eSEmilio G. Cota #include "sysemu/sysemu.h"
63c896fe29Sbellard 
64ce151109SPeter Maydell /* Forward declarations for functions declared in tcg-target.inc.c and
65ce151109SPeter Maydell    used here. */
66e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s);
67f69d277eSRichard Henderson static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode);
68e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s);
696ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type,
702ba7fae2SRichard Henderson                         intptr_t value, intptr_t addend);
71c896fe29Sbellard 
72497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts.  */
/*
 * CIE portion of the debug frame.  The structure is not packed; its first
 * member is aligned to the host pointer size.
 * NOTE(review): field names appear to mirror the DWARF .debug_frame CIE
 * layout -- confirm against the DWARF specification before changing them.
 */
typedef struct {
    uint32_t len __attribute__((aligned(sizeof(void *))));
    uint32_t id;
    uint8_t  version;
    char     augmentation[1];
    uint8_t  code_align;
    uint8_t  data_align;
    uint8_t  return_column;
} DebugFrameCIE;
82497a22ebSRichard Henderson 
/*
 * Fixed-size head of an FDE: a length, the offset of the owning CIE, and
 * the start address and length of the described function.  The structure
 * is packed and its first member is aligned to the host pointer size.
 */
typedef struct QEMU_PACKED {
    uint32_t  len __attribute__((aligned(sizeof(void *))));
    uint32_t  cie_offset;
    uintptr_t func_start;
    uintptr_t func_len;
} DebugFrameFDEHeader;
89497a22ebSRichard Henderson 
902c90784aSRichard Henderson typedef struct QEMU_PACKED {
912c90784aSRichard Henderson     DebugFrameCIE cie;
922c90784aSRichard Henderson     DebugFrameFDEHeader fde;
932c90784aSRichard Henderson } DebugFrameHeader;
942c90784aSRichard Henderson 
/*
 * Prototype only; marked unused so that a build in which nothing calls it
 * does not trigger an unused-function warning.
 */
static __attribute__((unused))
void tcg_register_jit_int(void *buf,
                          size_t size,
                          const void *debug_frame,
                          size_t debug_frame_size);
99813da627SRichard Henderson 
100ce151109SPeter Maydell /* Forward declarations for functions declared and used in tcg-target.inc.c. */
101069ea736SRichard Henderson static const char *target_parse_constraint(TCGArgConstraint *ct,
102069ea736SRichard Henderson                                            const char *ct_str, TCGType type);
1032a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1,
104a05b5b9bSRichard Henderson                        intptr_t arg2);
1052a534affSRichard Henderson static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg);
106c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type,
1072a534affSRichard Henderson                          TCGReg ret, tcg_target_long arg);
108c0ad3001SStefan Weil static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
109c0ad3001SStefan Weil                        const int *const_args);
110d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec
111d2fd745fSRichard Henderson static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl,
112d2fd745fSRichard Henderson                            unsigned vece, const TCGArg *args,
113d2fd745fSRichard Henderson                            const int *const_args);
114d2fd745fSRichard Henderson #else
115d2fd745fSRichard Henderson static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl,
116d2fd745fSRichard Henderson                                   unsigned vece, const TCGArg *args,
117d2fd745fSRichard Henderson                                   const int *const_args)
118d2fd745fSRichard Henderson {
119d2fd745fSRichard Henderson     g_assert_not_reached();
120d2fd745fSRichard Henderson }
121d2fd745fSRichard Henderson #endif
1222a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
123a05b5b9bSRichard Henderson                        intptr_t arg2);
12459d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
12559d7c14eSRichard Henderson                         TCGReg base, intptr_t ofs);
126cf066674SRichard Henderson static void tcg_out_call(TCGContext *s, tcg_insn_unit *target);
127f6c6afc1SRichard Henderson static int tcg_target_const_match(tcg_target_long val, TCGType type,
128c0ad3001SStefan Weil                                   const TCGArgConstraint *arg_ct);
129659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS
130659ef5cbSRichard Henderson static bool tcg_out_ldst_finalize(TCGContext *s);
131659ef5cbSRichard Henderson #endif
132c896fe29Sbellard 
133a505785cSEmilio G. Cota #define TCG_HIGHWATER 1024
134a505785cSEmilio G. Cota 
135df2cce29SEmilio G. Cota static TCGContext **tcg_ctxs;
136df2cce29SEmilio G. Cota static unsigned int n_tcg_ctxs;
1371c2adb95SRichard Henderson TCGv_env cpu_env = 0;
138df2cce29SEmilio G. Cota 
139be2cdc5eSEmilio G. Cota struct tcg_region_tree {
140be2cdc5eSEmilio G. Cota     QemuMutex lock;
141be2cdc5eSEmilio G. Cota     GTree *tree;
142be2cdc5eSEmilio G. Cota     /* padding to avoid false sharing is computed at run-time */
143be2cdc5eSEmilio G. Cota };
144be2cdc5eSEmilio G. Cota 
145e8feb96fSEmilio G. Cota /*
146e8feb96fSEmilio G. Cota  * We divide code_gen_buffer into equally-sized "regions" that TCG threads
147e8feb96fSEmilio G. Cota  * dynamically allocate from as demand dictates. Given appropriate region
148e8feb96fSEmilio G. Cota  * sizing, this minimizes flushes even when some TCG threads generate a lot
149e8feb96fSEmilio G. Cota  * more code than others.
150e8feb96fSEmilio G. Cota  */
151e8feb96fSEmilio G. Cota struct tcg_region_state {
152e8feb96fSEmilio G. Cota     QemuMutex lock;
153e8feb96fSEmilio G. Cota 
154e8feb96fSEmilio G. Cota     /* fields set at init time */
155e8feb96fSEmilio G. Cota     void *start;
156e8feb96fSEmilio G. Cota     void *start_aligned;
157e8feb96fSEmilio G. Cota     void *end;
158e8feb96fSEmilio G. Cota     size_t n;
159e8feb96fSEmilio G. Cota     size_t size; /* size of one region */
160e8feb96fSEmilio G. Cota     size_t stride; /* .size + guard size */
161e8feb96fSEmilio G. Cota 
162e8feb96fSEmilio G. Cota     /* fields protected by the lock */
163e8feb96fSEmilio G. Cota     size_t current; /* current region index */
164e8feb96fSEmilio G. Cota     size_t agg_size_full; /* aggregate size of full regions */
165e8feb96fSEmilio G. Cota };
166e8feb96fSEmilio G. Cota 
167e8feb96fSEmilio G. Cota static struct tcg_region_state region;
168be2cdc5eSEmilio G. Cota /*
169be2cdc5eSEmilio G. Cota  * This is an array of struct tcg_region_tree's, with padding.
170be2cdc5eSEmilio G. Cota  * We use void * to simplify the computation of region_trees[i]; each
171be2cdc5eSEmilio G. Cota  * struct is found every tree_size bytes.
172be2cdc5eSEmilio G. Cota  */
173be2cdc5eSEmilio G. Cota static void *region_trees;
174be2cdc5eSEmilio G. Cota static size_t tree_size;
175d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT];
176b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs;
177c896fe29Sbellard 
1781813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1
1794196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v)
180c896fe29Sbellard {
181c896fe29Sbellard     *s->code_ptr++ = v;
182c896fe29Sbellard }
183c896fe29Sbellard 
1844196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p,
1854196dca6SPeter Maydell                                                       uint8_t v)
1865c53bb81SPeter Maydell {
1871813e175SRichard Henderson     *p = v;
1885c53bb81SPeter Maydell }
1891813e175SRichard Henderson #endif
1905c53bb81SPeter Maydell 
1911813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2
1924196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v)
193c896fe29Sbellard {
1941813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 2) {
1951813e175SRichard Henderson         *s->code_ptr++ = v;
1961813e175SRichard Henderson     } else {
1971813e175SRichard Henderson         tcg_insn_unit *p = s->code_ptr;
1984387345aSPeter Maydell         memcpy(p, &v, sizeof(v));
1991813e175SRichard Henderson         s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE);
2001813e175SRichard Henderson     }
201c896fe29Sbellard }
202c896fe29Sbellard 
2034196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p,
2044196dca6SPeter Maydell                                                        uint16_t v)
2055c53bb81SPeter Maydell {
2061813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 2) {
2071813e175SRichard Henderson         *p = v;
2081813e175SRichard Henderson     } else {
2095c53bb81SPeter Maydell         memcpy(p, &v, sizeof(v));
2105c53bb81SPeter Maydell     }
2111813e175SRichard Henderson }
2121813e175SRichard Henderson #endif
2135c53bb81SPeter Maydell 
2141813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4
2154196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v)
216c896fe29Sbellard {
2171813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 4) {
2181813e175SRichard Henderson         *s->code_ptr++ = v;
2191813e175SRichard Henderson     } else {
2201813e175SRichard Henderson         tcg_insn_unit *p = s->code_ptr;
2214387345aSPeter Maydell         memcpy(p, &v, sizeof(v));
2221813e175SRichard Henderson         s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE);
2231813e175SRichard Henderson     }
224c896fe29Sbellard }
225c896fe29Sbellard 
2264196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p,
2274196dca6SPeter Maydell                                                        uint32_t v)
2285c53bb81SPeter Maydell {
2291813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 4) {
2301813e175SRichard Henderson         *p = v;
2311813e175SRichard Henderson     } else {
2325c53bb81SPeter Maydell         memcpy(p, &v, sizeof(v));
2335c53bb81SPeter Maydell     }
2341813e175SRichard Henderson }
2351813e175SRichard Henderson #endif
2365c53bb81SPeter Maydell 
2371813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8
2384196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v)
239ac26eb69SRichard Henderson {
2401813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 8) {
2411813e175SRichard Henderson         *s->code_ptr++ = v;
2421813e175SRichard Henderson     } else {
2431813e175SRichard Henderson         tcg_insn_unit *p = s->code_ptr;
2444387345aSPeter Maydell         memcpy(p, &v, sizeof(v));
2451813e175SRichard Henderson         s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE);
2461813e175SRichard Henderson     }
247ac26eb69SRichard Henderson }
248ac26eb69SRichard Henderson 
2494196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p,
2504196dca6SPeter Maydell                                                        uint64_t v)
2515c53bb81SPeter Maydell {
2521813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 8) {
2531813e175SRichard Henderson         *p = v;
2541813e175SRichard Henderson     } else {
2555c53bb81SPeter Maydell         memcpy(p, &v, sizeof(v));
2565c53bb81SPeter Maydell     }
2571813e175SRichard Henderson }
2581813e175SRichard Henderson #endif
2595c53bb81SPeter Maydell 
260c896fe29Sbellard /* label relocation processing */
261c896fe29Sbellard 
2621813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type,
263bec16311SRichard Henderson                           TCGLabel *l, intptr_t addend)
264c896fe29Sbellard {
265c896fe29Sbellard     TCGRelocation *r;
266c896fe29Sbellard 
267c896fe29Sbellard     if (l->has_value) {
268623e265cSpbrook         /* FIXME: This may break relocations on RISC targets that
269623e265cSpbrook            modify instruction fields in place.  The caller may not have
270623e265cSpbrook            written the initial value.  */
2716ac17786SRichard Henderson         bool ok = patch_reloc(code_ptr, type, l->u.value, addend);
2726ac17786SRichard Henderson         tcg_debug_assert(ok);
273c896fe29Sbellard     } else {
274c896fe29Sbellard         /* add a new relocation entry */
275c896fe29Sbellard         r = tcg_malloc(sizeof(TCGRelocation));
276c896fe29Sbellard         r->type = type;
277c896fe29Sbellard         r->ptr = code_ptr;
278c896fe29Sbellard         r->addend = addend;
279c896fe29Sbellard         r->next = l->u.first_reloc;
280c896fe29Sbellard         l->u.first_reloc = r;
281c896fe29Sbellard     }
282c896fe29Sbellard }
283c896fe29Sbellard 
284bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr)
285c896fe29Sbellard {
2862ba7fae2SRichard Henderson     intptr_t value = (intptr_t)ptr;
2871813e175SRichard Henderson     TCGRelocation *r;
288c896fe29Sbellard 
289eabb7b91SAurelien Jarno     tcg_debug_assert(!l->has_value);
2901813e175SRichard Henderson 
2911813e175SRichard Henderson     for (r = l->u.first_reloc; r != NULL; r = r->next) {
2926ac17786SRichard Henderson         bool ok = patch_reloc(r->ptr, r->type, value, r->addend);
2936ac17786SRichard Henderson         tcg_debug_assert(ok);
294c896fe29Sbellard     }
2951813e175SRichard Henderson 
296c896fe29Sbellard     l->has_value = 1;
2971813e175SRichard Henderson     l->u.value_ptr = ptr;
298c896fe29Sbellard }
299c896fe29Sbellard 
30042a268c2SRichard Henderson TCGLabel *gen_new_label(void)
301c896fe29Sbellard {
302b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
30351e3972cSRichard Henderson     TCGLabel *l = tcg_malloc(sizeof(TCGLabel));
304c896fe29Sbellard 
30551e3972cSRichard Henderson     *l = (TCGLabel){
30651e3972cSRichard Henderson         .id = s->nb_labels++
30751e3972cSRichard Henderson     };
30842a268c2SRichard Henderson 
30942a268c2SRichard Henderson     return l;
310c896fe29Sbellard }
311c896fe29Sbellard 
3129f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which)
3139f754620SRichard Henderson {
3149f754620SRichard Henderson     size_t off = tcg_current_code_size(s);
3159f754620SRichard Henderson     s->tb_jmp_reset_offset[which] = off;
3169f754620SRichard Henderson     /* Make sure that we didn't overflow the stored offset.  */
3179f754620SRichard Henderson     assert(s->tb_jmp_reset_offset[which] == off);
3189f754620SRichard Henderson }
3199f754620SRichard Henderson 
320ce151109SPeter Maydell #include "tcg-target.inc.c"
321c896fe29Sbellard 
322be2cdc5eSEmilio G. Cota /* compare a pointer @ptr and a tb_tc @s */
323be2cdc5eSEmilio G. Cota static int ptr_cmp_tb_tc(const void *ptr, const struct tb_tc *s)
324be2cdc5eSEmilio G. Cota {
325be2cdc5eSEmilio G. Cota     if (ptr >= s->ptr + s->size) {
326be2cdc5eSEmilio G. Cota         return 1;
327be2cdc5eSEmilio G. Cota     } else if (ptr < s->ptr) {
328be2cdc5eSEmilio G. Cota         return -1;
329be2cdc5eSEmilio G. Cota     }
330be2cdc5eSEmilio G. Cota     return 0;
331be2cdc5eSEmilio G. Cota }
332be2cdc5eSEmilio G. Cota 
333be2cdc5eSEmilio G. Cota static gint tb_tc_cmp(gconstpointer ap, gconstpointer bp)
334be2cdc5eSEmilio G. Cota {
335be2cdc5eSEmilio G. Cota     const struct tb_tc *a = ap;
336be2cdc5eSEmilio G. Cota     const struct tb_tc *b = bp;
337be2cdc5eSEmilio G. Cota 
338be2cdc5eSEmilio G. Cota     /*
339be2cdc5eSEmilio G. Cota      * When both sizes are set, we know this isn't a lookup.
340be2cdc5eSEmilio G. Cota      * This is the most likely case: every TB must be inserted; lookups
341be2cdc5eSEmilio G. Cota      * are a lot less frequent.
342be2cdc5eSEmilio G. Cota      */
343be2cdc5eSEmilio G. Cota     if (likely(a->size && b->size)) {
344be2cdc5eSEmilio G. Cota         if (a->ptr > b->ptr) {
345be2cdc5eSEmilio G. Cota             return 1;
346be2cdc5eSEmilio G. Cota         } else if (a->ptr < b->ptr) {
347be2cdc5eSEmilio G. Cota             return -1;
348be2cdc5eSEmilio G. Cota         }
349be2cdc5eSEmilio G. Cota         /* a->ptr == b->ptr should happen only on deletions */
350be2cdc5eSEmilio G. Cota         g_assert(a->size == b->size);
351be2cdc5eSEmilio G. Cota         return 0;
352be2cdc5eSEmilio G. Cota     }
353be2cdc5eSEmilio G. Cota     /*
354be2cdc5eSEmilio G. Cota      * All lookups have either .size field set to 0.
355be2cdc5eSEmilio G. Cota      * From the glib sources we see that @ap is always the lookup key. However
356be2cdc5eSEmilio G. Cota      * the docs provide no guarantee, so we just mark this case as likely.
357be2cdc5eSEmilio G. Cota      */
358be2cdc5eSEmilio G. Cota     if (likely(a->size == 0)) {
359be2cdc5eSEmilio G. Cota         return ptr_cmp_tb_tc(a->ptr, b);
360be2cdc5eSEmilio G. Cota     }
361be2cdc5eSEmilio G. Cota     return ptr_cmp_tb_tc(b->ptr, a);
362be2cdc5eSEmilio G. Cota }
363be2cdc5eSEmilio G. Cota 
364be2cdc5eSEmilio G. Cota static void tcg_region_trees_init(void)
365be2cdc5eSEmilio G. Cota {
366be2cdc5eSEmilio G. Cota     size_t i;
367be2cdc5eSEmilio G. Cota 
368be2cdc5eSEmilio G. Cota     tree_size = ROUND_UP(sizeof(struct tcg_region_tree), qemu_dcache_linesize);
369be2cdc5eSEmilio G. Cota     region_trees = qemu_memalign(qemu_dcache_linesize, region.n * tree_size);
370be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
371be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
372be2cdc5eSEmilio G. Cota 
373be2cdc5eSEmilio G. Cota         qemu_mutex_init(&rt->lock);
374be2cdc5eSEmilio G. Cota         rt->tree = g_tree_new(tb_tc_cmp);
375be2cdc5eSEmilio G. Cota     }
376be2cdc5eSEmilio G. Cota }
377be2cdc5eSEmilio G. Cota 
378be2cdc5eSEmilio G. Cota static struct tcg_region_tree *tc_ptr_to_region_tree(void *p)
379be2cdc5eSEmilio G. Cota {
380be2cdc5eSEmilio G. Cota     size_t region_idx;
381be2cdc5eSEmilio G. Cota 
382be2cdc5eSEmilio G. Cota     if (p < region.start_aligned) {
383be2cdc5eSEmilio G. Cota         region_idx = 0;
384be2cdc5eSEmilio G. Cota     } else {
385be2cdc5eSEmilio G. Cota         ptrdiff_t offset = p - region.start_aligned;
386be2cdc5eSEmilio G. Cota 
387be2cdc5eSEmilio G. Cota         if (offset > region.stride * (region.n - 1)) {
388be2cdc5eSEmilio G. Cota             region_idx = region.n - 1;
389be2cdc5eSEmilio G. Cota         } else {
390be2cdc5eSEmilio G. Cota             region_idx = offset / region.stride;
391be2cdc5eSEmilio G. Cota         }
392be2cdc5eSEmilio G. Cota     }
393be2cdc5eSEmilio G. Cota     return region_trees + region_idx * tree_size;
394be2cdc5eSEmilio G. Cota }
395be2cdc5eSEmilio G. Cota 
396be2cdc5eSEmilio G. Cota void tcg_tb_insert(TranslationBlock *tb)
397be2cdc5eSEmilio G. Cota {
398be2cdc5eSEmilio G. Cota     struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr);
399be2cdc5eSEmilio G. Cota 
400be2cdc5eSEmilio G. Cota     qemu_mutex_lock(&rt->lock);
401be2cdc5eSEmilio G. Cota     g_tree_insert(rt->tree, &tb->tc, tb);
402be2cdc5eSEmilio G. Cota     qemu_mutex_unlock(&rt->lock);
403be2cdc5eSEmilio G. Cota }
404be2cdc5eSEmilio G. Cota 
405be2cdc5eSEmilio G. Cota void tcg_tb_remove(TranslationBlock *tb)
406be2cdc5eSEmilio G. Cota {
407be2cdc5eSEmilio G. Cota     struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr);
408be2cdc5eSEmilio G. Cota 
409be2cdc5eSEmilio G. Cota     qemu_mutex_lock(&rt->lock);
410be2cdc5eSEmilio G. Cota     g_tree_remove(rt->tree, &tb->tc);
411be2cdc5eSEmilio G. Cota     qemu_mutex_unlock(&rt->lock);
412be2cdc5eSEmilio G. Cota }
413be2cdc5eSEmilio G. Cota 
414be2cdc5eSEmilio G. Cota /*
415be2cdc5eSEmilio G. Cota  * Find the TB 'tb' such that
416be2cdc5eSEmilio G. Cota  * tb->tc.ptr <= tc_ptr < tb->tc.ptr + tb->tc.size
417be2cdc5eSEmilio G. Cota  * Return NULL if not found.
418be2cdc5eSEmilio G. Cota  */
419be2cdc5eSEmilio G. Cota TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr)
420be2cdc5eSEmilio G. Cota {
421be2cdc5eSEmilio G. Cota     struct tcg_region_tree *rt = tc_ptr_to_region_tree((void *)tc_ptr);
422be2cdc5eSEmilio G. Cota     TranslationBlock *tb;
423be2cdc5eSEmilio G. Cota     struct tb_tc s = { .ptr = (void *)tc_ptr };
424be2cdc5eSEmilio G. Cota 
425be2cdc5eSEmilio G. Cota     qemu_mutex_lock(&rt->lock);
426be2cdc5eSEmilio G. Cota     tb = g_tree_lookup(rt->tree, &s);
427be2cdc5eSEmilio G. Cota     qemu_mutex_unlock(&rt->lock);
428be2cdc5eSEmilio G. Cota     return tb;
429be2cdc5eSEmilio G. Cota }
430be2cdc5eSEmilio G. Cota 
431be2cdc5eSEmilio G. Cota static void tcg_region_tree_lock_all(void)
432be2cdc5eSEmilio G. Cota {
433be2cdc5eSEmilio G. Cota     size_t i;
434be2cdc5eSEmilio G. Cota 
435be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
436be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
437be2cdc5eSEmilio G. Cota 
438be2cdc5eSEmilio G. Cota         qemu_mutex_lock(&rt->lock);
439be2cdc5eSEmilio G. Cota     }
440be2cdc5eSEmilio G. Cota }
441be2cdc5eSEmilio G. Cota 
442be2cdc5eSEmilio G. Cota static void tcg_region_tree_unlock_all(void)
443be2cdc5eSEmilio G. Cota {
444be2cdc5eSEmilio G. Cota     size_t i;
445be2cdc5eSEmilio G. Cota 
446be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
447be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
448be2cdc5eSEmilio G. Cota 
449be2cdc5eSEmilio G. Cota         qemu_mutex_unlock(&rt->lock);
450be2cdc5eSEmilio G. Cota     }
451be2cdc5eSEmilio G. Cota }
452be2cdc5eSEmilio G. Cota 
453be2cdc5eSEmilio G. Cota void tcg_tb_foreach(GTraverseFunc func, gpointer user_data)
454be2cdc5eSEmilio G. Cota {
455be2cdc5eSEmilio G. Cota     size_t i;
456be2cdc5eSEmilio G. Cota 
457be2cdc5eSEmilio G. Cota     tcg_region_tree_lock_all();
458be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
459be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
460be2cdc5eSEmilio G. Cota 
461be2cdc5eSEmilio G. Cota         g_tree_foreach(rt->tree, func, user_data);
462be2cdc5eSEmilio G. Cota     }
463be2cdc5eSEmilio G. Cota     tcg_region_tree_unlock_all();
464be2cdc5eSEmilio G. Cota }
465be2cdc5eSEmilio G. Cota 
466be2cdc5eSEmilio G. Cota size_t tcg_nb_tbs(void)
467be2cdc5eSEmilio G. Cota {
468be2cdc5eSEmilio G. Cota     size_t nb_tbs = 0;
469be2cdc5eSEmilio G. Cota     size_t i;
470be2cdc5eSEmilio G. Cota 
471be2cdc5eSEmilio G. Cota     tcg_region_tree_lock_all();
472be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
473be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
474be2cdc5eSEmilio G. Cota 
475be2cdc5eSEmilio G. Cota         nb_tbs += g_tree_nnodes(rt->tree);
476be2cdc5eSEmilio G. Cota     }
477be2cdc5eSEmilio G. Cota     tcg_region_tree_unlock_all();
478be2cdc5eSEmilio G. Cota     return nb_tbs;
479be2cdc5eSEmilio G. Cota }
480be2cdc5eSEmilio G. Cota 
481be2cdc5eSEmilio G. Cota static void tcg_region_tree_reset_all(void)
482be2cdc5eSEmilio G. Cota {
483be2cdc5eSEmilio G. Cota     size_t i;
484be2cdc5eSEmilio G. Cota 
485be2cdc5eSEmilio G. Cota     tcg_region_tree_lock_all();
486be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
487be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
488be2cdc5eSEmilio G. Cota 
489be2cdc5eSEmilio G. Cota         /* Increment the refcount first so that destroy acts as a reset */
490be2cdc5eSEmilio G. Cota         g_tree_ref(rt->tree);
491be2cdc5eSEmilio G. Cota         g_tree_destroy(rt->tree);
492be2cdc5eSEmilio G. Cota     }
493be2cdc5eSEmilio G. Cota     tcg_region_tree_unlock_all();
494be2cdc5eSEmilio G. Cota }
495be2cdc5eSEmilio G. Cota 
496e8feb96fSEmilio G. Cota static void tcg_region_bounds(size_t curr_region, void **pstart, void **pend)
497e8feb96fSEmilio G. Cota {
498e8feb96fSEmilio G. Cota     void *start, *end;
499e8feb96fSEmilio G. Cota 
500e8feb96fSEmilio G. Cota     start = region.start_aligned + curr_region * region.stride;
501e8feb96fSEmilio G. Cota     end = start + region.size;
502e8feb96fSEmilio G. Cota 
503e8feb96fSEmilio G. Cota     if (curr_region == 0) {
504e8feb96fSEmilio G. Cota         start = region.start;
505e8feb96fSEmilio G. Cota     }
506e8feb96fSEmilio G. Cota     if (curr_region == region.n - 1) {
507e8feb96fSEmilio G. Cota         end = region.end;
508e8feb96fSEmilio G. Cota     }
509e8feb96fSEmilio G. Cota 
510e8feb96fSEmilio G. Cota     *pstart = start;
511e8feb96fSEmilio G. Cota     *pend = end;
512e8feb96fSEmilio G. Cota }
513e8feb96fSEmilio G. Cota 
514e8feb96fSEmilio G. Cota static void tcg_region_assign(TCGContext *s, size_t curr_region)
515e8feb96fSEmilio G. Cota {
516e8feb96fSEmilio G. Cota     void *start, *end;
517e8feb96fSEmilio G. Cota 
518e8feb96fSEmilio G. Cota     tcg_region_bounds(curr_region, &start, &end);
519e8feb96fSEmilio G. Cota 
520e8feb96fSEmilio G. Cota     s->code_gen_buffer = start;
521e8feb96fSEmilio G. Cota     s->code_gen_ptr = start;
522e8feb96fSEmilio G. Cota     s->code_gen_buffer_size = end - start;
523e8feb96fSEmilio G. Cota     s->code_gen_highwater = end - TCG_HIGHWATER;
524e8feb96fSEmilio G. Cota }
525e8feb96fSEmilio G. Cota 
526e8feb96fSEmilio G. Cota static bool tcg_region_alloc__locked(TCGContext *s)
527e8feb96fSEmilio G. Cota {
528e8feb96fSEmilio G. Cota     if (region.current == region.n) {
529e8feb96fSEmilio G. Cota         return true;
530e8feb96fSEmilio G. Cota     }
531e8feb96fSEmilio G. Cota     tcg_region_assign(s, region.current);
532e8feb96fSEmilio G. Cota     region.current++;
533e8feb96fSEmilio G. Cota     return false;
534e8feb96fSEmilio G. Cota }
535e8feb96fSEmilio G. Cota 
536e8feb96fSEmilio G. Cota /*
537e8feb96fSEmilio G. Cota  * Request a new region once the one in use has filled up.
538e8feb96fSEmilio G. Cota  * Returns true on error.
539e8feb96fSEmilio G. Cota  */
540e8feb96fSEmilio G. Cota static bool tcg_region_alloc(TCGContext *s)
541e8feb96fSEmilio G. Cota {
542e8feb96fSEmilio G. Cota     bool err;
543e8feb96fSEmilio G. Cota     /* read the region size now; alloc__locked will overwrite it on success */
544e8feb96fSEmilio G. Cota     size_t size_full = s->code_gen_buffer_size;
545e8feb96fSEmilio G. Cota 
546e8feb96fSEmilio G. Cota     qemu_mutex_lock(&region.lock);
547e8feb96fSEmilio G. Cota     err = tcg_region_alloc__locked(s);
548e8feb96fSEmilio G. Cota     if (!err) {
549e8feb96fSEmilio G. Cota         region.agg_size_full += size_full - TCG_HIGHWATER;
550e8feb96fSEmilio G. Cota     }
551e8feb96fSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
552e8feb96fSEmilio G. Cota     return err;
553e8feb96fSEmilio G. Cota }
554e8feb96fSEmilio G. Cota 
555e8feb96fSEmilio G. Cota /*
556e8feb96fSEmilio G. Cota  * Perform a context's first region allocation.
557e8feb96fSEmilio G. Cota  * This function does _not_ increment region.agg_size_full.
558e8feb96fSEmilio G. Cota  */
559e8feb96fSEmilio G. Cota static inline bool tcg_region_initial_alloc__locked(TCGContext *s)
560e8feb96fSEmilio G. Cota {
561e8feb96fSEmilio G. Cota     return tcg_region_alloc__locked(s);
562e8feb96fSEmilio G. Cota }
563e8feb96fSEmilio G. Cota 
564e8feb96fSEmilio G. Cota /* Call from a safe-work context */
565e8feb96fSEmilio G. Cota void tcg_region_reset_all(void)
566e8feb96fSEmilio G. Cota {
5673468b59eSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
568e8feb96fSEmilio G. Cota     unsigned int i;
569e8feb96fSEmilio G. Cota 
570e8feb96fSEmilio G. Cota     qemu_mutex_lock(&region.lock);
571e8feb96fSEmilio G. Cota     region.current = 0;
572e8feb96fSEmilio G. Cota     region.agg_size_full = 0;
573e8feb96fSEmilio G. Cota 
5743468b59eSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
5753468b59eSEmilio G. Cota         TCGContext *s = atomic_read(&tcg_ctxs[i]);
5763468b59eSEmilio G. Cota         bool err = tcg_region_initial_alloc__locked(s);
577e8feb96fSEmilio G. Cota 
578e8feb96fSEmilio G. Cota         g_assert(!err);
579e8feb96fSEmilio G. Cota     }
580e8feb96fSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
581be2cdc5eSEmilio G. Cota 
582be2cdc5eSEmilio G. Cota     tcg_region_tree_reset_all();
583e8feb96fSEmilio G. Cota }
584e8feb96fSEmilio G. Cota 
5853468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
/* CONFIG_USER_ONLY builds always use exactly one region. */
static size_t tcg_n_regions(void)
{
    const size_t single_region = 1;

    return single_region;
}
5903468b59eSEmilio G. Cota #else
5913468b59eSEmilio G. Cota /*
5923468b59eSEmilio G. Cota  * It is likely that some vCPUs will translate more code than others, so we
5933468b59eSEmilio G. Cota  * first try to set more regions than max_cpus, with those regions being of
5943468b59eSEmilio G. Cota  * reasonable size. If that's not possible we make do by evenly dividing
5953468b59eSEmilio G. Cota  * the code_gen_buffer among the vCPUs.
5963468b59eSEmilio G. Cota  */
5973468b59eSEmilio G. Cota static size_t tcg_n_regions(void)
5983468b59eSEmilio G. Cota {
5993468b59eSEmilio G. Cota     size_t i;
6003468b59eSEmilio G. Cota 
6013468b59eSEmilio G. Cota     /* Use a single region if all we have is one vCPU thread */
6023468b59eSEmilio G. Cota     if (max_cpus == 1 || !qemu_tcg_mttcg_enabled()) {
6033468b59eSEmilio G. Cota         return 1;
6043468b59eSEmilio G. Cota     }
6053468b59eSEmilio G. Cota 
6063468b59eSEmilio G. Cota     /* Try to have more regions than max_cpus, with each region being >= 2 MB */
6073468b59eSEmilio G. Cota     for (i = 8; i > 0; i--) {
6083468b59eSEmilio G. Cota         size_t regions_per_thread = i;
6093468b59eSEmilio G. Cota         size_t region_size;
6103468b59eSEmilio G. Cota 
6113468b59eSEmilio G. Cota         region_size = tcg_init_ctx.code_gen_buffer_size;
6123468b59eSEmilio G. Cota         region_size /= max_cpus * regions_per_thread;
6133468b59eSEmilio G. Cota 
6143468b59eSEmilio G. Cota         if (region_size >= 2 * 1024u * 1024) {
6153468b59eSEmilio G. Cota             return max_cpus * regions_per_thread;
6163468b59eSEmilio G. Cota         }
6173468b59eSEmilio G. Cota     }
6183468b59eSEmilio G. Cota     /* If we can't, then just allocate one region per vCPU thread */
6193468b59eSEmilio G. Cota     return max_cpus;
6203468b59eSEmilio G. Cota }
6213468b59eSEmilio G. Cota #endif
6223468b59eSEmilio G. Cota 
623e8feb96fSEmilio G. Cota /*
624e8feb96fSEmilio G. Cota  * Initializes region partitioning.
625e8feb96fSEmilio G. Cota  *
626e8feb96fSEmilio G. Cota  * Called at init time from the parent thread (i.e. the one calling
627e8feb96fSEmilio G. Cota  * tcg_context_init), after the target's TCG globals have been set.
6283468b59eSEmilio G. Cota  *
6293468b59eSEmilio G. Cota  * Region partitioning works by splitting code_gen_buffer into separate regions,
6303468b59eSEmilio G. Cota  * and then assigning regions to TCG threads so that the threads can translate
6313468b59eSEmilio G. Cota  * code in parallel without synchronization.
6323468b59eSEmilio G. Cota  *
6333468b59eSEmilio G. Cota  * In softmmu the number of TCG threads is bounded by max_cpus, so we use at
6343468b59eSEmilio G. Cota  * least max_cpus regions in MTTCG. In !MTTCG we use a single region.
6353468b59eSEmilio G. Cota  * Note that the TCG options from the command-line (i.e. -accel accel=tcg,[...])
6363468b59eSEmilio G. Cota  * must have been parsed before calling this function, since it calls
6373468b59eSEmilio G. Cota  * qemu_tcg_mttcg_enabled().
6383468b59eSEmilio G. Cota  *
6393468b59eSEmilio G. Cota  * In user-mode we use a single region.  Having multiple regions in user-mode
6403468b59eSEmilio G. Cota  * is not supported, because the number of vCPU threads (recall that each thread
6413468b59eSEmilio G. Cota  * spawned by the guest corresponds to a vCPU thread) is only bounded by the
6423468b59eSEmilio G. Cota  * OS, and usually this number is huge (tens of thousands is not uncommon).
6433468b59eSEmilio G. Cota  * Thus, given this large bound on the number of vCPU threads and the fact
6443468b59eSEmilio G. Cota  * that code_gen_buffer is allocated at compile-time, we cannot guarantee
6453468b59eSEmilio G. Cota  * that the availability of at least one region per vCPU thread.
6463468b59eSEmilio G. Cota  *
6473468b59eSEmilio G. Cota  * However, this user-mode limitation is unlikely to be a significant problem
6483468b59eSEmilio G. Cota  * in practice. Multi-threaded guests share most if not all of their translated
6493468b59eSEmilio G. Cota  * code, which makes parallel code generation less appealing than in softmmu.
650e8feb96fSEmilio G. Cota  */
651e8feb96fSEmilio G. Cota void tcg_region_init(void)
652e8feb96fSEmilio G. Cota {
653e8feb96fSEmilio G. Cota     void *buf = tcg_init_ctx.code_gen_buffer;
654e8feb96fSEmilio G. Cota     void *aligned;
655e8feb96fSEmilio G. Cota     size_t size = tcg_init_ctx.code_gen_buffer_size;
656e8feb96fSEmilio G. Cota     size_t page_size = qemu_real_host_page_size;
657e8feb96fSEmilio G. Cota     size_t region_size;
658e8feb96fSEmilio G. Cota     size_t n_regions;
659e8feb96fSEmilio G. Cota     size_t i;
660e8feb96fSEmilio G. Cota 
6613468b59eSEmilio G. Cota     n_regions = tcg_n_regions();
662e8feb96fSEmilio G. Cota 
663e8feb96fSEmilio G. Cota     /* The first region will be 'aligned - buf' bytes larger than the others */
664e8feb96fSEmilio G. Cota     aligned = QEMU_ALIGN_PTR_UP(buf, page_size);
665e8feb96fSEmilio G. Cota     g_assert(aligned < tcg_init_ctx.code_gen_buffer + size);
666e8feb96fSEmilio G. Cota     /*
667e8feb96fSEmilio G. Cota      * Make region_size a multiple of page_size, using aligned as the start.
668e8feb96fSEmilio G. Cota      * As a result of this we might end up with a few extra pages at the end of
669e8feb96fSEmilio G. Cota      * the buffer; we will assign those to the last region.
670e8feb96fSEmilio G. Cota      */
671e8feb96fSEmilio G. Cota     region_size = (size - (aligned - buf)) / n_regions;
672e8feb96fSEmilio G. Cota     region_size = QEMU_ALIGN_DOWN(region_size, page_size);
673e8feb96fSEmilio G. Cota 
674e8feb96fSEmilio G. Cota     /* A region must have at least 2 pages; one code, one guard */
675e8feb96fSEmilio G. Cota     g_assert(region_size >= 2 * page_size);
676e8feb96fSEmilio G. Cota 
677e8feb96fSEmilio G. Cota     /* init the region struct */
678e8feb96fSEmilio G. Cota     qemu_mutex_init(&region.lock);
679e8feb96fSEmilio G. Cota     region.n = n_regions;
680e8feb96fSEmilio G. Cota     region.size = region_size - page_size;
681e8feb96fSEmilio G. Cota     region.stride = region_size;
682e8feb96fSEmilio G. Cota     region.start = buf;
683e8feb96fSEmilio G. Cota     region.start_aligned = aligned;
684e8feb96fSEmilio G. Cota     /* page-align the end, since its last page will be a guard page */
685e8feb96fSEmilio G. Cota     region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size);
686e8feb96fSEmilio G. Cota     /* account for that last guard page */
687e8feb96fSEmilio G. Cota     region.end -= page_size;
688e8feb96fSEmilio G. Cota 
689e8feb96fSEmilio G. Cota     /* set guard pages */
690e8feb96fSEmilio G. Cota     for (i = 0; i < region.n; i++) {
691e8feb96fSEmilio G. Cota         void *start, *end;
692e8feb96fSEmilio G. Cota         int rc;
693e8feb96fSEmilio G. Cota 
694e8feb96fSEmilio G. Cota         tcg_region_bounds(i, &start, &end);
695e8feb96fSEmilio G. Cota         rc = qemu_mprotect_none(end, page_size);
696e8feb96fSEmilio G. Cota         g_assert(!rc);
697e8feb96fSEmilio G. Cota     }
698e8feb96fSEmilio G. Cota 
699be2cdc5eSEmilio G. Cota     tcg_region_trees_init();
700be2cdc5eSEmilio G. Cota 
7013468b59eSEmilio G. Cota     /* In user-mode we support only one ctx, so do the initial allocation now */
7023468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
703e8feb96fSEmilio G. Cota     {
704e8feb96fSEmilio G. Cota         bool err = tcg_region_initial_alloc__locked(tcg_ctx);
705e8feb96fSEmilio G. Cota 
706e8feb96fSEmilio G. Cota         g_assert(!err);
707e8feb96fSEmilio G. Cota     }
7083468b59eSEmilio G. Cota #endif
709e8feb96fSEmilio G. Cota }
710e8feb96fSEmilio G. Cota 
711e8feb96fSEmilio G. Cota /*
7123468b59eSEmilio G. Cota  * All TCG threads except the parent (i.e. the one that called tcg_context_init
7133468b59eSEmilio G. Cota  * and registered the target's TCG globals) must register with this function
7143468b59eSEmilio G. Cota  * before initiating translation.
7153468b59eSEmilio G. Cota  *
7163468b59eSEmilio G. Cota  * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation
7173468b59eSEmilio G. Cota  * of tcg_region_init() for the reasoning behind this.
7183468b59eSEmilio G. Cota  *
7193468b59eSEmilio G. Cota  * In softmmu each caller registers its context in tcg_ctxs[]. Note that in
7203468b59eSEmilio G. Cota  * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context
7213468b59eSEmilio G. Cota  * is not used anymore for translation once this function is called.
7223468b59eSEmilio G. Cota  *
7233468b59eSEmilio G. Cota  * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates
7243468b59eSEmilio G. Cota  * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode.
7253468b59eSEmilio G. Cota  */
7263468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
7273468b59eSEmilio G. Cota void tcg_register_thread(void)
7283468b59eSEmilio G. Cota {
7293468b59eSEmilio G. Cota     tcg_ctx = &tcg_init_ctx;
7303468b59eSEmilio G. Cota }
7313468b59eSEmilio G. Cota #else
7323468b59eSEmilio G. Cota void tcg_register_thread(void)
7333468b59eSEmilio G. Cota {
7343468b59eSEmilio G. Cota     TCGContext *s = g_malloc(sizeof(*s));
7353468b59eSEmilio G. Cota     unsigned int i, n;
7363468b59eSEmilio G. Cota     bool err;
7373468b59eSEmilio G. Cota 
7383468b59eSEmilio G. Cota     *s = tcg_init_ctx;
7393468b59eSEmilio G. Cota 
7403468b59eSEmilio G. Cota     /* Relink mem_base.  */
7413468b59eSEmilio G. Cota     for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) {
7423468b59eSEmilio G. Cota         if (tcg_init_ctx.temps[i].mem_base) {
7433468b59eSEmilio G. Cota             ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps;
7443468b59eSEmilio G. Cota             tcg_debug_assert(b >= 0 && b < n);
7453468b59eSEmilio G. Cota             s->temps[i].mem_base = &s->temps[b];
7463468b59eSEmilio G. Cota         }
7473468b59eSEmilio G. Cota     }
7483468b59eSEmilio G. Cota 
7493468b59eSEmilio G. Cota     /* Claim an entry in tcg_ctxs */
7503468b59eSEmilio G. Cota     n = atomic_fetch_inc(&n_tcg_ctxs);
7513468b59eSEmilio G. Cota     g_assert(n < max_cpus);
7523468b59eSEmilio G. Cota     atomic_set(&tcg_ctxs[n], s);
7533468b59eSEmilio G. Cota 
7543468b59eSEmilio G. Cota     tcg_ctx = s;
7553468b59eSEmilio G. Cota     qemu_mutex_lock(&region.lock);
7563468b59eSEmilio G. Cota     err = tcg_region_initial_alloc__locked(tcg_ctx);
7573468b59eSEmilio G. Cota     g_assert(!err);
7583468b59eSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
7593468b59eSEmilio G. Cota }
7603468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */
7613468b59eSEmilio G. Cota 
7623468b59eSEmilio G. Cota /*
763e8feb96fSEmilio G. Cota  * Returns the size (in bytes) of all translated code (i.e. from all regions)
764e8feb96fSEmilio G. Cota  * currently in the cache.
765e8feb96fSEmilio G. Cota  * See also: tcg_code_capacity()
766e8feb96fSEmilio G. Cota  * Do not confuse with tcg_current_code_size(); that one applies to a single
767e8feb96fSEmilio G. Cota  * TCG context.
768e8feb96fSEmilio G. Cota  */
769e8feb96fSEmilio G. Cota size_t tcg_code_size(void)
770e8feb96fSEmilio G. Cota {
7713468b59eSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
772e8feb96fSEmilio G. Cota     unsigned int i;
773e8feb96fSEmilio G. Cota     size_t total;
774e8feb96fSEmilio G. Cota 
775e8feb96fSEmilio G. Cota     qemu_mutex_lock(&region.lock);
776e8feb96fSEmilio G. Cota     total = region.agg_size_full;
7773468b59eSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
7783468b59eSEmilio G. Cota         const TCGContext *s = atomic_read(&tcg_ctxs[i]);
779e8feb96fSEmilio G. Cota         size_t size;
780e8feb96fSEmilio G. Cota 
781e8feb96fSEmilio G. Cota         size = atomic_read(&s->code_gen_ptr) - s->code_gen_buffer;
782e8feb96fSEmilio G. Cota         g_assert(size <= s->code_gen_buffer_size);
783e8feb96fSEmilio G. Cota         total += size;
784e8feb96fSEmilio G. Cota     }
785e8feb96fSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
786e8feb96fSEmilio G. Cota     return total;
787e8feb96fSEmilio G. Cota }
788e8feb96fSEmilio G. Cota 
789e8feb96fSEmilio G. Cota /*
790e8feb96fSEmilio G. Cota  * Returns the code capacity (in bytes) of the entire cache, i.e. including all
791e8feb96fSEmilio G. Cota  * regions.
792e8feb96fSEmilio G. Cota  * See also: tcg_code_size()
793e8feb96fSEmilio G. Cota  */
794e8feb96fSEmilio G. Cota size_t tcg_code_capacity(void)
795e8feb96fSEmilio G. Cota {
796e8feb96fSEmilio G. Cota     size_t guard_size, capacity;
797e8feb96fSEmilio G. Cota 
798e8feb96fSEmilio G. Cota     /* no need for synchronization; these variables are set at init time */
799e8feb96fSEmilio G. Cota     guard_size = region.stride - region.size;
800e8feb96fSEmilio G. Cota     capacity = region.end + guard_size - region.start;
801e8feb96fSEmilio G. Cota     capacity -= region.n * (guard_size + TCG_HIGHWATER);
802e8feb96fSEmilio G. Cota     return capacity;
803e8feb96fSEmilio G. Cota }
804e8feb96fSEmilio G. Cota 
805128ed227SEmilio G. Cota size_t tcg_tb_phys_invalidate_count(void)
806128ed227SEmilio G. Cota {
807128ed227SEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
808128ed227SEmilio G. Cota     unsigned int i;
809128ed227SEmilio G. Cota     size_t total = 0;
810128ed227SEmilio G. Cota 
811128ed227SEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
812128ed227SEmilio G. Cota         const TCGContext *s = atomic_read(&tcg_ctxs[i]);
813128ed227SEmilio G. Cota 
814128ed227SEmilio G. Cota         total += atomic_read(&s->tb_phys_invalidate_count);
815128ed227SEmilio G. Cota     }
816128ed227SEmilio G. Cota     return total;
817128ed227SEmilio G. Cota }
818128ed227SEmilio G. Cota 
819c896fe29Sbellard /* pool based memory allocation */
820c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size)
821c896fe29Sbellard {
822c896fe29Sbellard     TCGPool *p;
823c896fe29Sbellard     int pool_size;
824c896fe29Sbellard 
825c896fe29Sbellard     if (size > TCG_POOL_CHUNK_SIZE) {
826c896fe29Sbellard         /* big malloc: insert a new pool (XXX: could optimize) */
8277267c094SAnthony Liguori         p = g_malloc(sizeof(TCGPool) + size);
828c896fe29Sbellard         p->size = size;
8294055299eSKirill Batuzov         p->next = s->pool_first_large;
8304055299eSKirill Batuzov         s->pool_first_large = p;
8314055299eSKirill Batuzov         return p->data;
832c896fe29Sbellard     } else {
833c896fe29Sbellard         p = s->pool_current;
834c896fe29Sbellard         if (!p) {
835c896fe29Sbellard             p = s->pool_first;
836c896fe29Sbellard             if (!p)
837c896fe29Sbellard                 goto new_pool;
838c896fe29Sbellard         } else {
839c896fe29Sbellard             if (!p->next) {
840c896fe29Sbellard             new_pool:
841c896fe29Sbellard                 pool_size = TCG_POOL_CHUNK_SIZE;
8427267c094SAnthony Liguori                 p = g_malloc(sizeof(TCGPool) + pool_size);
843c896fe29Sbellard                 p->size = pool_size;
844c896fe29Sbellard                 p->next = NULL;
845c896fe29Sbellard                 if (s->pool_current)
846c896fe29Sbellard                     s->pool_current->next = p;
847c896fe29Sbellard                 else
848c896fe29Sbellard                     s->pool_first = p;
849c896fe29Sbellard             } else {
850c896fe29Sbellard                 p = p->next;
851c896fe29Sbellard             }
852c896fe29Sbellard         }
853c896fe29Sbellard     }
854c896fe29Sbellard     s->pool_current = p;
855c896fe29Sbellard     s->pool_cur = p->data + size;
856c896fe29Sbellard     s->pool_end = p->data + p->size;
857c896fe29Sbellard     return p->data;
858c896fe29Sbellard }
859c896fe29Sbellard 
860c896fe29Sbellard void tcg_pool_reset(TCGContext *s)
861c896fe29Sbellard {
8624055299eSKirill Batuzov     TCGPool *p, *t;
8634055299eSKirill Batuzov     for (p = s->pool_first_large; p; p = t) {
8644055299eSKirill Batuzov         t = p->next;
8654055299eSKirill Batuzov         g_free(p);
8664055299eSKirill Batuzov     }
8674055299eSKirill Batuzov     s->pool_first_large = NULL;
868c896fe29Sbellard     s->pool_cur = s->pool_end = NULL;
869c896fe29Sbellard     s->pool_current = NULL;
870c896fe29Sbellard }
871c896fe29Sbellard 
/*
 * Description of one TCG helper function; all_helpers[] holds one of these
 * per helper.
 */
typedef struct TCGHelperInfo {
    /* Helper entry point; used as the lookup key in helper_table */
    void *func;
    /* presumably the helper's printable name -- confirm against helper-tcg.h */
    const char *name;
    /* NOTE(review): meaning of flags/sizemask is defined by helper-tcg.h */
    unsigned int flags;
    unsigned int sizemask;
} TCGHelperInfo;
878100b5e01SRichard Henderson 
8792ef6175aSRichard Henderson #include "exec/helper-proto.h"
8802ef6175aSRichard Henderson 
881100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = {
8822ef6175aSRichard Henderson #include "exec/helper-tcg.h"
883100b5e01SRichard Henderson };
884619205fdSEmilio G. Cota static GHashTable *helper_table;
885100b5e01SRichard Henderson 
88691478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)];
887f69d277eSRichard Henderson static void process_op_defs(TCGContext *s);
8881c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type,
8891c2adb95SRichard Henderson                                             TCGReg reg, const char *name);
89091478cefSRichard Henderson 
891c896fe29Sbellard void tcg_context_init(TCGContext *s)
892c896fe29Sbellard {
893100b5e01SRichard Henderson     int op, total_args, n, i;
894c896fe29Sbellard     TCGOpDef *def;
895c896fe29Sbellard     TCGArgConstraint *args_ct;
896c896fe29Sbellard     int *sorted_args;
8971c2adb95SRichard Henderson     TCGTemp *ts;
898c896fe29Sbellard 
899c896fe29Sbellard     memset(s, 0, sizeof(*s));
900c896fe29Sbellard     s->nb_globals = 0;
901c896fe29Sbellard 
902c896fe29Sbellard     /* Count total number of arguments and allocate the corresponding
903c896fe29Sbellard        space */
904c896fe29Sbellard     total_args = 0;
905c896fe29Sbellard     for(op = 0; op < NB_OPS; op++) {
906c896fe29Sbellard         def = &tcg_op_defs[op];
907c896fe29Sbellard         n = def->nb_iargs + def->nb_oargs;
908c896fe29Sbellard         total_args += n;
909c896fe29Sbellard     }
910c896fe29Sbellard 
9117267c094SAnthony Liguori     args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args);
9127267c094SAnthony Liguori     sorted_args = g_malloc(sizeof(int) * total_args);
913c896fe29Sbellard 
914c896fe29Sbellard     for(op = 0; op < NB_OPS; op++) {
915c896fe29Sbellard         def = &tcg_op_defs[op];
916c896fe29Sbellard         def->args_ct = args_ct;
917c896fe29Sbellard         def->sorted_args = sorted_args;
918c896fe29Sbellard         n = def->nb_iargs + def->nb_oargs;
919c896fe29Sbellard         sorted_args += n;
920c896fe29Sbellard         args_ct += n;
921c896fe29Sbellard     }
922c896fe29Sbellard 
9235cd8f621SRichard Henderson     /* Register helpers.  */
92484fd9dd3SRichard Henderson     /* Use g_direct_hash/equal for direct pointer comparisons on func.  */
925619205fdSEmilio G. Cota     helper_table = g_hash_table_new(NULL, NULL);
92684fd9dd3SRichard Henderson 
927100b5e01SRichard Henderson     for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) {
92884fd9dd3SRichard Henderson         g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func,
92972866e82SRichard Henderson                             (gpointer)&all_helpers[i]);
930100b5e01SRichard Henderson     }
9315cd8f621SRichard Henderson 
932c896fe29Sbellard     tcg_target_init(s);
933f69d277eSRichard Henderson     process_op_defs(s);
93491478cefSRichard Henderson 
93591478cefSRichard Henderson     /* Reverse the order of the saved registers, assuming they're all at
93691478cefSRichard Henderson        the start of tcg_target_reg_alloc_order.  */
93791478cefSRichard Henderson     for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) {
93891478cefSRichard Henderson         int r = tcg_target_reg_alloc_order[n];
93991478cefSRichard Henderson         if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) {
94091478cefSRichard Henderson             break;
94191478cefSRichard Henderson         }
94291478cefSRichard Henderson     }
94391478cefSRichard Henderson     for (i = 0; i < n; ++i) {
94491478cefSRichard Henderson         indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i];
94591478cefSRichard Henderson     }
94691478cefSRichard Henderson     for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) {
94791478cefSRichard Henderson         indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i];
94891478cefSRichard Henderson     }
949b1311c4aSEmilio G. Cota 
950b1311c4aSEmilio G. Cota     tcg_ctx = s;
9513468b59eSEmilio G. Cota     /*
9523468b59eSEmilio G. Cota      * In user-mode we simply share the init context among threads, since we
9533468b59eSEmilio G. Cota      * use a single region. See the documentation tcg_region_init() for the
9543468b59eSEmilio G. Cota      * reasoning behind this.
9553468b59eSEmilio G. Cota      * In softmmu we will have at most max_cpus TCG threads.
9563468b59eSEmilio G. Cota      */
9573468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
958df2cce29SEmilio G. Cota     tcg_ctxs = &tcg_ctx;
959df2cce29SEmilio G. Cota     n_tcg_ctxs = 1;
9603468b59eSEmilio G. Cota #else
9613468b59eSEmilio G. Cota     tcg_ctxs = g_new(TCGContext *, max_cpus);
9623468b59eSEmilio G. Cota #endif
9631c2adb95SRichard Henderson 
9641c2adb95SRichard Henderson     tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0));
9651c2adb95SRichard Henderson     ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env");
9661c2adb95SRichard Henderson     cpu_env = temp_tcgv_ptr(ts);
9679002ec79SRichard Henderson }
968b03cce8eSbellard 
9696e3b2bfdSEmilio G. Cota /*
9706e3b2bfdSEmilio G. Cota  * Allocate TBs right before their corresponding translated code, making
9716e3b2bfdSEmilio G. Cota  * sure that TBs and code are on different cache lines.
9726e3b2bfdSEmilio G. Cota  */
9736e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s)
9746e3b2bfdSEmilio G. Cota {
9756e3b2bfdSEmilio G. Cota     uintptr_t align = qemu_icache_linesize;
9766e3b2bfdSEmilio G. Cota     TranslationBlock *tb;
9776e3b2bfdSEmilio G. Cota     void *next;
9786e3b2bfdSEmilio G. Cota 
979e8feb96fSEmilio G. Cota  retry:
9806e3b2bfdSEmilio G. Cota     tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align);
9816e3b2bfdSEmilio G. Cota     next = (void *)ROUND_UP((uintptr_t)(tb + 1), align);
9826e3b2bfdSEmilio G. Cota 
9836e3b2bfdSEmilio G. Cota     if (unlikely(next > s->code_gen_highwater)) {
984e8feb96fSEmilio G. Cota         if (tcg_region_alloc(s)) {
9856e3b2bfdSEmilio G. Cota             return NULL;
9866e3b2bfdSEmilio G. Cota         }
987e8feb96fSEmilio G. Cota         goto retry;
988e8feb96fSEmilio G. Cota     }
989e8feb96fSEmilio G. Cota     atomic_set(&s->code_gen_ptr, next);
99057a26946SRichard Henderson     s->data_gen_ptr = NULL;
9916e3b2bfdSEmilio G. Cota     return tb;
9926e3b2bfdSEmilio G. Cota }
9936e3b2bfdSEmilio G. Cota 
9949002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s)
9959002ec79SRichard Henderson {
9968163b749SRichard Henderson     size_t prologue_size, total_size;
9978163b749SRichard Henderson     void *buf0, *buf1;
9988163b749SRichard Henderson 
9998163b749SRichard Henderson     /* Put the prologue at the beginning of code_gen_buffer.  */
10008163b749SRichard Henderson     buf0 = s->code_gen_buffer;
10015b38ee31SRichard Henderson     total_size = s->code_gen_buffer_size;
10028163b749SRichard Henderson     s->code_ptr = buf0;
10038163b749SRichard Henderson     s->code_buf = buf0;
10045b38ee31SRichard Henderson     s->data_gen_ptr = NULL;
10058163b749SRichard Henderson     s->code_gen_prologue = buf0;
10068163b749SRichard Henderson 
10075b38ee31SRichard Henderson     /* Compute a high-water mark, at which we voluntarily flush the buffer
10085b38ee31SRichard Henderson        and start over.  The size here is arbitrary, significantly larger
10095b38ee31SRichard Henderson        than we expect the code generation for any one opcode to require.  */
10105b38ee31SRichard Henderson     s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER);
10115b38ee31SRichard Henderson 
10125b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
10135b38ee31SRichard Henderson     s->pool_labels = NULL;
10145b38ee31SRichard Henderson #endif
10155b38ee31SRichard Henderson 
10168163b749SRichard Henderson     /* Generate the prologue.  */
1017b03cce8eSbellard     tcg_target_qemu_prologue(s);
10185b38ee31SRichard Henderson 
10195b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
10205b38ee31SRichard Henderson     /* Allow the prologue to put e.g. guest_base into a pool entry.  */
10215b38ee31SRichard Henderson     {
10225b38ee31SRichard Henderson         bool ok = tcg_out_pool_finalize(s);
10235b38ee31SRichard Henderson         tcg_debug_assert(ok);
10245b38ee31SRichard Henderson     }
10255b38ee31SRichard Henderson #endif
10265b38ee31SRichard Henderson 
10278163b749SRichard Henderson     buf1 = s->code_ptr;
10288163b749SRichard Henderson     flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1);
10298163b749SRichard Henderson 
10308163b749SRichard Henderson     /* Deduct the prologue from the buffer.  */
10318163b749SRichard Henderson     prologue_size = tcg_current_code_size(s);
10328163b749SRichard Henderson     s->code_gen_ptr = buf1;
10338163b749SRichard Henderson     s->code_gen_buffer = buf1;
10348163b749SRichard Henderson     s->code_buf = buf1;
10355b38ee31SRichard Henderson     total_size -= prologue_size;
10368163b749SRichard Henderson     s->code_gen_buffer_size = total_size;
10378163b749SRichard Henderson 
10388163b749SRichard Henderson     tcg_register_jit(s->code_gen_buffer, total_size);
1039d6b64b2bSRichard Henderson 
1040d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS
1041d6b64b2bSRichard Henderson     if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) {
10421ee73216SRichard Henderson         qemu_log_lock();
10438163b749SRichard Henderson         qemu_log("PROLOGUE: [size=%zu]\n", prologue_size);
10445b38ee31SRichard Henderson         if (s->data_gen_ptr) {
10455b38ee31SRichard Henderson             size_t code_size = s->data_gen_ptr - buf0;
10465b38ee31SRichard Henderson             size_t data_size = prologue_size - code_size;
10475b38ee31SRichard Henderson             size_t i;
10485b38ee31SRichard Henderson 
10495b38ee31SRichard Henderson             log_disas(buf0, code_size);
10505b38ee31SRichard Henderson 
10515b38ee31SRichard Henderson             for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) {
10525b38ee31SRichard Henderson                 if (sizeof(tcg_target_ulong) == 8) {
10535b38ee31SRichard Henderson                     qemu_log("0x%08" PRIxPTR ":  .quad  0x%016" PRIx64 "\n",
10545b38ee31SRichard Henderson                              (uintptr_t)s->data_gen_ptr + i,
10555b38ee31SRichard Henderson                              *(uint64_t *)(s->data_gen_ptr + i));
10565b38ee31SRichard Henderson                 } else {
10575b38ee31SRichard Henderson                     qemu_log("0x%08" PRIxPTR ":  .long  0x%08x\n",
10585b38ee31SRichard Henderson                              (uintptr_t)s->data_gen_ptr + i,
10595b38ee31SRichard Henderson                              *(uint32_t *)(s->data_gen_ptr + i));
10605b38ee31SRichard Henderson                 }
10615b38ee31SRichard Henderson             }
10625b38ee31SRichard Henderson         } else {
10638163b749SRichard Henderson             log_disas(buf0, prologue_size);
10645b38ee31SRichard Henderson         }
1065d6b64b2bSRichard Henderson         qemu_log("\n");
1066d6b64b2bSRichard Henderson         qemu_log_flush();
10671ee73216SRichard Henderson         qemu_log_unlock();
1068d6b64b2bSRichard Henderson     }
1069d6b64b2bSRichard Henderson #endif
1070cedbcb01SEmilio G. Cota 
1071cedbcb01SEmilio G. Cota     /* Assert that goto_ptr is implemented completely.  */
1072cedbcb01SEmilio G. Cota     if (TCG_TARGET_HAS_goto_ptr) {
1073cedbcb01SEmilio G. Cota         tcg_debug_assert(s->code_gen_epilogue != NULL);
1074cedbcb01SEmilio G. Cota     }
1075c896fe29Sbellard }
1076c896fe29Sbellard 
1077c896fe29Sbellard void tcg_func_start(TCGContext *s)
1078c896fe29Sbellard {
1079c896fe29Sbellard     tcg_pool_reset(s);
1080c896fe29Sbellard     s->nb_temps = s->nb_globals;
10810ec9eabcSRichard Henderson 
10820ec9eabcSRichard Henderson     /* No temps have been previously allocated for size or locality.  */
10830ec9eabcSRichard Henderson     memset(s->free_temps, 0, sizeof(s->free_temps));
10840ec9eabcSRichard Henderson 
1085abebf925SRichard Henderson     s->nb_ops = 0;
1086c896fe29Sbellard     s->nb_labels = 0;
1087c896fe29Sbellard     s->current_frame_offset = s->frame_start;
1088c896fe29Sbellard 
10890a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG
10900a209d4bSRichard Henderson     s->goto_tb_issue_mask = 0;
10910a209d4bSRichard Henderson #endif
10920a209d4bSRichard Henderson 
109315fa08f8SRichard Henderson     QTAILQ_INIT(&s->ops);
109415fa08f8SRichard Henderson     QTAILQ_INIT(&s->free_ops);
1095c896fe29Sbellard }
1096c896fe29Sbellard 
10977ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s)
10987ca4b752SRichard Henderson {
10997ca4b752SRichard Henderson     int n = s->nb_temps++;
11007ca4b752SRichard Henderson     tcg_debug_assert(n < TCG_MAX_TEMPS);
11017ca4b752SRichard Henderson     return memset(&s->temps[n], 0, sizeof(TCGTemp));
11027ca4b752SRichard Henderson }
11037ca4b752SRichard Henderson 
11047ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s)
11057ca4b752SRichard Henderson {
1106fa477d25SRichard Henderson     TCGTemp *ts;
1107fa477d25SRichard Henderson 
11087ca4b752SRichard Henderson     tcg_debug_assert(s->nb_globals == s->nb_temps);
11097ca4b752SRichard Henderson     s->nb_globals++;
1110fa477d25SRichard Henderson     ts = tcg_temp_alloc(s);
1111fa477d25SRichard Henderson     ts->temp_global = 1;
1112fa477d25SRichard Henderson 
1113fa477d25SRichard Henderson     return ts;
1114c896fe29Sbellard }
1115c896fe29Sbellard 
1116085272b3SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type,
1117b6638662SRichard Henderson                                             TCGReg reg, const char *name)
1118c896fe29Sbellard {
1119c896fe29Sbellard     TCGTemp *ts;
1120c896fe29Sbellard 
1121b3a62939SRichard Henderson     if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) {
1122c896fe29Sbellard         tcg_abort();
1123b3a62939SRichard Henderson     }
11247ca4b752SRichard Henderson 
11257ca4b752SRichard Henderson     ts = tcg_global_alloc(s);
1126c896fe29Sbellard     ts->base_type = type;
1127c896fe29Sbellard     ts->type = type;
1128c896fe29Sbellard     ts->fixed_reg = 1;
1129c896fe29Sbellard     ts->reg = reg;
1130c896fe29Sbellard     ts->name = name;
1131c896fe29Sbellard     tcg_regset_set_reg(s->reserved_regs, reg);
11327ca4b752SRichard Henderson 
1133085272b3SRichard Henderson     return ts;
1134a7812ae4Spbrook }
1135a7812ae4Spbrook 
1136b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size)
1137a7812ae4Spbrook {
1138b3a62939SRichard Henderson     s->frame_start = start;
1139b3a62939SRichard Henderson     s->frame_end = start + size;
1140085272b3SRichard Henderson     s->frame_temp
1141085272b3SRichard Henderson         = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame");
1142b3a62939SRichard Henderson }
1143a7812ae4Spbrook 
1144085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base,
1145e1ccc054SRichard Henderson                                      intptr_t offset, const char *name)
1146c896fe29Sbellard {
1147b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
1148dc41aa7dSRichard Henderson     TCGTemp *base_ts = tcgv_ptr_temp(base);
11497ca4b752SRichard Henderson     TCGTemp *ts = tcg_global_alloc(s);
1150b3915dbbSRichard Henderson     int indirect_reg = 0, bigendian = 0;
11517ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN
11527ca4b752SRichard Henderson     bigendian = 1;
11537ca4b752SRichard Henderson #endif
1154c896fe29Sbellard 
1155b3915dbbSRichard Henderson     if (!base_ts->fixed_reg) {
11565a18407fSRichard Henderson         /* We do not support double-indirect registers.  */
11575a18407fSRichard Henderson         tcg_debug_assert(!base_ts->indirect_reg);
1158b3915dbbSRichard Henderson         base_ts->indirect_base = 1;
11595a18407fSRichard Henderson         s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64
11605a18407fSRichard Henderson                             ? 2 : 1);
11615a18407fSRichard Henderson         indirect_reg = 1;
1162b3915dbbSRichard Henderson     }
1163b3915dbbSRichard Henderson 
11647ca4b752SRichard Henderson     if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) {
11657ca4b752SRichard Henderson         TCGTemp *ts2 = tcg_global_alloc(s);
1166c896fe29Sbellard         char buf[64];
11677ca4b752SRichard Henderson 
11687ca4b752SRichard Henderson         ts->base_type = TCG_TYPE_I64;
1169c896fe29Sbellard         ts->type = TCG_TYPE_I32;
1170b3915dbbSRichard Henderson         ts->indirect_reg = indirect_reg;
1171c896fe29Sbellard         ts->mem_allocated = 1;
1172b3a62939SRichard Henderson         ts->mem_base = base_ts;
11737ca4b752SRichard Henderson         ts->mem_offset = offset + bigendian * 4;
1174c896fe29Sbellard         pstrcpy(buf, sizeof(buf), name);
1175c896fe29Sbellard         pstrcat(buf, sizeof(buf), "_0");
1176c896fe29Sbellard         ts->name = strdup(buf);
1177c896fe29Sbellard 
11787ca4b752SRichard Henderson         tcg_debug_assert(ts2 == ts + 1);
11797ca4b752SRichard Henderson         ts2->base_type = TCG_TYPE_I64;
11807ca4b752SRichard Henderson         ts2->type = TCG_TYPE_I32;
1181b3915dbbSRichard Henderson         ts2->indirect_reg = indirect_reg;
11827ca4b752SRichard Henderson         ts2->mem_allocated = 1;
11837ca4b752SRichard Henderson         ts2->mem_base = base_ts;
11847ca4b752SRichard Henderson         ts2->mem_offset = offset + (1 - bigendian) * 4;
1185c896fe29Sbellard         pstrcpy(buf, sizeof(buf), name);
1186c896fe29Sbellard         pstrcat(buf, sizeof(buf), "_1");
1187120c1084SRichard Henderson         ts2->name = strdup(buf);
11887ca4b752SRichard Henderson     } else {
1189c896fe29Sbellard         ts->base_type = type;
1190c896fe29Sbellard         ts->type = type;
1191b3915dbbSRichard Henderson         ts->indirect_reg = indirect_reg;
1192c896fe29Sbellard         ts->mem_allocated = 1;
1193b3a62939SRichard Henderson         ts->mem_base = base_ts;
1194c896fe29Sbellard         ts->mem_offset = offset;
1195c896fe29Sbellard         ts->name = name;
1196c896fe29Sbellard     }
1197085272b3SRichard Henderson     return ts;
1198c896fe29Sbellard }
1199c896fe29Sbellard 
12005bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local)
1201c896fe29Sbellard {
1202b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
1203c896fe29Sbellard     TCGTemp *ts;
1204641d5fbeSbellard     int idx, k;
1205c896fe29Sbellard 
12060ec9eabcSRichard Henderson     k = type + (temp_local ? TCG_TYPE_COUNT : 0);
12070ec9eabcSRichard Henderson     idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS);
12080ec9eabcSRichard Henderson     if (idx < TCG_MAX_TEMPS) {
12090ec9eabcSRichard Henderson         /* There is already an available temp with the right type.  */
12100ec9eabcSRichard Henderson         clear_bit(idx, s->free_temps[k].l);
12110ec9eabcSRichard Henderson 
1212e8996ee0Sbellard         ts = &s->temps[idx];
1213e8996ee0Sbellard         ts->temp_allocated = 1;
12147ca4b752SRichard Henderson         tcg_debug_assert(ts->base_type == type);
12157ca4b752SRichard Henderson         tcg_debug_assert(ts->temp_local == temp_local);
1216e8996ee0Sbellard     } else {
12177ca4b752SRichard Henderson         ts = tcg_temp_alloc(s);
12187ca4b752SRichard Henderson         if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) {
12197ca4b752SRichard Henderson             TCGTemp *ts2 = tcg_temp_alloc(s);
12207ca4b752SRichard Henderson 
1221c896fe29Sbellard             ts->base_type = type;
1222c896fe29Sbellard             ts->type = TCG_TYPE_I32;
1223e8996ee0Sbellard             ts->temp_allocated = 1;
1224641d5fbeSbellard             ts->temp_local = temp_local;
12257ca4b752SRichard Henderson 
12267ca4b752SRichard Henderson             tcg_debug_assert(ts2 == ts + 1);
12277ca4b752SRichard Henderson             ts2->base_type = TCG_TYPE_I64;
12287ca4b752SRichard Henderson             ts2->type = TCG_TYPE_I32;
12297ca4b752SRichard Henderson             ts2->temp_allocated = 1;
12307ca4b752SRichard Henderson             ts2->temp_local = temp_local;
12317ca4b752SRichard Henderson         } else {
1232c896fe29Sbellard             ts->base_type = type;
1233c896fe29Sbellard             ts->type = type;
1234e8996ee0Sbellard             ts->temp_allocated = 1;
1235641d5fbeSbellard             ts->temp_local = temp_local;
1236c896fe29Sbellard         }
1237e8996ee0Sbellard     }
123827bfd83cSPeter Maydell 
123927bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG)
124027bfd83cSPeter Maydell     s->temps_in_use++;
124127bfd83cSPeter Maydell #endif
1242085272b3SRichard Henderson     return ts;
1243c896fe29Sbellard }
1244c896fe29Sbellard 
1245d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type)
1246d2fd745fSRichard Henderson {
1247d2fd745fSRichard Henderson     TCGTemp *t;
1248d2fd745fSRichard Henderson 
1249d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG
1250d2fd745fSRichard Henderson     switch (type) {
1251d2fd745fSRichard Henderson     case TCG_TYPE_V64:
1252d2fd745fSRichard Henderson         assert(TCG_TARGET_HAS_v64);
1253d2fd745fSRichard Henderson         break;
1254d2fd745fSRichard Henderson     case TCG_TYPE_V128:
1255d2fd745fSRichard Henderson         assert(TCG_TARGET_HAS_v128);
1256d2fd745fSRichard Henderson         break;
1257d2fd745fSRichard Henderson     case TCG_TYPE_V256:
1258d2fd745fSRichard Henderson         assert(TCG_TARGET_HAS_v256);
1259d2fd745fSRichard Henderson         break;
1260d2fd745fSRichard Henderson     default:
1261d2fd745fSRichard Henderson         g_assert_not_reached();
1262d2fd745fSRichard Henderson     }
1263d2fd745fSRichard Henderson #endif
1264d2fd745fSRichard Henderson 
1265d2fd745fSRichard Henderson     t = tcg_temp_new_internal(type, 0);
1266d2fd745fSRichard Henderson     return temp_tcgv_vec(t);
1267d2fd745fSRichard Henderson }
1268d2fd745fSRichard Henderson 
1269d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp.  */
1270d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match)
1271d2fd745fSRichard Henderson {
1272d2fd745fSRichard Henderson     TCGTemp *t = tcgv_vec_temp(match);
1273d2fd745fSRichard Henderson 
1274d2fd745fSRichard Henderson     tcg_debug_assert(t->temp_allocated != 0);
1275d2fd745fSRichard Henderson 
1276d2fd745fSRichard Henderson     t = tcg_temp_new_internal(t->base_type, 0);
1277d2fd745fSRichard Henderson     return temp_tcgv_vec(t);
1278d2fd745fSRichard Henderson }
1279d2fd745fSRichard Henderson 
12805bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts)
1281c896fe29Sbellard {
1282b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
1283085272b3SRichard Henderson     int k, idx;
1284c896fe29Sbellard 
128527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG)
128627bfd83cSPeter Maydell     s->temps_in_use--;
128727bfd83cSPeter Maydell     if (s->temps_in_use < 0) {
128827bfd83cSPeter Maydell         fprintf(stderr, "More temporaries freed than allocated!\n");
128927bfd83cSPeter Maydell     }
129027bfd83cSPeter Maydell #endif
129127bfd83cSPeter Maydell 
1292085272b3SRichard Henderson     tcg_debug_assert(ts->temp_global == 0);
1293eabb7b91SAurelien Jarno     tcg_debug_assert(ts->temp_allocated != 0);
1294e8996ee0Sbellard     ts->temp_allocated = 0;
12950ec9eabcSRichard Henderson 
1296085272b3SRichard Henderson     idx = temp_idx(ts);
129718d13fa2SAlexander Graf     k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0);
12980ec9eabcSRichard Henderson     set_bit(idx, s->free_temps[k].l);
1299e8996ee0Sbellard }
1300e8996ee0Sbellard 
1301a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val)
1302a7812ae4Spbrook {
1303a7812ae4Spbrook     TCGv_i32 t0;
1304a7812ae4Spbrook     t0 = tcg_temp_new_i32();
1305e8996ee0Sbellard     tcg_gen_movi_i32(t0, val);
1306e8996ee0Sbellard     return t0;
1307c896fe29Sbellard }
1308c896fe29Sbellard 
1309a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val)
1310c896fe29Sbellard {
1311a7812ae4Spbrook     TCGv_i64 t0;
1312a7812ae4Spbrook     t0 = tcg_temp_new_i64();
1313e8996ee0Sbellard     tcg_gen_movi_i64(t0, val);
1314e8996ee0Sbellard     return t0;
1315c896fe29Sbellard }
1316c896fe29Sbellard 
1317a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val)
1318bdffd4a9Saurel32 {
1319a7812ae4Spbrook     TCGv_i32 t0;
1320a7812ae4Spbrook     t0 = tcg_temp_local_new_i32();
1321bdffd4a9Saurel32     tcg_gen_movi_i32(t0, val);
1322bdffd4a9Saurel32     return t0;
1323bdffd4a9Saurel32 }
1324bdffd4a9Saurel32 
1325a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val)
1326bdffd4a9Saurel32 {
1327a7812ae4Spbrook     TCGv_i64 t0;
1328a7812ae4Spbrook     t0 = tcg_temp_local_new_i64();
1329bdffd4a9Saurel32     tcg_gen_movi_i64(t0, val);
1330bdffd4a9Saurel32     return t0;
1331bdffd4a9Saurel32 }
1332bdffd4a9Saurel32 
133327bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG)
133427bfd83cSPeter Maydell void tcg_clear_temp_count(void)
133527bfd83cSPeter Maydell {
1336b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
133727bfd83cSPeter Maydell     s->temps_in_use = 0;
133827bfd83cSPeter Maydell }
133927bfd83cSPeter Maydell 
134027bfd83cSPeter Maydell int tcg_check_temp_count(void)
134127bfd83cSPeter Maydell {
1342b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
134327bfd83cSPeter Maydell     if (s->temps_in_use) {
134427bfd83cSPeter Maydell         /* Clear the count so that we don't give another
134527bfd83cSPeter Maydell          * warning immediately next time around.
134627bfd83cSPeter Maydell          */
134727bfd83cSPeter Maydell         s->temps_in_use = 0;
134827bfd83cSPeter Maydell         return 1;
134927bfd83cSPeter Maydell     }
135027bfd83cSPeter Maydell     return 0;
135127bfd83cSPeter Maydell }
135227bfd83cSPeter Maydell #endif
135327bfd83cSPeter Maydell 
1354be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream.
1355be0f34b5SRichard Henderson    Test the runtime variable that controls each opcode.  */
1356be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op)
1357be0f34b5SRichard Henderson {
1358d2fd745fSRichard Henderson     const bool have_vec
1359d2fd745fSRichard Henderson         = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256;
1360d2fd745fSRichard Henderson 
1361be0f34b5SRichard Henderson     switch (op) {
1362be0f34b5SRichard Henderson     case INDEX_op_discard:
1363be0f34b5SRichard Henderson     case INDEX_op_set_label:
1364be0f34b5SRichard Henderson     case INDEX_op_call:
1365be0f34b5SRichard Henderson     case INDEX_op_br:
1366be0f34b5SRichard Henderson     case INDEX_op_mb:
1367be0f34b5SRichard Henderson     case INDEX_op_insn_start:
1368be0f34b5SRichard Henderson     case INDEX_op_exit_tb:
1369be0f34b5SRichard Henderson     case INDEX_op_goto_tb:
1370be0f34b5SRichard Henderson     case INDEX_op_qemu_ld_i32:
1371be0f34b5SRichard Henderson     case INDEX_op_qemu_st_i32:
1372be0f34b5SRichard Henderson     case INDEX_op_qemu_ld_i64:
1373be0f34b5SRichard Henderson     case INDEX_op_qemu_st_i64:
1374be0f34b5SRichard Henderson         return true;
1375be0f34b5SRichard Henderson 
1376be0f34b5SRichard Henderson     case INDEX_op_goto_ptr:
1377be0f34b5SRichard Henderson         return TCG_TARGET_HAS_goto_ptr;
1378be0f34b5SRichard Henderson 
1379be0f34b5SRichard Henderson     case INDEX_op_mov_i32:
1380be0f34b5SRichard Henderson     case INDEX_op_movi_i32:
1381be0f34b5SRichard Henderson     case INDEX_op_setcond_i32:
1382be0f34b5SRichard Henderson     case INDEX_op_brcond_i32:
1383be0f34b5SRichard Henderson     case INDEX_op_ld8u_i32:
1384be0f34b5SRichard Henderson     case INDEX_op_ld8s_i32:
1385be0f34b5SRichard Henderson     case INDEX_op_ld16u_i32:
1386be0f34b5SRichard Henderson     case INDEX_op_ld16s_i32:
1387be0f34b5SRichard Henderson     case INDEX_op_ld_i32:
1388be0f34b5SRichard Henderson     case INDEX_op_st8_i32:
1389be0f34b5SRichard Henderson     case INDEX_op_st16_i32:
1390be0f34b5SRichard Henderson     case INDEX_op_st_i32:
1391be0f34b5SRichard Henderson     case INDEX_op_add_i32:
1392be0f34b5SRichard Henderson     case INDEX_op_sub_i32:
1393be0f34b5SRichard Henderson     case INDEX_op_mul_i32:
1394be0f34b5SRichard Henderson     case INDEX_op_and_i32:
1395be0f34b5SRichard Henderson     case INDEX_op_or_i32:
1396be0f34b5SRichard Henderson     case INDEX_op_xor_i32:
1397be0f34b5SRichard Henderson     case INDEX_op_shl_i32:
1398be0f34b5SRichard Henderson     case INDEX_op_shr_i32:
1399be0f34b5SRichard Henderson     case INDEX_op_sar_i32:
1400be0f34b5SRichard Henderson         return true;
1401be0f34b5SRichard Henderson 
1402be0f34b5SRichard Henderson     case INDEX_op_movcond_i32:
1403be0f34b5SRichard Henderson         return TCG_TARGET_HAS_movcond_i32;
1404be0f34b5SRichard Henderson     case INDEX_op_div_i32:
1405be0f34b5SRichard Henderson     case INDEX_op_divu_i32:
1406be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div_i32;
1407be0f34b5SRichard Henderson     case INDEX_op_rem_i32:
1408be0f34b5SRichard Henderson     case INDEX_op_remu_i32:
1409be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rem_i32;
1410be0f34b5SRichard Henderson     case INDEX_op_div2_i32:
1411be0f34b5SRichard Henderson     case INDEX_op_divu2_i32:
1412be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div2_i32;
1413be0f34b5SRichard Henderson     case INDEX_op_rotl_i32:
1414be0f34b5SRichard Henderson     case INDEX_op_rotr_i32:
1415be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rot_i32;
1416be0f34b5SRichard Henderson     case INDEX_op_deposit_i32:
1417be0f34b5SRichard Henderson         return TCG_TARGET_HAS_deposit_i32;
1418be0f34b5SRichard Henderson     case INDEX_op_extract_i32:
1419be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extract_i32;
1420be0f34b5SRichard Henderson     case INDEX_op_sextract_i32:
1421be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sextract_i32;
1422be0f34b5SRichard Henderson     case INDEX_op_add2_i32:
1423be0f34b5SRichard Henderson         return TCG_TARGET_HAS_add2_i32;
1424be0f34b5SRichard Henderson     case INDEX_op_sub2_i32:
1425be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sub2_i32;
1426be0f34b5SRichard Henderson     case INDEX_op_mulu2_i32:
1427be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulu2_i32;
1428be0f34b5SRichard Henderson     case INDEX_op_muls2_i32:
1429be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muls2_i32;
1430be0f34b5SRichard Henderson     case INDEX_op_muluh_i32:
1431be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muluh_i32;
1432be0f34b5SRichard Henderson     case INDEX_op_mulsh_i32:
1433be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulsh_i32;
1434be0f34b5SRichard Henderson     case INDEX_op_ext8s_i32:
1435be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8s_i32;
1436be0f34b5SRichard Henderson     case INDEX_op_ext16s_i32:
1437be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16s_i32;
1438be0f34b5SRichard Henderson     case INDEX_op_ext8u_i32:
1439be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8u_i32;
1440be0f34b5SRichard Henderson     case INDEX_op_ext16u_i32:
1441be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16u_i32;
1442be0f34b5SRichard Henderson     case INDEX_op_bswap16_i32:
1443be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap16_i32;
1444be0f34b5SRichard Henderson     case INDEX_op_bswap32_i32:
1445be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap32_i32;
1446be0f34b5SRichard Henderson     case INDEX_op_not_i32:
1447be0f34b5SRichard Henderson         return TCG_TARGET_HAS_not_i32;
1448be0f34b5SRichard Henderson     case INDEX_op_neg_i32:
1449be0f34b5SRichard Henderson         return TCG_TARGET_HAS_neg_i32;
1450be0f34b5SRichard Henderson     case INDEX_op_andc_i32:
1451be0f34b5SRichard Henderson         return TCG_TARGET_HAS_andc_i32;
1452be0f34b5SRichard Henderson     case INDEX_op_orc_i32:
1453be0f34b5SRichard Henderson         return TCG_TARGET_HAS_orc_i32;
1454be0f34b5SRichard Henderson     case INDEX_op_eqv_i32:
1455be0f34b5SRichard Henderson         return TCG_TARGET_HAS_eqv_i32;
1456be0f34b5SRichard Henderson     case INDEX_op_nand_i32:
1457be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nand_i32;
1458be0f34b5SRichard Henderson     case INDEX_op_nor_i32:
1459be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nor_i32;
1460be0f34b5SRichard Henderson     case INDEX_op_clz_i32:
1461be0f34b5SRichard Henderson         return TCG_TARGET_HAS_clz_i32;
1462be0f34b5SRichard Henderson     case INDEX_op_ctz_i32:
1463be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctz_i32;
1464be0f34b5SRichard Henderson     case INDEX_op_ctpop_i32:
1465be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctpop_i32;
1466be0f34b5SRichard Henderson 
1467be0f34b5SRichard Henderson     case INDEX_op_brcond2_i32:
1468be0f34b5SRichard Henderson     case INDEX_op_setcond2_i32:
1469be0f34b5SRichard Henderson         return TCG_TARGET_REG_BITS == 32;
1470be0f34b5SRichard Henderson 
1471be0f34b5SRichard Henderson     case INDEX_op_mov_i64:
1472be0f34b5SRichard Henderson     case INDEX_op_movi_i64:
1473be0f34b5SRichard Henderson     case INDEX_op_setcond_i64:
1474be0f34b5SRichard Henderson     case INDEX_op_brcond_i64:
1475be0f34b5SRichard Henderson     case INDEX_op_ld8u_i64:
1476be0f34b5SRichard Henderson     case INDEX_op_ld8s_i64:
1477be0f34b5SRichard Henderson     case INDEX_op_ld16u_i64:
1478be0f34b5SRichard Henderson     case INDEX_op_ld16s_i64:
1479be0f34b5SRichard Henderson     case INDEX_op_ld32u_i64:
1480be0f34b5SRichard Henderson     case INDEX_op_ld32s_i64:
1481be0f34b5SRichard Henderson     case INDEX_op_ld_i64:
1482be0f34b5SRichard Henderson     case INDEX_op_st8_i64:
1483be0f34b5SRichard Henderson     case INDEX_op_st16_i64:
1484be0f34b5SRichard Henderson     case INDEX_op_st32_i64:
1485be0f34b5SRichard Henderson     case INDEX_op_st_i64:
1486be0f34b5SRichard Henderson     case INDEX_op_add_i64:
1487be0f34b5SRichard Henderson     case INDEX_op_sub_i64:
1488be0f34b5SRichard Henderson     case INDEX_op_mul_i64:
1489be0f34b5SRichard Henderson     case INDEX_op_and_i64:
1490be0f34b5SRichard Henderson     case INDEX_op_or_i64:
1491be0f34b5SRichard Henderson     case INDEX_op_xor_i64:
1492be0f34b5SRichard Henderson     case INDEX_op_shl_i64:
1493be0f34b5SRichard Henderson     case INDEX_op_shr_i64:
1494be0f34b5SRichard Henderson     case INDEX_op_sar_i64:
1495be0f34b5SRichard Henderson     case INDEX_op_ext_i32_i64:
1496be0f34b5SRichard Henderson     case INDEX_op_extu_i32_i64:
1497be0f34b5SRichard Henderson         return TCG_TARGET_REG_BITS == 64;
1498be0f34b5SRichard Henderson 
1499be0f34b5SRichard Henderson     case INDEX_op_movcond_i64:
1500be0f34b5SRichard Henderson         return TCG_TARGET_HAS_movcond_i64;
1501be0f34b5SRichard Henderson     case INDEX_op_div_i64:
1502be0f34b5SRichard Henderson     case INDEX_op_divu_i64:
1503be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div_i64;
1504be0f34b5SRichard Henderson     case INDEX_op_rem_i64:
1505be0f34b5SRichard Henderson     case INDEX_op_remu_i64:
1506be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rem_i64;
1507be0f34b5SRichard Henderson     case INDEX_op_div2_i64:
1508be0f34b5SRichard Henderson     case INDEX_op_divu2_i64:
1509be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div2_i64;
1510be0f34b5SRichard Henderson     case INDEX_op_rotl_i64:
1511be0f34b5SRichard Henderson     case INDEX_op_rotr_i64:
1512be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rot_i64;
1513be0f34b5SRichard Henderson     case INDEX_op_deposit_i64:
1514be0f34b5SRichard Henderson         return TCG_TARGET_HAS_deposit_i64;
1515be0f34b5SRichard Henderson     case INDEX_op_extract_i64:
1516be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extract_i64;
1517be0f34b5SRichard Henderson     case INDEX_op_sextract_i64:
1518be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sextract_i64;
1519be0f34b5SRichard Henderson     case INDEX_op_extrl_i64_i32:
1520be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extrl_i64_i32;
1521be0f34b5SRichard Henderson     case INDEX_op_extrh_i64_i32:
1522be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extrh_i64_i32;
1523be0f34b5SRichard Henderson     case INDEX_op_ext8s_i64:
1524be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8s_i64;
1525be0f34b5SRichard Henderson     case INDEX_op_ext16s_i64:
1526be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16s_i64;
1527be0f34b5SRichard Henderson     case INDEX_op_ext32s_i64:
1528be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext32s_i64;
1529be0f34b5SRichard Henderson     case INDEX_op_ext8u_i64:
1530be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8u_i64;
1531be0f34b5SRichard Henderson     case INDEX_op_ext16u_i64:
1532be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16u_i64;
1533be0f34b5SRichard Henderson     case INDEX_op_ext32u_i64:
1534be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext32u_i64;
1535be0f34b5SRichard Henderson     case INDEX_op_bswap16_i64:
1536be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap16_i64;
1537be0f34b5SRichard Henderson     case INDEX_op_bswap32_i64:
1538be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap32_i64;
1539be0f34b5SRichard Henderson     case INDEX_op_bswap64_i64:
1540be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap64_i64;
1541be0f34b5SRichard Henderson     case INDEX_op_not_i64:
1542be0f34b5SRichard Henderson         return TCG_TARGET_HAS_not_i64;
1543be0f34b5SRichard Henderson     case INDEX_op_neg_i64:
1544be0f34b5SRichard Henderson         return TCG_TARGET_HAS_neg_i64;
1545be0f34b5SRichard Henderson     case INDEX_op_andc_i64:
1546be0f34b5SRichard Henderson         return TCG_TARGET_HAS_andc_i64;
1547be0f34b5SRichard Henderson     case INDEX_op_orc_i64:
1548be0f34b5SRichard Henderson         return TCG_TARGET_HAS_orc_i64;
1549be0f34b5SRichard Henderson     case INDEX_op_eqv_i64:
1550be0f34b5SRichard Henderson         return TCG_TARGET_HAS_eqv_i64;
1551be0f34b5SRichard Henderson     case INDEX_op_nand_i64:
1552be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nand_i64;
1553be0f34b5SRichard Henderson     case INDEX_op_nor_i64:
1554be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nor_i64;
1555be0f34b5SRichard Henderson     case INDEX_op_clz_i64:
1556be0f34b5SRichard Henderson         return TCG_TARGET_HAS_clz_i64;
1557be0f34b5SRichard Henderson     case INDEX_op_ctz_i64:
1558be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctz_i64;
1559be0f34b5SRichard Henderson     case INDEX_op_ctpop_i64:
1560be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctpop_i64;
1561be0f34b5SRichard Henderson     case INDEX_op_add2_i64:
1562be0f34b5SRichard Henderson         return TCG_TARGET_HAS_add2_i64;
1563be0f34b5SRichard Henderson     case INDEX_op_sub2_i64:
1564be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sub2_i64;
1565be0f34b5SRichard Henderson     case INDEX_op_mulu2_i64:
1566be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulu2_i64;
1567be0f34b5SRichard Henderson     case INDEX_op_muls2_i64:
1568be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muls2_i64;
1569be0f34b5SRichard Henderson     case INDEX_op_muluh_i64:
1570be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muluh_i64;
1571be0f34b5SRichard Henderson     case INDEX_op_mulsh_i64:
1572be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulsh_i64;
1573be0f34b5SRichard Henderson 
1574d2fd745fSRichard Henderson     case INDEX_op_mov_vec:
1575d2fd745fSRichard Henderson     case INDEX_op_dup_vec:
1576d2fd745fSRichard Henderson     case INDEX_op_dupi_vec:
1577d2fd745fSRichard Henderson     case INDEX_op_ld_vec:
1578d2fd745fSRichard Henderson     case INDEX_op_st_vec:
1579d2fd745fSRichard Henderson     case INDEX_op_add_vec:
1580d2fd745fSRichard Henderson     case INDEX_op_sub_vec:
1581d2fd745fSRichard Henderson     case INDEX_op_and_vec:
1582d2fd745fSRichard Henderson     case INDEX_op_or_vec:
1583d2fd745fSRichard Henderson     case INDEX_op_xor_vec:
1584212be173SRichard Henderson     case INDEX_op_cmp_vec:
1585d2fd745fSRichard Henderson         return have_vec;
1586d2fd745fSRichard Henderson     case INDEX_op_dup2_vec:
1587d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_REG_BITS == 32;
1588d2fd745fSRichard Henderson     case INDEX_op_not_vec:
1589d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_not_vec;
1590d2fd745fSRichard Henderson     case INDEX_op_neg_vec:
1591d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_neg_vec;
1592d2fd745fSRichard Henderson     case INDEX_op_andc_vec:
1593d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_andc_vec;
1594d2fd745fSRichard Henderson     case INDEX_op_orc_vec:
1595d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_orc_vec;
15963774030aSRichard Henderson     case INDEX_op_mul_vec:
15973774030aSRichard Henderson         return have_vec && TCG_TARGET_HAS_mul_vec;
1598d0ec9796SRichard Henderson     case INDEX_op_shli_vec:
1599d0ec9796SRichard Henderson     case INDEX_op_shri_vec:
1600d0ec9796SRichard Henderson     case INDEX_op_sari_vec:
1601d0ec9796SRichard Henderson         return have_vec && TCG_TARGET_HAS_shi_vec;
1602d0ec9796SRichard Henderson     case INDEX_op_shls_vec:
1603d0ec9796SRichard Henderson     case INDEX_op_shrs_vec:
1604d0ec9796SRichard Henderson     case INDEX_op_sars_vec:
1605d0ec9796SRichard Henderson         return have_vec && TCG_TARGET_HAS_shs_vec;
1606d0ec9796SRichard Henderson     case INDEX_op_shlv_vec:
1607d0ec9796SRichard Henderson     case INDEX_op_shrv_vec:
1608d0ec9796SRichard Henderson     case INDEX_op_sarv_vec:
1609d0ec9796SRichard Henderson         return have_vec && TCG_TARGET_HAS_shv_vec;
1610d2fd745fSRichard Henderson 
1611db432672SRichard Henderson     default:
1612db432672SRichard Henderson         tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS);
1613db432672SRichard Henderson         return true;
1614be0f34b5SRichard Henderson     }
1615be0f34b5SRichard Henderson }
1616be0f34b5SRichard Henderson 
161739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment
161839cf05d3Sbellard    and endian swap. Maybe it would be better to do the alignment
161939cf05d3Sbellard    and endian swap in tcg_reg_alloc_call(). */
1620ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args)
1621c896fe29Sbellard {
162275e8b9b7SRichard Henderson     int i, real_args, nb_rets, pi;
1623bbb8a1b4SRichard Henderson     unsigned sizemask, flags;
1624afb49896SRichard Henderson     TCGHelperInfo *info;
162575e8b9b7SRichard Henderson     TCGOp *op;
1626afb49896SRichard Henderson 
1627619205fdSEmilio G. Cota     info = g_hash_table_lookup(helper_table, (gpointer)func);
1628bbb8a1b4SRichard Henderson     flags = info->flags;
1629bbb8a1b4SRichard Henderson     sizemask = info->sizemask;
16302bece2c8SRichard Henderson 
163134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \
163234b1a49cSRichard Henderson     && !defined(CONFIG_TCG_INTERPRETER)
163334b1a49cSRichard Henderson     /* We have 64-bit values in one register, but need to pass as two
163434b1a49cSRichard Henderson        separate parameters.  Split them.  */
163534b1a49cSRichard Henderson     int orig_sizemask = sizemask;
163634b1a49cSRichard Henderson     int orig_nargs = nargs;
163734b1a49cSRichard Henderson     TCGv_i64 retl, reth;
1638ae8b75dcSRichard Henderson     TCGTemp *split_args[MAX_OPC_PARAM];
163934b1a49cSRichard Henderson 
1640f764718dSRichard Henderson     retl = NULL;
1641f764718dSRichard Henderson     reth = NULL;
164234b1a49cSRichard Henderson     if (sizemask != 0) {
164334b1a49cSRichard Henderson         for (i = real_args = 0; i < nargs; ++i) {
164434b1a49cSRichard Henderson             int is_64bit = sizemask & (1 << (i+1)*2);
164534b1a49cSRichard Henderson             if (is_64bit) {
1646085272b3SRichard Henderson                 TCGv_i64 orig = temp_tcgv_i64(args[i]);
164734b1a49cSRichard Henderson                 TCGv_i32 h = tcg_temp_new_i32();
164834b1a49cSRichard Henderson                 TCGv_i32 l = tcg_temp_new_i32();
164934b1a49cSRichard Henderson                 tcg_gen_extr_i64_i32(l, h, orig);
1650ae8b75dcSRichard Henderson                 split_args[real_args++] = tcgv_i32_temp(h);
1651ae8b75dcSRichard Henderson                 split_args[real_args++] = tcgv_i32_temp(l);
165234b1a49cSRichard Henderson             } else {
165334b1a49cSRichard Henderson                 split_args[real_args++] = args[i];
165434b1a49cSRichard Henderson             }
165534b1a49cSRichard Henderson         }
165634b1a49cSRichard Henderson         nargs = real_args;
165734b1a49cSRichard Henderson         args = split_args;
165834b1a49cSRichard Henderson         sizemask = 0;
165934b1a49cSRichard Henderson     }
166034b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
16612bece2c8SRichard Henderson     for (i = 0; i < nargs; ++i) {
16622bece2c8SRichard Henderson         int is_64bit = sizemask & (1 << (i+1)*2);
16632bece2c8SRichard Henderson         int is_signed = sizemask & (2 << (i+1)*2);
16642bece2c8SRichard Henderson         if (!is_64bit) {
16652bece2c8SRichard Henderson             TCGv_i64 temp = tcg_temp_new_i64();
1666085272b3SRichard Henderson             TCGv_i64 orig = temp_tcgv_i64(args[i]);
16672bece2c8SRichard Henderson             if (is_signed) {
16682bece2c8SRichard Henderson                 tcg_gen_ext32s_i64(temp, orig);
16692bece2c8SRichard Henderson             } else {
16702bece2c8SRichard Henderson                 tcg_gen_ext32u_i64(temp, orig);
16712bece2c8SRichard Henderson             }
1672ae8b75dcSRichard Henderson             args[i] = tcgv_i64_temp(temp);
16732bece2c8SRichard Henderson         }
16742bece2c8SRichard Henderson     }
16752bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */
16762bece2c8SRichard Henderson 
167715fa08f8SRichard Henderson     op = tcg_emit_op(INDEX_op_call);
167875e8b9b7SRichard Henderson 
167975e8b9b7SRichard Henderson     pi = 0;
1680ae8b75dcSRichard Henderson     if (ret != NULL) {
168134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \
168234b1a49cSRichard Henderson     && !defined(CONFIG_TCG_INTERPRETER)
168334b1a49cSRichard Henderson         if (orig_sizemask & 1) {
168434b1a49cSRichard Henderson             /* The 32-bit ABI is going to return the 64-bit value in
168534b1a49cSRichard Henderson                the %o0/%o1 register pair.  Prepare for this by using
168634b1a49cSRichard Henderson                two return temporaries, and reassemble below.  */
168734b1a49cSRichard Henderson             retl = tcg_temp_new_i64();
168834b1a49cSRichard Henderson             reth = tcg_temp_new_i64();
1689ae8b75dcSRichard Henderson             op->args[pi++] = tcgv_i64_arg(reth);
1690ae8b75dcSRichard Henderson             op->args[pi++] = tcgv_i64_arg(retl);
169134b1a49cSRichard Henderson             nb_rets = 2;
169234b1a49cSRichard Henderson         } else {
1693ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
169434b1a49cSRichard Henderson             nb_rets = 1;
169534b1a49cSRichard Henderson         }
169634b1a49cSRichard Henderson #else
169734b1a49cSRichard Henderson         if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) {
169802eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN
1699ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret + 1);
1700ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
1701a7812ae4Spbrook #else
1702ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
1703ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret + 1);
1704a7812ae4Spbrook #endif
1705a7812ae4Spbrook             nb_rets = 2;
170634b1a49cSRichard Henderson         } else {
1707ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
1708a7812ae4Spbrook             nb_rets = 1;
1709a7812ae4Spbrook         }
171034b1a49cSRichard Henderson #endif
1711a7812ae4Spbrook     } else {
1712a7812ae4Spbrook         nb_rets = 0;
1713a7812ae4Spbrook     }
1714cd9090aaSRichard Henderson     TCGOP_CALLO(op) = nb_rets;
171575e8b9b7SRichard Henderson 
1716a7812ae4Spbrook     real_args = 0;
1717a7812ae4Spbrook     for (i = 0; i < nargs; i++) {
17182bece2c8SRichard Henderson         int is_64bit = sizemask & (1 << (i+1)*2);
1719bbb8a1b4SRichard Henderson         if (TCG_TARGET_REG_BITS < 64 && is_64bit) {
172039cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS
172139cf05d3Sbellard             /* some targets want aligned 64 bit args */
1722ebd486d5Smalc             if (real_args & 1) {
172375e8b9b7SRichard Henderson                 op->args[pi++] = TCG_CALL_DUMMY_ARG;
1724ebd486d5Smalc                 real_args++;
172539cf05d3Sbellard             }
172639cf05d3Sbellard #endif
17273f90f252SRichard Henderson            /* If stack grows up, then we will be placing successive
17283f90f252SRichard Henderson               arguments at lower addresses, which means we need to
17293f90f252SRichard Henderson               reverse the order compared to how we would normally
17303f90f252SRichard Henderson               treat either big or little-endian.  For those arguments
17313f90f252SRichard Henderson               that will wind up in registers, this still works for
17323f90f252SRichard Henderson               HPPA (the only current STACK_GROWSUP target) since the
17333f90f252SRichard Henderson               argument registers are *also* allocated in decreasing
17343f90f252SRichard Henderson               order.  If another such target is added, this logic may
17353f90f252SRichard Henderson               have to get more complicated to differentiate between
17363f90f252SRichard Henderson               stack arguments and register arguments.  */
173702eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP)
1738ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i] + 1);
1739ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i]);
1740c896fe29Sbellard #else
1741ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i]);
1742ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i] + 1);
1743c896fe29Sbellard #endif
1744a7812ae4Spbrook             real_args += 2;
17452bece2c8SRichard Henderson             continue;
17462bece2c8SRichard Henderson         }
17472bece2c8SRichard Henderson 
1748ae8b75dcSRichard Henderson         op->args[pi++] = temp_arg(args[i]);
1749a7812ae4Spbrook         real_args++;
1750c896fe29Sbellard     }
175175e8b9b7SRichard Henderson     op->args[pi++] = (uintptr_t)func;
175275e8b9b7SRichard Henderson     op->args[pi++] = flags;
1753cd9090aaSRichard Henderson     TCGOP_CALLI(op) = real_args;
1754a7812ae4Spbrook 
175575e8b9b7SRichard Henderson     /* Make sure the fields didn't overflow.  */
1756cd9090aaSRichard Henderson     tcg_debug_assert(TCGOP_CALLI(op) == real_args);
175775e8b9b7SRichard Henderson     tcg_debug_assert(pi <= ARRAY_SIZE(op->args));
17582bece2c8SRichard Henderson 
175934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \
176034b1a49cSRichard Henderson     && !defined(CONFIG_TCG_INTERPRETER)
176134b1a49cSRichard Henderson     /* Free all of the parts we allocated above.  */
176234b1a49cSRichard Henderson     for (i = real_args = 0; i < orig_nargs; ++i) {
176334b1a49cSRichard Henderson         int is_64bit = orig_sizemask & (1 << (i+1)*2);
176434b1a49cSRichard Henderson         if (is_64bit) {
1765085272b3SRichard Henderson             tcg_temp_free_internal(args[real_args++]);
1766085272b3SRichard Henderson             tcg_temp_free_internal(args[real_args++]);
176734b1a49cSRichard Henderson         } else {
176834b1a49cSRichard Henderson             real_args++;
176934b1a49cSRichard Henderson         }
177034b1a49cSRichard Henderson     }
177134b1a49cSRichard Henderson     if (orig_sizemask & 1) {
177234b1a49cSRichard Henderson         /* The 32-bit ABI returned two 32-bit pieces.  Re-assemble them.
177334b1a49cSRichard Henderson            Note that describing these as TCGv_i64 eliminates an unnecessary
177434b1a49cSRichard Henderson            zero-extension that tcg_gen_concat_i32_i64 would create.  */
1775085272b3SRichard Henderson         tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth);
177634b1a49cSRichard Henderson         tcg_temp_free_i64(retl);
177734b1a49cSRichard Henderson         tcg_temp_free_i64(reth);
177834b1a49cSRichard Henderson     }
177934b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
17802bece2c8SRichard Henderson     for (i = 0; i < nargs; ++i) {
17812bece2c8SRichard Henderson         int is_64bit = sizemask & (1 << (i+1)*2);
17822bece2c8SRichard Henderson         if (!is_64bit) {
1783085272b3SRichard Henderson             tcg_temp_free_internal(args[i]);
17842bece2c8SRichard Henderson         }
17852bece2c8SRichard Henderson     }
17862bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */
1787a7812ae4Spbrook }
1788c896fe29Sbellard 
17898fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s)
1790c896fe29Sbellard {
1791ac3b8891SRichard Henderson     int i, n;
1792c896fe29Sbellard     TCGTemp *ts;
1793ac3b8891SRichard Henderson 
1794ac3b8891SRichard Henderson     for (i = 0, n = s->nb_globals; i < n; i++) {
1795c896fe29Sbellard         ts = &s->temps[i];
1796ac3b8891SRichard Henderson         ts->val_type = (ts->fixed_reg ? TEMP_VAL_REG : TEMP_VAL_MEM);
1797c896fe29Sbellard     }
1798ac3b8891SRichard Henderson     for (n = s->nb_temps; i < n; i++) {
1799e8996ee0Sbellard         ts = &s->temps[i];
1800ac3b8891SRichard Henderson         ts->val_type = (ts->temp_local ? TEMP_VAL_MEM : TEMP_VAL_DEAD);
1801e8996ee0Sbellard         ts->mem_allocated = 0;
1802e8996ee0Sbellard         ts->fixed_reg = 0;
1803e8996ee0Sbellard     }
1804f8b2f202SRichard Henderson 
1805f8b2f202SRichard Henderson     memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp));
1806c896fe29Sbellard }
1807c896fe29Sbellard 
1808f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size,
1809f8b2f202SRichard Henderson                                  TCGTemp *ts)
1810c896fe29Sbellard {
18111807f4c4SRichard Henderson     int idx = temp_idx(ts);
1812ac56dd48Spbrook 
1813fa477d25SRichard Henderson     if (ts->temp_global) {
1814ac56dd48Spbrook         pstrcpy(buf, buf_size, ts->name);
1815f8b2f202SRichard Henderson     } else if (ts->temp_local) {
1816641d5fbeSbellard         snprintf(buf, buf_size, "loc%d", idx - s->nb_globals);
1817f8b2f202SRichard Henderson     } else {
1818ac56dd48Spbrook         snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals);
1819c896fe29Sbellard     }
1820c896fe29Sbellard     return buf;
1821c896fe29Sbellard }
1822c896fe29Sbellard 
182343439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf,
182443439139SRichard Henderson                              int buf_size, TCGArg arg)
1825f8b2f202SRichard Henderson {
182643439139SRichard Henderson     return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg));
1827f8b2f202SRichard Henderson }
1828f8b2f202SRichard Henderson 
18296e085f72SRichard Henderson /* Find helper name.  */
18306e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val)
1831e8996ee0Sbellard {
18326e085f72SRichard Henderson     const char *ret = NULL;
1833619205fdSEmilio G. Cota     if (helper_table) {
1834619205fdSEmilio G. Cota         TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val);
183572866e82SRichard Henderson         if (info) {
183672866e82SRichard Henderson             ret = info->name;
183772866e82SRichard Henderson         }
1838e8996ee0Sbellard     }
18396e085f72SRichard Henderson     return ret;
18404dc81f28Sbellard }
18414dc81f28Sbellard 
1842f48f3edeSblueswir1 static const char * const cond_name[] =
1843f48f3edeSblueswir1 {
18440aed257fSRichard Henderson     [TCG_COND_NEVER] = "never",
18450aed257fSRichard Henderson     [TCG_COND_ALWAYS] = "always",
1846f48f3edeSblueswir1     [TCG_COND_EQ] = "eq",
1847f48f3edeSblueswir1     [TCG_COND_NE] = "ne",
1848f48f3edeSblueswir1     [TCG_COND_LT] = "lt",
1849f48f3edeSblueswir1     [TCG_COND_GE] = "ge",
1850f48f3edeSblueswir1     [TCG_COND_LE] = "le",
1851f48f3edeSblueswir1     [TCG_COND_GT] = "gt",
1852f48f3edeSblueswir1     [TCG_COND_LTU] = "ltu",
1853f48f3edeSblueswir1     [TCG_COND_GEU] = "geu",
1854f48f3edeSblueswir1     [TCG_COND_LEU] = "leu",
1855f48f3edeSblueswir1     [TCG_COND_GTU] = "gtu"
1856f48f3edeSblueswir1 };
1857f48f3edeSblueswir1 
1858f713d6adSRichard Henderson static const char * const ldst_name[] =
1859f713d6adSRichard Henderson {
1860f713d6adSRichard Henderson     [MO_UB]   = "ub",
1861f713d6adSRichard Henderson     [MO_SB]   = "sb",
1862f713d6adSRichard Henderson     [MO_LEUW] = "leuw",
1863f713d6adSRichard Henderson     [MO_LESW] = "lesw",
1864f713d6adSRichard Henderson     [MO_LEUL] = "leul",
1865f713d6adSRichard Henderson     [MO_LESL] = "lesl",
1866f713d6adSRichard Henderson     [MO_LEQ]  = "leq",
1867f713d6adSRichard Henderson     [MO_BEUW] = "beuw",
1868f713d6adSRichard Henderson     [MO_BESW] = "besw",
1869f713d6adSRichard Henderson     [MO_BEUL] = "beul",
1870f713d6adSRichard Henderson     [MO_BESL] = "besl",
1871f713d6adSRichard Henderson     [MO_BEQ]  = "beq",
1872f713d6adSRichard Henderson };
1873f713d6adSRichard Henderson 
18741f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = {
18751f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY
18761f00b27fSSergey Sorokin     [MO_UNALN >> MO_ASHIFT]    = "un+",
18771f00b27fSSergey Sorokin     [MO_ALIGN >> MO_ASHIFT]    = "",
18781f00b27fSSergey Sorokin #else
18791f00b27fSSergey Sorokin     [MO_UNALN >> MO_ASHIFT]    = "",
18801f00b27fSSergey Sorokin     [MO_ALIGN >> MO_ASHIFT]    = "al+",
18811f00b27fSSergey Sorokin #endif
18821f00b27fSSergey Sorokin     [MO_ALIGN_2 >> MO_ASHIFT]  = "al2+",
18831f00b27fSSergey Sorokin     [MO_ALIGN_4 >> MO_ASHIFT]  = "al4+",
18841f00b27fSSergey Sorokin     [MO_ALIGN_8 >> MO_ASHIFT]  = "al8+",
18851f00b27fSSergey Sorokin     [MO_ALIGN_16 >> MO_ASHIFT] = "al16+",
18861f00b27fSSergey Sorokin     [MO_ALIGN_32 >> MO_ASHIFT] = "al32+",
18871f00b27fSSergey Sorokin     [MO_ALIGN_64 >> MO_ASHIFT] = "al64+",
18881f00b27fSSergey Sorokin };
18891f00b27fSSergey Sorokin 
1890*b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d)
1891*b016486eSRichard Henderson {
1892*b016486eSRichard Henderson     return (d & (d - 1)) == 0;
1893*b016486eSRichard Henderson }
1894*b016486eSRichard Henderson 
1895*b016486eSRichard Henderson static inline TCGReg tcg_regset_first(TCGRegSet d)
1896*b016486eSRichard Henderson {
1897*b016486eSRichard Henderson     if (TCG_TARGET_NB_REGS <= 32) {
1898*b016486eSRichard Henderson         return ctz32(d);
1899*b016486eSRichard Henderson     } else {
1900*b016486eSRichard Henderson         return ctz64(d);
1901*b016486eSRichard Henderson     }
1902*b016486eSRichard Henderson }
1903*b016486eSRichard Henderson 
1904eeacee4dSBlue Swirl void tcg_dump_ops(TCGContext *s)
1905c896fe29Sbellard {
1906c896fe29Sbellard     char buf[128];
1907c45cb8bbSRichard Henderson     TCGOp *op;
1908c896fe29Sbellard 
190915fa08f8SRichard Henderson     QTAILQ_FOREACH(op, &s->ops, link) {
1910c45cb8bbSRichard Henderson         int i, k, nb_oargs, nb_iargs, nb_cargs;
1911c45cb8bbSRichard Henderson         const TCGOpDef *def;
1912c45cb8bbSRichard Henderson         TCGOpcode c;
1913bdfb460eSRichard Henderson         int col = 0;
1914c45cb8bbSRichard Henderson 
1915c45cb8bbSRichard Henderson         c = op->opc;
1916c896fe29Sbellard         def = &tcg_op_defs[c];
1917c45cb8bbSRichard Henderson 
1918765b842aSRichard Henderson         if (c == INDEX_op_insn_start) {
1919*b016486eSRichard Henderson             nb_oargs = 0;
192015fa08f8SRichard Henderson             col += qemu_log("\n ----");
19219aef40edSRichard Henderson 
19229aef40edSRichard Henderson             for (i = 0; i < TARGET_INSN_START_WORDS; ++i) {
19239aef40edSRichard Henderson                 target_ulong a;
19247e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
1925efee3746SRichard Henderson                 a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]);
19267e4597d7Sbellard #else
1927efee3746SRichard Henderson                 a = op->args[i];
19287e4597d7Sbellard #endif
1929bdfb460eSRichard Henderson                 col += qemu_log(" " TARGET_FMT_lx, a);
1930eeacee4dSBlue Swirl             }
19317e4597d7Sbellard         } else if (c == INDEX_op_call) {
1932c896fe29Sbellard             /* variable number of arguments */
1933cd9090aaSRichard Henderson             nb_oargs = TCGOP_CALLO(op);
1934cd9090aaSRichard Henderson             nb_iargs = TCGOP_CALLI(op);
1935c896fe29Sbellard             nb_cargs = def->nb_cargs;
1936b03cce8eSbellard 
1937cf066674SRichard Henderson             /* function name, flags, out args */
1938bdfb460eSRichard Henderson             col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name,
1939efee3746SRichard Henderson                             tcg_find_helper(s, op->args[nb_oargs + nb_iargs]),
1940efee3746SRichard Henderson                             op->args[nb_oargs + nb_iargs + 1], nb_oargs);
1941b03cce8eSbellard             for (i = 0; i < nb_oargs; i++) {
194243439139SRichard Henderson                 col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf),
1943efee3746SRichard Henderson                                                        op->args[i]));
1944b03cce8eSbellard             }
1945cf066674SRichard Henderson             for (i = 0; i < nb_iargs; i++) {
1946efee3746SRichard Henderson                 TCGArg arg = op->args[nb_oargs + i];
1947cf066674SRichard Henderson                 const char *t = "<dummy>";
1948cf066674SRichard Henderson                 if (arg != TCG_CALL_DUMMY_ARG) {
194943439139SRichard Henderson                     t = tcg_get_arg_str(s, buf, sizeof(buf), arg);
1950b03cce8eSbellard                 }
1951bdfb460eSRichard Henderson                 col += qemu_log(",%s", t);
1952e8996ee0Sbellard             }
1953b03cce8eSbellard         } else {
1954bdfb460eSRichard Henderson             col += qemu_log(" %s ", def->name);
1955c45cb8bbSRichard Henderson 
1956c896fe29Sbellard             nb_oargs = def->nb_oargs;
1957c896fe29Sbellard             nb_iargs = def->nb_iargs;
1958c896fe29Sbellard             nb_cargs = def->nb_cargs;
1959c896fe29Sbellard 
1960d2fd745fSRichard Henderson             if (def->flags & TCG_OPF_VECTOR) {
1961d2fd745fSRichard Henderson                 col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op),
1962d2fd745fSRichard Henderson                                 8 << TCGOP_VECE(op));
1963d2fd745fSRichard Henderson             }
1964d2fd745fSRichard Henderson 
1965c896fe29Sbellard             k = 0;
1966c896fe29Sbellard             for (i = 0; i < nb_oargs; i++) {
1967eeacee4dSBlue Swirl                 if (k != 0) {
1968bdfb460eSRichard Henderson                     col += qemu_log(",");
1969eeacee4dSBlue Swirl                 }
197043439139SRichard Henderson                 col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf),
1971efee3746SRichard Henderson                                                       op->args[k++]));
1972c896fe29Sbellard             }
1973c896fe29Sbellard             for (i = 0; i < nb_iargs; i++) {
1974eeacee4dSBlue Swirl                 if (k != 0) {
1975bdfb460eSRichard Henderson                     col += qemu_log(",");
1976eeacee4dSBlue Swirl                 }
197743439139SRichard Henderson                 col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf),
1978efee3746SRichard Henderson                                                       op->args[k++]));
1979c896fe29Sbellard             }
1980be210acbSRichard Henderson             switch (c) {
1981be210acbSRichard Henderson             case INDEX_op_brcond_i32:
1982ffc5ea09SRichard Henderson             case INDEX_op_setcond_i32:
1983ffc5ea09SRichard Henderson             case INDEX_op_movcond_i32:
1984be210acbSRichard Henderson             case INDEX_op_brcond2_i32:
1985be210acbSRichard Henderson             case INDEX_op_setcond2_i32:
1986ffc5ea09SRichard Henderson             case INDEX_op_brcond_i64:
1987be210acbSRichard Henderson             case INDEX_op_setcond_i64:
1988ffc5ea09SRichard Henderson             case INDEX_op_movcond_i64:
1989212be173SRichard Henderson             case INDEX_op_cmp_vec:
1990efee3746SRichard Henderson                 if (op->args[k] < ARRAY_SIZE(cond_name)
1991efee3746SRichard Henderson                     && cond_name[op->args[k]]) {
1992efee3746SRichard Henderson                     col += qemu_log(",%s", cond_name[op->args[k++]]);
1993eeacee4dSBlue Swirl                 } else {
1994efee3746SRichard Henderson                     col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]);
1995eeacee4dSBlue Swirl                 }
1996f48f3edeSblueswir1                 i = 1;
1997be210acbSRichard Henderson                 break;
1998f713d6adSRichard Henderson             case INDEX_op_qemu_ld_i32:
1999f713d6adSRichard Henderson             case INDEX_op_qemu_st_i32:
2000f713d6adSRichard Henderson             case INDEX_op_qemu_ld_i64:
2001f713d6adSRichard Henderson             case INDEX_op_qemu_st_i64:
200259227d5dSRichard Henderson                 {
2003efee3746SRichard Henderson                     TCGMemOpIdx oi = op->args[k++];
200459227d5dSRichard Henderson                     TCGMemOp op = get_memop(oi);
200559227d5dSRichard Henderson                     unsigned ix = get_mmuidx(oi);
200659227d5dSRichard Henderson 
200759c4b7e8SRichard Henderson                     if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) {
2008bdfb460eSRichard Henderson                         col += qemu_log(",$0x%x,%u", op, ix);
200959c4b7e8SRichard Henderson                     } else {
20101f00b27fSSergey Sorokin                         const char *s_al, *s_op;
20111f00b27fSSergey Sorokin                         s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT];
201259c4b7e8SRichard Henderson                         s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)];
2013bdfb460eSRichard Henderson                         col += qemu_log(",%s%s,%u", s_al, s_op, ix);
2014f713d6adSRichard Henderson                     }
2015f713d6adSRichard Henderson                     i = 1;
201659227d5dSRichard Henderson                 }
2017f713d6adSRichard Henderson                 break;
2018be210acbSRichard Henderson             default:
2019f48f3edeSblueswir1                 i = 0;
2020be210acbSRichard Henderson                 break;
2021be210acbSRichard Henderson             }
202251e3972cSRichard Henderson             switch (c) {
202351e3972cSRichard Henderson             case INDEX_op_set_label:
202451e3972cSRichard Henderson             case INDEX_op_br:
202551e3972cSRichard Henderson             case INDEX_op_brcond_i32:
202651e3972cSRichard Henderson             case INDEX_op_brcond_i64:
202751e3972cSRichard Henderson             case INDEX_op_brcond2_i32:
2028efee3746SRichard Henderson                 col += qemu_log("%s$L%d", k ? "," : "",
2029efee3746SRichard Henderson                                 arg_label(op->args[k])->id);
203051e3972cSRichard Henderson                 i++, k++;
203151e3972cSRichard Henderson                 break;
203251e3972cSRichard Henderson             default:
203351e3972cSRichard Henderson                 break;
2034eeacee4dSBlue Swirl             }
203551e3972cSRichard Henderson             for (; i < nb_cargs; i++, k++) {
2036efee3746SRichard Henderson                 col += qemu_log("%s$0x%" TCG_PRIlx, k ? "," : "", op->args[k]);
2037bdfb460eSRichard Henderson             }
2038bdfb460eSRichard Henderson         }
2039bdfb460eSRichard Henderson         if (op->life) {
2040bdfb460eSRichard Henderson             unsigned life = op->life;
2041bdfb460eSRichard Henderson 
2042bdfb460eSRichard Henderson             for (; col < 48; ++col) {
2043bdfb460eSRichard Henderson                 putc(' ', qemu_logfile);
2044bdfb460eSRichard Henderson             }
2045bdfb460eSRichard Henderson 
2046bdfb460eSRichard Henderson             if (life & (SYNC_ARG * 3)) {
2047bdfb460eSRichard Henderson                 qemu_log("  sync:");
2048bdfb460eSRichard Henderson                 for (i = 0; i < 2; ++i) {
2049bdfb460eSRichard Henderson                     if (life & (SYNC_ARG << i)) {
2050bdfb460eSRichard Henderson                         qemu_log(" %d", i);
2051bdfb460eSRichard Henderson                     }
2052bdfb460eSRichard Henderson                 }
2053bdfb460eSRichard Henderson             }
2054bdfb460eSRichard Henderson             life /= DEAD_ARG;
2055bdfb460eSRichard Henderson             if (life) {
2056bdfb460eSRichard Henderson                 qemu_log("  dead:");
2057bdfb460eSRichard Henderson                 for (i = 0; life; ++i, life >>= 1) {
2058bdfb460eSRichard Henderson                     if (life & 1) {
2059bdfb460eSRichard Henderson                         qemu_log(" %d", i);
2060bdfb460eSRichard Henderson                     }
2061bdfb460eSRichard Henderson                 }
2062c896fe29Sbellard             }
2063b03cce8eSbellard         }
2064eeacee4dSBlue Swirl         qemu_log("\n");
2065c896fe29Sbellard     }
2066c896fe29Sbellard }
2067c896fe29Sbellard 
2068c896fe29Sbellard /* we give more priority to constraints with less registers */
2069c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k)
2070c896fe29Sbellard {
2071c896fe29Sbellard     const TCGArgConstraint *arg_ct;
2072c896fe29Sbellard 
2073c896fe29Sbellard     int i, n;
2074c896fe29Sbellard     arg_ct = &def->args_ct[k];
2075c896fe29Sbellard     if (arg_ct->ct & TCG_CT_ALIAS) {
2076c896fe29Sbellard         /* an alias is equivalent to a single register */
2077c896fe29Sbellard         n = 1;
2078c896fe29Sbellard     } else {
2079c896fe29Sbellard         if (!(arg_ct->ct & TCG_CT_REG))
2080c896fe29Sbellard             return 0;
2081c896fe29Sbellard         n = 0;
2082c896fe29Sbellard         for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
2083c896fe29Sbellard             if (tcg_regset_test_reg(arg_ct->u.regs, i))
2084c896fe29Sbellard                 n++;
2085c896fe29Sbellard         }
2086c896fe29Sbellard     }
2087c896fe29Sbellard     return TCG_TARGET_NB_REGS - n + 1;
2088c896fe29Sbellard }
2089c896fe29Sbellard 
2090c896fe29Sbellard /* sort from highest priority to lowest */
2091c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n)
2092c896fe29Sbellard {
2093c896fe29Sbellard     int i, j, p1, p2, tmp;
2094c896fe29Sbellard 
2095c896fe29Sbellard     for(i = 0; i < n; i++)
2096c896fe29Sbellard         def->sorted_args[start + i] = start + i;
2097c896fe29Sbellard     if (n <= 1)
2098c896fe29Sbellard         return;
2099c896fe29Sbellard     for(i = 0; i < n - 1; i++) {
2100c896fe29Sbellard         for(j = i + 1; j < n; j++) {
2101c896fe29Sbellard             p1 = get_constraint_priority(def, def->sorted_args[start + i]);
2102c896fe29Sbellard             p2 = get_constraint_priority(def, def->sorted_args[start + j]);
2103c896fe29Sbellard             if (p1 < p2) {
2104c896fe29Sbellard                 tmp = def->sorted_args[start + i];
2105c896fe29Sbellard                 def->sorted_args[start + i] = def->sorted_args[start + j];
2106c896fe29Sbellard                 def->sorted_args[start + j] = tmp;
2107c896fe29Sbellard             }
2108c896fe29Sbellard         }
2109c896fe29Sbellard     }
2110c896fe29Sbellard }
2111c896fe29Sbellard 
2112f69d277eSRichard Henderson static void process_op_defs(TCGContext *s)
2113c896fe29Sbellard {
2114a9751609SRichard Henderson     TCGOpcode op;
2115c896fe29Sbellard 
2116f69d277eSRichard Henderson     for (op = 0; op < NB_OPS; op++) {
2117f69d277eSRichard Henderson         TCGOpDef *def = &tcg_op_defs[op];
2118f69d277eSRichard Henderson         const TCGTargetOpDef *tdefs;
2119069ea736SRichard Henderson         TCGType type;
2120069ea736SRichard Henderson         int i, nb_args;
2121f69d277eSRichard Henderson 
2122f69d277eSRichard Henderson         if (def->flags & TCG_OPF_NOT_PRESENT) {
2123f69d277eSRichard Henderson             continue;
2124f69d277eSRichard Henderson         }
2125f69d277eSRichard Henderson 
2126c896fe29Sbellard         nb_args = def->nb_iargs + def->nb_oargs;
2127f69d277eSRichard Henderson         if (nb_args == 0) {
2128f69d277eSRichard Henderson             continue;
2129f69d277eSRichard Henderson         }
2130f69d277eSRichard Henderson 
2131f69d277eSRichard Henderson         tdefs = tcg_target_op_def(op);
2132f69d277eSRichard Henderson         /* Missing TCGTargetOpDef entry. */
2133f69d277eSRichard Henderson         tcg_debug_assert(tdefs != NULL);
2134f69d277eSRichard Henderson 
2135069ea736SRichard Henderson         type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32);
2136c896fe29Sbellard         for (i = 0; i < nb_args; i++) {
2137f69d277eSRichard Henderson             const char *ct_str = tdefs->args_ct_str[i];
2138f69d277eSRichard Henderson             /* Incomplete TCGTargetOpDef entry. */
2139eabb7b91SAurelien Jarno             tcg_debug_assert(ct_str != NULL);
2140f69d277eSRichard Henderson 
2141ccb1bb66SRichard Henderson             def->args_ct[i].u.regs = 0;
2142c896fe29Sbellard             def->args_ct[i].ct = 0;
214317280ff4SRichard Henderson             while (*ct_str != '\0') {
214417280ff4SRichard Henderson                 switch(*ct_str) {
214517280ff4SRichard Henderson                 case '0' ... '9':
214617280ff4SRichard Henderson                     {
214717280ff4SRichard Henderson                         int oarg = *ct_str - '0';
214817280ff4SRichard Henderson                         tcg_debug_assert(ct_str == tdefs->args_ct_str[i]);
2149eabb7b91SAurelien Jarno                         tcg_debug_assert(oarg < def->nb_oargs);
2150eabb7b91SAurelien Jarno                         tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG);
215117280ff4SRichard Henderson                         /* TCG_CT_ALIAS is for the output arguments.
215217280ff4SRichard Henderson                            The input is tagged with TCG_CT_IALIAS. */
2153c896fe29Sbellard                         def->args_ct[i] = def->args_ct[oarg];
215417280ff4SRichard Henderson                         def->args_ct[oarg].ct |= TCG_CT_ALIAS;
21555ff9d6a4Sbellard                         def->args_ct[oarg].alias_index = i;
2156c896fe29Sbellard                         def->args_ct[i].ct |= TCG_CT_IALIAS;
21575ff9d6a4Sbellard                         def->args_ct[i].alias_index = oarg;
215817280ff4SRichard Henderson                     }
215917280ff4SRichard Henderson                     ct_str++;
2160c896fe29Sbellard                     break;
216182790a87SRichard Henderson                 case '&':
216282790a87SRichard Henderson                     def->args_ct[i].ct |= TCG_CT_NEWREG;
216382790a87SRichard Henderson                     ct_str++;
216482790a87SRichard Henderson                     break;
2165c896fe29Sbellard                 case 'i':
2166c896fe29Sbellard                     def->args_ct[i].ct |= TCG_CT_CONST;
2167c896fe29Sbellard                     ct_str++;
2168c896fe29Sbellard                     break;
2169c896fe29Sbellard                 default:
2170069ea736SRichard Henderson                     ct_str = target_parse_constraint(&def->args_ct[i],
2171069ea736SRichard Henderson                                                      ct_str, type);
2172f69d277eSRichard Henderson                     /* Typo in TCGTargetOpDef constraint. */
2173069ea736SRichard Henderson                     tcg_debug_assert(ct_str != NULL);
2174c896fe29Sbellard                 }
2175c896fe29Sbellard             }
2176c896fe29Sbellard         }
2177c896fe29Sbellard 
2178c68aaa18SStefan Weil         /* TCGTargetOpDef entry with too much information? */
2179eabb7b91SAurelien Jarno         tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL);
2180c68aaa18SStefan Weil 
2181c896fe29Sbellard         /* sort the constraints (XXX: this is just an heuristic) */
2182c896fe29Sbellard         sort_constraints(def, 0, def->nb_oargs);
2183c896fe29Sbellard         sort_constraints(def, def->nb_oargs, def->nb_iargs);
2184c896fe29Sbellard     }
2185c896fe29Sbellard }
2186c896fe29Sbellard 
21870c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op)
21880c627cdcSRichard Henderson {
2189d88a117eSRichard Henderson     TCGLabel *label;
2190d88a117eSRichard Henderson 
2191d88a117eSRichard Henderson     switch (op->opc) {
2192d88a117eSRichard Henderson     case INDEX_op_br:
2193d88a117eSRichard Henderson         label = arg_label(op->args[0]);
2194d88a117eSRichard Henderson         label->refs--;
2195d88a117eSRichard Henderson         break;
2196d88a117eSRichard Henderson     case INDEX_op_brcond_i32:
2197d88a117eSRichard Henderson     case INDEX_op_brcond_i64:
2198d88a117eSRichard Henderson         label = arg_label(op->args[3]);
2199d88a117eSRichard Henderson         label->refs--;
2200d88a117eSRichard Henderson         break;
2201d88a117eSRichard Henderson     case INDEX_op_brcond2_i32:
2202d88a117eSRichard Henderson         label = arg_label(op->args[5]);
2203d88a117eSRichard Henderson         label->refs--;
2204d88a117eSRichard Henderson         break;
2205d88a117eSRichard Henderson     default:
2206d88a117eSRichard Henderson         break;
2207d88a117eSRichard Henderson     }
2208d88a117eSRichard Henderson 
220915fa08f8SRichard Henderson     QTAILQ_REMOVE(&s->ops, op, link);
221015fa08f8SRichard Henderson     QTAILQ_INSERT_TAIL(&s->free_ops, op, link);
2211abebf925SRichard Henderson     s->nb_ops--;
22120c627cdcSRichard Henderson 
22130c627cdcSRichard Henderson #ifdef CONFIG_PROFILER
2214c3fac113SEmilio G. Cota     atomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1);
22150c627cdcSRichard Henderson #endif
22160c627cdcSRichard Henderson }
22170c627cdcSRichard Henderson 
221815fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc)
221915fa08f8SRichard Henderson {
222015fa08f8SRichard Henderson     TCGContext *s = tcg_ctx;
222115fa08f8SRichard Henderson     TCGOp *op;
222215fa08f8SRichard Henderson 
222315fa08f8SRichard Henderson     if (likely(QTAILQ_EMPTY(&s->free_ops))) {
222415fa08f8SRichard Henderson         op = tcg_malloc(sizeof(TCGOp));
222515fa08f8SRichard Henderson     } else {
222615fa08f8SRichard Henderson         op = QTAILQ_FIRST(&s->free_ops);
222715fa08f8SRichard Henderson         QTAILQ_REMOVE(&s->free_ops, op, link);
222815fa08f8SRichard Henderson     }
222915fa08f8SRichard Henderson     memset(op, 0, offsetof(TCGOp, link));
223015fa08f8SRichard Henderson     op->opc = opc;
2231abebf925SRichard Henderson     s->nb_ops++;
223215fa08f8SRichard Henderson 
223315fa08f8SRichard Henderson     return op;
223415fa08f8SRichard Henderson }
223515fa08f8SRichard Henderson 
223615fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc)
223715fa08f8SRichard Henderson {
223815fa08f8SRichard Henderson     TCGOp *op = tcg_op_alloc(opc);
223915fa08f8SRichard Henderson     QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link);
224015fa08f8SRichard Henderson     return op;
224115fa08f8SRichard Henderson }
224215fa08f8SRichard Henderson 
2243ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc)
22445a18407fSRichard Henderson {
224515fa08f8SRichard Henderson     TCGOp *new_op = tcg_op_alloc(opc);
224615fa08f8SRichard Henderson     QTAILQ_INSERT_BEFORE(old_op, new_op, link);
22475a18407fSRichard Henderson     return new_op;
22485a18407fSRichard Henderson }
22495a18407fSRichard Henderson 
2250ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc)
22515a18407fSRichard Henderson {
225215fa08f8SRichard Henderson     TCGOp *new_op = tcg_op_alloc(opc);
225315fa08f8SRichard Henderson     QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link);
22545a18407fSRichard Henderson     return new_op;
22555a18407fSRichard Henderson }
22565a18407fSRichard Henderson 
2257b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code.  */
2258b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s)
2259b4fc67c7SRichard Henderson {
2260b4fc67c7SRichard Henderson     TCGOp *op, *op_next;
2261b4fc67c7SRichard Henderson     bool dead = false;
2262b4fc67c7SRichard Henderson 
2263b4fc67c7SRichard Henderson     QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) {
2264b4fc67c7SRichard Henderson         bool remove = dead;
2265b4fc67c7SRichard Henderson         TCGLabel *label;
2266b4fc67c7SRichard Henderson         int call_flags;
2267b4fc67c7SRichard Henderson 
2268b4fc67c7SRichard Henderson         switch (op->opc) {
2269b4fc67c7SRichard Henderson         case INDEX_op_set_label:
2270b4fc67c7SRichard Henderson             label = arg_label(op->args[0]);
2271b4fc67c7SRichard Henderson             if (label->refs == 0) {
2272b4fc67c7SRichard Henderson                 /*
2273b4fc67c7SRichard Henderson                  * While there is an occasional backward branch, virtually
2274b4fc67c7SRichard Henderson                  * all branches generated by the translators are forward.
2275b4fc67c7SRichard Henderson                  * Which means that generally we will have already removed
2276b4fc67c7SRichard Henderson                  * all references to the label that will be, and there is
2277b4fc67c7SRichard Henderson                  * little to be gained by iterating.
2278b4fc67c7SRichard Henderson                  */
2279b4fc67c7SRichard Henderson                 remove = true;
2280b4fc67c7SRichard Henderson             } else {
2281b4fc67c7SRichard Henderson                 /* Once we see a label, insns become live again.  */
2282b4fc67c7SRichard Henderson                 dead = false;
2283b4fc67c7SRichard Henderson                 remove = false;
2284b4fc67c7SRichard Henderson 
2285b4fc67c7SRichard Henderson                 /*
2286b4fc67c7SRichard Henderson                  * Optimization can fold conditional branches to unconditional.
2287b4fc67c7SRichard Henderson                  * If we find a label with one reference which is preceded by
2288b4fc67c7SRichard Henderson                  * an unconditional branch to it, remove both.  This needed to
2289b4fc67c7SRichard Henderson                  * wait until the dead code in between them was removed.
2290b4fc67c7SRichard Henderson                  */
2291b4fc67c7SRichard Henderson                 if (label->refs == 1) {
2292b4fc67c7SRichard Henderson                     TCGOp *op_prev = QTAILQ_PREV(op, TCGOpHead, link);
2293b4fc67c7SRichard Henderson                     if (op_prev->opc == INDEX_op_br &&
2294b4fc67c7SRichard Henderson                         label == arg_label(op_prev->args[0])) {
2295b4fc67c7SRichard Henderson                         tcg_op_remove(s, op_prev);
2296b4fc67c7SRichard Henderson                         remove = true;
2297b4fc67c7SRichard Henderson                     }
2298b4fc67c7SRichard Henderson                 }
2299b4fc67c7SRichard Henderson             }
2300b4fc67c7SRichard Henderson             break;
2301b4fc67c7SRichard Henderson 
2302b4fc67c7SRichard Henderson         case INDEX_op_br:
2303b4fc67c7SRichard Henderson         case INDEX_op_exit_tb:
2304b4fc67c7SRichard Henderson         case INDEX_op_goto_ptr:
2305b4fc67c7SRichard Henderson             /* Unconditional branches; everything following is dead.  */
2306b4fc67c7SRichard Henderson             dead = true;
2307b4fc67c7SRichard Henderson             break;
2308b4fc67c7SRichard Henderson 
2309b4fc67c7SRichard Henderson         case INDEX_op_call:
2310b4fc67c7SRichard Henderson             /* Notice noreturn helper calls, raising exceptions.  */
2311b4fc67c7SRichard Henderson             call_flags = op->args[TCGOP_CALLO(op) + TCGOP_CALLI(op) + 1];
2312b4fc67c7SRichard Henderson             if (call_flags & TCG_CALL_NO_RETURN) {
2313b4fc67c7SRichard Henderson                 dead = true;
2314b4fc67c7SRichard Henderson             }
2315b4fc67c7SRichard Henderson             break;
2316b4fc67c7SRichard Henderson 
2317b4fc67c7SRichard Henderson         case INDEX_op_insn_start:
2318b4fc67c7SRichard Henderson             /* Never remove -- we need to keep these for unwind.  */
2319b4fc67c7SRichard Henderson             remove = false;
2320b4fc67c7SRichard Henderson             break;
2321b4fc67c7SRichard Henderson 
2322b4fc67c7SRichard Henderson         default:
2323b4fc67c7SRichard Henderson             break;
2324b4fc67c7SRichard Henderson         }
2325b4fc67c7SRichard Henderson 
2326b4fc67c7SRichard Henderson         if (remove) {
2327b4fc67c7SRichard Henderson             tcg_op_remove(s, op);
2328b4fc67c7SRichard Henderson         }
2329b4fc67c7SRichard Henderson     }
2330b4fc67c7SRichard Henderson }
2331b4fc67c7SRichard Henderson 
/*
 * Bit flags kept in TCGTemp.state by the liveness code below:
 *   TS_DEAD - the temp's value is dead at this point;
 *   TS_MEM  - the temp is (to be) in sync with its memory slot.
 * The code below also stores 0 in state for an output that has just
 * been written and is neither dead nor synced.
 */
2332c70fbf0aSRichard Henderson #define TS_DEAD  1
2333c70fbf0aSRichard Henderson #define TS_MEM   2
2334c70fbf0aSRichard Henderson 
/*
 * Test the per-argument DEAD_ARG / SYNC_ARG bit for argument index n.
 * Both macros read a variable named 'arg_life', which must be in scope
 * at the point of use.
 */
23355a18407fSRichard Henderson #define IS_DEAD_ARG(n)   (arg_life & (DEAD_ARG << (n)))
23365a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n)))
23375a18407fSRichard Henderson 
23389c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals
23399c43b68dSAurelien Jarno    should be in memory. */
2340b83eabeaSRichard Henderson static void tcg_la_func_end(TCGContext *s)
2341c896fe29Sbellard {
2342b83eabeaSRichard Henderson     int ng = s->nb_globals;
2343b83eabeaSRichard Henderson     int nt = s->nb_temps;
2344b83eabeaSRichard Henderson     int i;
2345b83eabeaSRichard Henderson 
2346b83eabeaSRichard Henderson     for (i = 0; i < ng; ++i) {
2347b83eabeaSRichard Henderson         s->temps[i].state = TS_DEAD | TS_MEM;
2348b83eabeaSRichard Henderson     }
2349b83eabeaSRichard Henderson     for (i = ng; i < nt; ++i) {
2350b83eabeaSRichard Henderson         s->temps[i].state = TS_DEAD;
2351b83eabeaSRichard Henderson     }
2352c896fe29Sbellard }
2353c896fe29Sbellard 
23549c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals
23559c43b68dSAurelien Jarno    and local temps should be in memory. */
2356b83eabeaSRichard Henderson static void tcg_la_bb_end(TCGContext *s)
2357641d5fbeSbellard {
2358b83eabeaSRichard Henderson     int ng = s->nb_globals;
2359b83eabeaSRichard Henderson     int nt = s->nb_temps;
2360b83eabeaSRichard Henderson     int i;
2361641d5fbeSbellard 
2362b83eabeaSRichard Henderson     for (i = 0; i < ng; ++i) {
2363b83eabeaSRichard Henderson         s->temps[i].state = TS_DEAD | TS_MEM;
2364c70fbf0aSRichard Henderson     }
2365b83eabeaSRichard Henderson     for (i = ng; i < nt; ++i) {
2366b83eabeaSRichard Henderson         s->temps[i].state = (s->temps[i].temp_local
2367b83eabeaSRichard Henderson                              ? TS_DEAD | TS_MEM
2368b83eabeaSRichard Henderson                              : TS_DEAD);
2369641d5fbeSbellard     }
2370641d5fbeSbellard }
2371641d5fbeSbellard 
2372a1b3c48dSRichard Henderson /* Liveness analysis: walk the ops from last to first and record in
2373c896fe29Sbellard    op->life which arguments are dead and which outputs need a sync.
2374c896fe29Sbellard    Instructions updating only dead temporaries are removed. */
2375b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s)
2376c896fe29Sbellard {
2377c70fbf0aSRichard Henderson     int nb_globals = s->nb_globals;
237815fa08f8SRichard Henderson     TCGOp *op, *op_prev;
2379c896fe29Sbellard 
    /* Seed every temp with its end-of-function state before scanning. */
2380b83eabeaSRichard Henderson     tcg_la_func_end(s);
2381c896fe29Sbellard 
    /* Reverse walk; the _SAFE form is used because the body may remove
       the current op.  */
238215fa08f8SRichard Henderson     QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, TCGOpHead, link, op_prev) {
2383c45cb8bbSRichard Henderson         int i, nb_iargs, nb_oargs;
2384c45cb8bbSRichard Henderson         TCGOpcode opc_new, opc_new2;
2385c45cb8bbSRichard Henderson         bool have_opc_new2;
        /* Accumulates the DEAD_ARG / SYNC_ARG bits for this op.  */
2386a1b3c48dSRichard Henderson         TCGLifeData arg_life = 0;
2387b83eabeaSRichard Henderson         TCGTemp *arg_ts;
2388c45cb8bbSRichard Henderson         TCGOpcode opc = op->opc;
        /* Note: def is not refreshed when opc is rewritten further down.  */
2389c45cb8bbSRichard Henderson         const TCGOpDef *def = &tcg_op_defs[opc];
2390c45cb8bbSRichard Henderson 
2391c45cb8bbSRichard Henderson         switch (opc) {
2392c896fe29Sbellard         case INDEX_op_call:
2393c6e113f5Sbellard             {
2394c6e113f5Sbellard                 int call_flags;
2395c6e113f5Sbellard 
                /* Argument counts of a call come from the op itself; the
                   flags are read from index nb_oargs + nb_iargs + 1.  */
2396cd9090aaSRichard Henderson                 nb_oargs = TCGOP_CALLO(op);
2397cd9090aaSRichard Henderson                 nb_iargs = TCGOP_CALLI(op);
2398efee3746SRichard Henderson                 call_flags = op->args[nb_oargs + nb_iargs + 1];
2399c6e113f5Sbellard 
2400c45cb8bbSRichard Henderson                 /* pure functions can be removed if their result is unused */
240178505279SAurelien Jarno                 if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) {
2402c6e113f5Sbellard                     for (i = 0; i < nb_oargs; i++) {
2403b83eabeaSRichard Henderson                         arg_ts = arg_temp(op->args[i]);
                        /* Exactly TS_DEAD: an output that is dead but also
                           flagged TS_MEM keeps the call.  */
2404b83eabeaSRichard Henderson                         if (arg_ts->state != TS_DEAD) {
2405c6e113f5Sbellard                             goto do_not_remove_call;
2406c6e113f5Sbellard                         }
24079c43b68dSAurelien Jarno                     }
2408c45cb8bbSRichard Henderson                     goto do_remove;
2409c6e113f5Sbellard                 } else {
2410c6e113f5Sbellard                 do_not_remove_call:
2411c896fe29Sbellard 
2412c896fe29Sbellard                     /* output args are dead */
2413c896fe29Sbellard                     for (i = 0; i < nb_oargs; i++) {
2414b83eabeaSRichard Henderson                         arg_ts = arg_temp(op->args[i]);
2415b83eabeaSRichard Henderson                         if (arg_ts->state & TS_DEAD) {
2416a1b3c48dSRichard Henderson                             arg_life |= DEAD_ARG << i;
24176b64b624SAurelien Jarno                         }
2418b83eabeaSRichard Henderson                         if (arg_ts->state & TS_MEM) {
2419a1b3c48dSRichard Henderson                             arg_life |= SYNC_ARG << i;
24209c43b68dSAurelien Jarno                         }
2421b83eabeaSRichard Henderson                         arg_ts->state = TS_DEAD;
2422c896fe29Sbellard                     }
2423c896fe29Sbellard 
                    /* Neither NO_WRITE_GLOBALS nor NO_READ_GLOBALS set:
                       treat the call as possibly touching every global.  */
242478505279SAurelien Jarno                     if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS |
242578505279SAurelien Jarno                                         TCG_CALL_NO_READ_GLOBALS))) {
24269c43b68dSAurelien Jarno                         /* globals should go back to memory */
2427b83eabeaSRichard Henderson                         for (i = 0; i < nb_globals; i++) {
2428b83eabeaSRichard Henderson                             s->temps[i].state = TS_DEAD | TS_MEM;
2429b83eabeaSRichard Henderson                         }
2430c70fbf0aSRichard Henderson                     } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) {
2431c70fbf0aSRichard Henderson                         /* globals should be synced to memory */
2432c70fbf0aSRichard Henderson                         for (i = 0; i < nb_globals; i++) {
2433b83eabeaSRichard Henderson                             s->temps[i].state |= TS_MEM;
2434c70fbf0aSRichard Henderson                         }
2435b9c18f56Saurel32                     }
2436c896fe29Sbellard 
2437c19f47bfSAurelien Jarno                     /* record arguments that die in this helper */
2438866cb6cbSAurelien Jarno                     for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2439b83eabeaSRichard Henderson                         arg_ts = arg_temp(op->args[i]);
                        /* Call inputs are NULL-checked here, unlike the
                           inputs of ordinary ops further down.  */
2440b83eabeaSRichard Henderson                         if (arg_ts && arg_ts->state & TS_DEAD) {
2441a1b3c48dSRichard Henderson                             arg_life |= DEAD_ARG << i;
2442c896fe29Sbellard                         }
2443c896fe29Sbellard                     }
244467cc32ebSVeres Lajos                     /* input arguments are live for preceding opcodes */
2445c70fbf0aSRichard Henderson                     for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2446b83eabeaSRichard Henderson                         arg_ts = arg_temp(op->args[i]);
2447b83eabeaSRichard Henderson                         if (arg_ts) {
2448b83eabeaSRichard Henderson                             arg_ts->state &= ~TS_DEAD;
2449c70fbf0aSRichard Henderson                         }
2450c19f47bfSAurelien Jarno                     }
2451c6e113f5Sbellard                 }
2452c6e113f5Sbellard             }
2453c896fe29Sbellard             break;
        /* insn_start changes no liveness state; its life stays 0.  */
2454765b842aSRichard Henderson         case INDEX_op_insn_start:
2455c896fe29Sbellard             break;
24565ff9d6a4Sbellard         case INDEX_op_discard:
24575ff9d6a4Sbellard             /* mark the temporary as dead */
2458b83eabeaSRichard Henderson             arg_temp(op->args[0])->state = TS_DEAD;
24595ff9d6a4Sbellard             break;
24601305c451SRichard Henderson 
        /* Double-word add/sub: opc_new is the single-word opcode to fall
           back to when only the low half of the result is used.  */
24611305c451SRichard Henderson         case INDEX_op_add2_i32:
2462c45cb8bbSRichard Henderson             opc_new = INDEX_op_add_i32;
2463f1fae40cSRichard Henderson             goto do_addsub2;
24641305c451SRichard Henderson         case INDEX_op_sub2_i32:
2465c45cb8bbSRichard Henderson             opc_new = INDEX_op_sub_i32;
2466f1fae40cSRichard Henderson             goto do_addsub2;
2467f1fae40cSRichard Henderson         case INDEX_op_add2_i64:
2468c45cb8bbSRichard Henderson             opc_new = INDEX_op_add_i64;
2469f1fae40cSRichard Henderson             goto do_addsub2;
2470f1fae40cSRichard Henderson         case INDEX_op_sub2_i64:
2471c45cb8bbSRichard Henderson             opc_new = INDEX_op_sub_i64;
2472f1fae40cSRichard Henderson         do_addsub2:
24731305c451SRichard Henderson             nb_iargs = 4;
24741305c451SRichard Henderson             nb_oargs = 2;
24751305c451SRichard Henderson             /* Test if the high part of the operation is dead, but not
24761305c451SRichard Henderson                the low part.  The result can be optimized to a simple
24771305c451SRichard Henderson                add or sub.  This happens often for x86_64 guest when the
24781305c451SRichard Henderson                cpu mode is set to 32 bit.  */
            /* args[0] is the low output, args[1] the high output.  */
2479b83eabeaSRichard Henderson             if (arg_temp(op->args[1])->state == TS_DEAD) {
2480b83eabeaSRichard Henderson                 if (arg_temp(op->args[0])->state == TS_DEAD) {
24811305c451SRichard Henderson                     goto do_remove;
24821305c451SRichard Henderson                 }
2483c45cb8bbSRichard Henderson                 /* Replace the opcode and adjust the args in place,
2484c45cb8bbSRichard Henderson                    leaving 3 unused args at the end.  */
2485c45cb8bbSRichard Henderson                 op->opc = opc = opc_new;
                /* Keep args[0]; inputs become old args[2] and args[4].  */
2486efee3746SRichard Henderson                 op->args[1] = op->args[2];
2487efee3746SRichard Henderson                 op->args[2] = op->args[4];
24881305c451SRichard Henderson                 /* Fall through and mark the single-word operation live.  */
24891305c451SRichard Henderson                 nb_iargs = 2;
24901305c451SRichard Henderson                 nb_oargs = 1;
24911305c451SRichard Henderson             }
24921305c451SRichard Henderson             goto do_not_remove;
24931305c451SRichard Henderson 
        /* Double-word multiply: opc_new yields the low half only, opc_new2
           the high half only; have_opc_new2 says whether the latter is
           available on this target.  */
24941414968aSRichard Henderson         case INDEX_op_mulu2_i32:
2495c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i32;
2496c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_muluh_i32;
2497c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_muluh_i32;
249803271524SRichard Henderson             goto do_mul2;
2499f1fae40cSRichard Henderson         case INDEX_op_muls2_i32:
2500c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i32;
2501c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_mulsh_i32;
2502c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_mulsh_i32;
2503f1fae40cSRichard Henderson             goto do_mul2;
2504f1fae40cSRichard Henderson         case INDEX_op_mulu2_i64:
2505c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i64;
2506c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_muluh_i64;
2507c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_muluh_i64;
250803271524SRichard Henderson             goto do_mul2;
2509f1fae40cSRichard Henderson         case INDEX_op_muls2_i64:
2510c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i64;
2511c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_mulsh_i64;
2512c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_mulsh_i64;
251303271524SRichard Henderson             goto do_mul2;
2514f1fae40cSRichard Henderson         do_mul2:
25151414968aSRichard Henderson             nb_iargs = 2;
25161414968aSRichard Henderson             nb_oargs = 2;
2517b83eabeaSRichard Henderson             if (arg_temp(op->args[1])->state == TS_DEAD) {
2518b83eabeaSRichard Henderson                 if (arg_temp(op->args[0])->state == TS_DEAD) {
251903271524SRichard Henderson                     /* Both parts of the operation are dead.  */
25201414968aSRichard Henderson                     goto do_remove;
25211414968aSRichard Henderson                 }
252203271524SRichard Henderson                 /* The high part of the operation is dead; generate the low. */
2523c45cb8bbSRichard Henderson                 op->opc = opc = opc_new;
2524efee3746SRichard Henderson                 op->args[1] = op->args[2];
2525efee3746SRichard Henderson                 op->args[2] = op->args[3];
2526b83eabeaSRichard Henderson             } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) {
252703271524SRichard Henderson                 /* The low part of the operation is dead; generate the high. */
2528c45cb8bbSRichard Henderson                 op->opc = opc = opc_new2;
2529efee3746SRichard Henderson                 op->args[0] = op->args[1];
2530efee3746SRichard Henderson                 op->args[1] = op->args[2];
2531efee3746SRichard Henderson                 op->args[2] = op->args[3];
253203271524SRichard Henderson             } else {
                /* Keep the two-output form unchanged.  */
253303271524SRichard Henderson                 goto do_not_remove;
253403271524SRichard Henderson             }
253503271524SRichard Henderson             /* Mark the single-word operation live.  */
25361414968aSRichard Henderson             nb_oargs = 1;
25371414968aSRichard Henderson             goto do_not_remove;
25381414968aSRichard Henderson 
2539c896fe29Sbellard         default:
25401305c451SRichard Henderson             /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
2541c896fe29Sbellard             nb_iargs = def->nb_iargs;
2542c896fe29Sbellard             nb_oargs = def->nb_oargs;
2543c896fe29Sbellard 
2544c896fe29Sbellard             /* Test if the operation can be removed because all
25455ff9d6a4Sbellard                its outputs are dead. We assume that nb_oargs == 0
25465ff9d6a4Sbellard                implies side effects */
25475ff9d6a4Sbellard             if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) {
2548c896fe29Sbellard                 for (i = 0; i < nb_oargs; i++) {
2549b83eabeaSRichard Henderson                     if (arg_temp(op->args[i])->state != TS_DEAD) {
2550c896fe29Sbellard                         goto do_not_remove;
2551c896fe29Sbellard                     }
25529c43b68dSAurelien Jarno                 }
            /* Also reached by goto from the call, add2/sub2 and mul2
               cases above.  */
25531305c451SRichard Henderson             do_remove:
25540c627cdcSRichard Henderson                 tcg_op_remove(s, op);
2555c896fe29Sbellard             } else {
            /* Also reached by goto from the add2/sub2 and mul2 cases, with
               nb_iargs/nb_oargs possibly narrowed to the rewritten op.  */
2556c896fe29Sbellard             do_not_remove:
2557c896fe29Sbellard                 /* output args are dead */
2558c896fe29Sbellard                 for (i = 0; i < nb_oargs; i++) {
2559b83eabeaSRichard Henderson                     arg_ts = arg_temp(op->args[i]);
2560b83eabeaSRichard Henderson                     if (arg_ts->state & TS_DEAD) {
2561a1b3c48dSRichard Henderson                         arg_life |= DEAD_ARG << i;
25626b64b624SAurelien Jarno                     }
2563b83eabeaSRichard Henderson                     if (arg_ts->state & TS_MEM) {
2564a1b3c48dSRichard Henderson                         arg_life |= SYNC_ARG << i;
25659c43b68dSAurelien Jarno                     }
2566b83eabeaSRichard Henderson                     arg_ts->state = TS_DEAD;
2567c896fe29Sbellard                 }
2568c896fe29Sbellard 
2569c896fe29Sbellard                 /* if end of basic block, update */
2570c896fe29Sbellard                 if (def->flags & TCG_OPF_BB_END) {
2571b83eabeaSRichard Henderson                     tcg_la_bb_end(s);
25723d5c5f87SAurelien Jarno                 } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
25733d5c5f87SAurelien Jarno                     /* globals should be synced to memory */
2574c70fbf0aSRichard Henderson                     for (i = 0; i < nb_globals; i++) {
2575b83eabeaSRichard Henderson                         s->temps[i].state |= TS_MEM;
2576c70fbf0aSRichard Henderson                     }
2577c896fe29Sbellard                 }
2578c896fe29Sbellard 
2579c19f47bfSAurelien Jarno                 /* record arguments that die in this opcode */
2580866cb6cbSAurelien Jarno                 for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
2581b83eabeaSRichard Henderson                     arg_ts = arg_temp(op->args[i]);
2582b83eabeaSRichard Henderson                     if (arg_ts->state & TS_DEAD) {
2583a1b3c48dSRichard Henderson                         arg_life |= DEAD_ARG << i;
2584c896fe29Sbellard                     }
2585c19f47bfSAurelien Jarno                 }
258667cc32ebSVeres Lajos                 /* input arguments are live for preceding opcodes */
2587c19f47bfSAurelien Jarno                 for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
2588b83eabeaSRichard Henderson                     arg_temp(op->args[i])->state &= ~TS_DEAD;
2589c896fe29Sbellard                 }
2590c896fe29Sbellard             }
2591c896fe29Sbellard             break;
2592c896fe29Sbellard         }
        /* Stored for every op, including one just passed to
           tcg_op_remove(); on that path arg_life is still 0.  */
2593bee158cbSRichard Henderson         op->life = arg_life;
2594c896fe29Sbellard     }
25951ff0a2c5SEvgeny Voevodin }
2596c896fe29Sbellard 
25975a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries.  */
2598b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s)
25995a18407fSRichard Henderson {
26005a18407fSRichard Henderson     int nb_globals = s->nb_globals;
260115fa08f8SRichard Henderson     int nb_temps, i;
26025a18407fSRichard Henderson     bool changes = false;
260315fa08f8SRichard Henderson     TCGOp *op, *op_next;
26045a18407fSRichard Henderson 
26055a18407fSRichard Henderson     /* Create a temporary for each indirect global.  */
26065a18407fSRichard Henderson     for (i = 0; i < nb_globals; ++i) {
26075a18407fSRichard Henderson         TCGTemp *its = &s->temps[i];
26085a18407fSRichard Henderson         if (its->indirect_reg) {
26095a18407fSRichard Henderson             TCGTemp *dts = tcg_temp_alloc(s);
26105a18407fSRichard Henderson             dts->type = its->type;
26115a18407fSRichard Henderson             dts->base_type = its->base_type;
2612b83eabeaSRichard Henderson             its->state_ptr = dts;
2613b83eabeaSRichard Henderson         } else {
2614b83eabeaSRichard Henderson             its->state_ptr = NULL;
26155a18407fSRichard Henderson         }
2616b83eabeaSRichard Henderson         /* All globals begin dead.  */
2617b83eabeaSRichard Henderson         its->state = TS_DEAD;
26185a18407fSRichard Henderson     }
2619b83eabeaSRichard Henderson     for (nb_temps = s->nb_temps; i < nb_temps; ++i) {
2620b83eabeaSRichard Henderson         TCGTemp *its = &s->temps[i];
2621b83eabeaSRichard Henderson         its->state_ptr = NULL;
2622b83eabeaSRichard Henderson         its->state = TS_DEAD;
2623b83eabeaSRichard Henderson     }
26245a18407fSRichard Henderson 
262515fa08f8SRichard Henderson     QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) {
26265a18407fSRichard Henderson         TCGOpcode opc = op->opc;
26275a18407fSRichard Henderson         const TCGOpDef *def = &tcg_op_defs[opc];
26285a18407fSRichard Henderson         TCGLifeData arg_life = op->life;
26295a18407fSRichard Henderson         int nb_iargs, nb_oargs, call_flags;
2630b83eabeaSRichard Henderson         TCGTemp *arg_ts, *dir_ts;
26315a18407fSRichard Henderson 
26325a18407fSRichard Henderson         if (opc == INDEX_op_call) {
2633cd9090aaSRichard Henderson             nb_oargs = TCGOP_CALLO(op);
2634cd9090aaSRichard Henderson             nb_iargs = TCGOP_CALLI(op);
2635efee3746SRichard Henderson             call_flags = op->args[nb_oargs + nb_iargs + 1];
26365a18407fSRichard Henderson         } else {
26375a18407fSRichard Henderson             nb_iargs = def->nb_iargs;
26385a18407fSRichard Henderson             nb_oargs = def->nb_oargs;
26395a18407fSRichard Henderson 
26405a18407fSRichard Henderson             /* Set flags similar to how calls require.  */
26415a18407fSRichard Henderson             if (def->flags & TCG_OPF_BB_END) {
26425a18407fSRichard Henderson                 /* Like writing globals: save_globals */
26435a18407fSRichard Henderson                 call_flags = 0;
26445a18407fSRichard Henderson             } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
26455a18407fSRichard Henderson                 /* Like reading globals: sync_globals */
26465a18407fSRichard Henderson                 call_flags = TCG_CALL_NO_WRITE_GLOBALS;
26475a18407fSRichard Henderson             } else {
26485a18407fSRichard Henderson                 /* No effect on globals.  */
26495a18407fSRichard Henderson                 call_flags = (TCG_CALL_NO_READ_GLOBALS |
26505a18407fSRichard Henderson                               TCG_CALL_NO_WRITE_GLOBALS);
26515a18407fSRichard Henderson             }
26525a18407fSRichard Henderson         }
26535a18407fSRichard Henderson 
26545a18407fSRichard Henderson         /* Make sure that input arguments are available.  */
26555a18407fSRichard Henderson         for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2656b83eabeaSRichard Henderson             arg_ts = arg_temp(op->args[i]);
2657b83eabeaSRichard Henderson             if (arg_ts) {
2658b83eabeaSRichard Henderson                 dir_ts = arg_ts->state_ptr;
2659b83eabeaSRichard Henderson                 if (dir_ts && arg_ts->state == TS_DEAD) {
2660b83eabeaSRichard Henderson                     TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32
26615a18407fSRichard Henderson                                       ? INDEX_op_ld_i32
26625a18407fSRichard Henderson                                       : INDEX_op_ld_i64);
2663ac1043f6SEmilio G. Cota                     TCGOp *lop = tcg_op_insert_before(s, op, lopc);
26645a18407fSRichard Henderson 
2665b83eabeaSRichard Henderson                     lop->args[0] = temp_arg(dir_ts);
2666b83eabeaSRichard Henderson                     lop->args[1] = temp_arg(arg_ts->mem_base);
2667b83eabeaSRichard Henderson                     lop->args[2] = arg_ts->mem_offset;
26685a18407fSRichard Henderson 
26695a18407fSRichard Henderson                     /* Loaded, but synced with memory.  */
2670b83eabeaSRichard Henderson                     arg_ts->state = TS_MEM;
26715a18407fSRichard Henderson                 }
26725a18407fSRichard Henderson             }
26735a18407fSRichard Henderson         }
26745a18407fSRichard Henderson 
26755a18407fSRichard Henderson         /* Perform input replacement, and mark inputs that became dead.
26765a18407fSRichard Henderson            No action is required except keeping temp_state up to date
26775a18407fSRichard Henderson            so that we reload when needed.  */
26785a18407fSRichard Henderson         for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2679b83eabeaSRichard Henderson             arg_ts = arg_temp(op->args[i]);
2680b83eabeaSRichard Henderson             if (arg_ts) {
2681b83eabeaSRichard Henderson                 dir_ts = arg_ts->state_ptr;
2682b83eabeaSRichard Henderson                 if (dir_ts) {
2683b83eabeaSRichard Henderson                     op->args[i] = temp_arg(dir_ts);
26845a18407fSRichard Henderson                     changes = true;
26855a18407fSRichard Henderson                     if (IS_DEAD_ARG(i)) {
2686b83eabeaSRichard Henderson                         arg_ts->state = TS_DEAD;
26875a18407fSRichard Henderson                     }
26885a18407fSRichard Henderson                 }
26895a18407fSRichard Henderson             }
26905a18407fSRichard Henderson         }
26915a18407fSRichard Henderson 
26925a18407fSRichard Henderson         /* Liveness analysis should ensure that the following are
26935a18407fSRichard Henderson            all correct, for call sites and basic block end points.  */
26945a18407fSRichard Henderson         if (call_flags & TCG_CALL_NO_READ_GLOBALS) {
26955a18407fSRichard Henderson             /* Nothing to do */
26965a18407fSRichard Henderson         } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) {
26975a18407fSRichard Henderson             for (i = 0; i < nb_globals; ++i) {
26985a18407fSRichard Henderson                 /* Liveness should see that globals are synced back,
26995a18407fSRichard Henderson                    that is, either TS_DEAD or TS_MEM.  */
2700b83eabeaSRichard Henderson                 arg_ts = &s->temps[i];
2701b83eabeaSRichard Henderson                 tcg_debug_assert(arg_ts->state_ptr == 0
2702b83eabeaSRichard Henderson                                  || arg_ts->state != 0);
27035a18407fSRichard Henderson             }
27045a18407fSRichard Henderson         } else {
27055a18407fSRichard Henderson             for (i = 0; i < nb_globals; ++i) {
27065a18407fSRichard Henderson                 /* Liveness should see that globals are saved back,
27075a18407fSRichard Henderson                    that is, TS_DEAD, waiting to be reloaded.  */
2708b83eabeaSRichard Henderson                 arg_ts = &s->temps[i];
2709b83eabeaSRichard Henderson                 tcg_debug_assert(arg_ts->state_ptr == 0
2710b83eabeaSRichard Henderson                                  || arg_ts->state == TS_DEAD);
27115a18407fSRichard Henderson             }
27125a18407fSRichard Henderson         }
27135a18407fSRichard Henderson 
27145a18407fSRichard Henderson         /* Outputs become available.  */
27155a18407fSRichard Henderson         for (i = 0; i < nb_oargs; i++) {
2716b83eabeaSRichard Henderson             arg_ts = arg_temp(op->args[i]);
2717b83eabeaSRichard Henderson             dir_ts = arg_ts->state_ptr;
2718b83eabeaSRichard Henderson             if (!dir_ts) {
27195a18407fSRichard Henderson                 continue;
27205a18407fSRichard Henderson             }
2721b83eabeaSRichard Henderson             op->args[i] = temp_arg(dir_ts);
27225a18407fSRichard Henderson             changes = true;
27235a18407fSRichard Henderson 
27245a18407fSRichard Henderson             /* The output is now live and modified.  */
2725b83eabeaSRichard Henderson             arg_ts->state = 0;
27265a18407fSRichard Henderson 
27275a18407fSRichard Henderson             /* Sync outputs upon their last write.  */
27285a18407fSRichard Henderson             if (NEED_SYNC_ARG(i)) {
2729b83eabeaSRichard Henderson                 TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32
27305a18407fSRichard Henderson                                   ? INDEX_op_st_i32
27315a18407fSRichard Henderson                                   : INDEX_op_st_i64);
2732ac1043f6SEmilio G. Cota                 TCGOp *sop = tcg_op_insert_after(s, op, sopc);
27335a18407fSRichard Henderson 
2734b83eabeaSRichard Henderson                 sop->args[0] = temp_arg(dir_ts);
2735b83eabeaSRichard Henderson                 sop->args[1] = temp_arg(arg_ts->mem_base);
2736b83eabeaSRichard Henderson                 sop->args[2] = arg_ts->mem_offset;
27375a18407fSRichard Henderson 
2738b83eabeaSRichard Henderson                 arg_ts->state = TS_MEM;
27395a18407fSRichard Henderson             }
27405a18407fSRichard Henderson             /* Drop outputs that are dead.  */
27415a18407fSRichard Henderson             if (IS_DEAD_ARG(i)) {
2742b83eabeaSRichard Henderson                 arg_ts->state = TS_DEAD;
27435a18407fSRichard Henderson             }
27445a18407fSRichard Henderson         }
27455a18407fSRichard Henderson     }
27465a18407fSRichard Henderson 
27475a18407fSRichard Henderson     return changes;
27485a18407fSRichard Henderson }
27495a18407fSRichard Henderson 
27508d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG
2751c896fe29Sbellard static void dump_regs(TCGContext *s)
2752c896fe29Sbellard {
2753c896fe29Sbellard     TCGTemp *ts;
2754c896fe29Sbellard     int i;
2755c896fe29Sbellard     char buf[64];
2756c896fe29Sbellard 
2757c896fe29Sbellard     for(i = 0; i < s->nb_temps; i++) {
2758c896fe29Sbellard         ts = &s->temps[i];
275943439139SRichard Henderson         printf("  %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts));
2760c896fe29Sbellard         switch(ts->val_type) {
2761c896fe29Sbellard         case TEMP_VAL_REG:
2762c896fe29Sbellard             printf("%s", tcg_target_reg_names[ts->reg]);
2763c896fe29Sbellard             break;
2764c896fe29Sbellard         case TEMP_VAL_MEM:
2765b3a62939SRichard Henderson             printf("%d(%s)", (int)ts->mem_offset,
2766b3a62939SRichard Henderson                    tcg_target_reg_names[ts->mem_base->reg]);
2767c896fe29Sbellard             break;
2768c896fe29Sbellard         case TEMP_VAL_CONST:
2769c896fe29Sbellard             printf("$0x%" TCG_PRIlx, ts->val);
2770c896fe29Sbellard             break;
2771c896fe29Sbellard         case TEMP_VAL_DEAD:
2772c896fe29Sbellard             printf("D");
2773c896fe29Sbellard             break;
2774c896fe29Sbellard         default:
2775c896fe29Sbellard             printf("???");
2776c896fe29Sbellard             break;
2777c896fe29Sbellard         }
2778c896fe29Sbellard         printf("\n");
2779c896fe29Sbellard     }
2780c896fe29Sbellard 
2781c896fe29Sbellard     for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
2782f8b2f202SRichard Henderson         if (s->reg_to_temp[i] != NULL) {
2783c896fe29Sbellard             printf("%s: %s\n",
2784c896fe29Sbellard                    tcg_target_reg_names[i],
2785f8b2f202SRichard Henderson                    tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i]));
2786c896fe29Sbellard         }
2787c896fe29Sbellard     }
2788c896fe29Sbellard }
2789c896fe29Sbellard 
2790c896fe29Sbellard static void check_regs(TCGContext *s)
2791c896fe29Sbellard {
2792869938aeSRichard Henderson     int reg;
2793b6638662SRichard Henderson     int k;
2794c896fe29Sbellard     TCGTemp *ts;
2795c896fe29Sbellard     char buf[64];
2796c896fe29Sbellard 
2797c896fe29Sbellard     for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
2798f8b2f202SRichard Henderson         ts = s->reg_to_temp[reg];
2799f8b2f202SRichard Henderson         if (ts != NULL) {
2800f8b2f202SRichard Henderson             if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) {
2801c896fe29Sbellard                 printf("Inconsistency for register %s:\n",
2802c896fe29Sbellard                        tcg_target_reg_names[reg]);
2803b03cce8eSbellard                 goto fail;
2804c896fe29Sbellard             }
2805c896fe29Sbellard         }
2806c896fe29Sbellard     }
2807c896fe29Sbellard     for (k = 0; k < s->nb_temps; k++) {
2808c896fe29Sbellard         ts = &s->temps[k];
2809f8b2f202SRichard Henderson         if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg
2810f8b2f202SRichard Henderson             && s->reg_to_temp[ts->reg] != ts) {
2811c896fe29Sbellard             printf("Inconsistency for temp %s:\n",
2812f8b2f202SRichard Henderson                    tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts));
2813b03cce8eSbellard         fail:
2814c896fe29Sbellard             printf("reg state:\n");
2815c896fe29Sbellard             dump_regs(s);
2816c896fe29Sbellard             tcg_abort();
2817c896fe29Sbellard         }
2818c896fe29Sbellard     }
2819c896fe29Sbellard }
2820c896fe29Sbellard #endif
2821c896fe29Sbellard 
28222272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts)
2823c896fe29Sbellard {
28249b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64)
28259b9c37c3SRichard Henderson     /* Sparc64 stack is accessed with offset of 2047 */
2826b591dc59SBlue Swirl     s->current_frame_offset = (s->current_frame_offset +
2827b591dc59SBlue Swirl                                (tcg_target_long)sizeof(tcg_target_long) - 1) &
2828b591dc59SBlue Swirl         ~(sizeof(tcg_target_long) - 1);
2829f44c9960SBlue Swirl #endif
2830b591dc59SBlue Swirl     if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) >
2831b591dc59SBlue Swirl         s->frame_end) {
28325ff9d6a4Sbellard         tcg_abort();
2833b591dc59SBlue Swirl     }
2834c896fe29Sbellard     ts->mem_offset = s->current_frame_offset;
2835b3a62939SRichard Henderson     ts->mem_base = s->frame_temp;
2836c896fe29Sbellard     ts->mem_allocated = 1;
2837e2c6d1b4SRichard Henderson     s->current_frame_offset += sizeof(tcg_target_long);
2838c896fe29Sbellard }
2839c896fe29Sbellard 
2840b3915dbbSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet);
2841b3915dbbSRichard Henderson 
284259d7c14eSRichard Henderson /* Mark a temporary as free or dead.  If 'free_or_dead' is negative,
284359d7c14eSRichard Henderson    mark it free; otherwise mark it dead.  */
284459d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead)
2845c896fe29Sbellard {
284659d7c14eSRichard Henderson     if (ts->fixed_reg) {
284759d7c14eSRichard Henderson         return;
284859d7c14eSRichard Henderson     }
284959d7c14eSRichard Henderson     if (ts->val_type == TEMP_VAL_REG) {
285059d7c14eSRichard Henderson         s->reg_to_temp[ts->reg] = NULL;
285159d7c14eSRichard Henderson     }
285259d7c14eSRichard Henderson     ts->val_type = (free_or_dead < 0
285359d7c14eSRichard Henderson                     || ts->temp_local
2854fa477d25SRichard Henderson                     || ts->temp_global
285559d7c14eSRichard Henderson                     ? TEMP_VAL_MEM : TEMP_VAL_DEAD);
285659d7c14eSRichard Henderson }
2857c896fe29Sbellard 
285859d7c14eSRichard Henderson /* Mark a temporary as dead.  */
285959d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts)
286059d7c14eSRichard Henderson {
286159d7c14eSRichard Henderson     temp_free_or_dead(s, ts, 1);
286259d7c14eSRichard Henderson }
286359d7c14eSRichard Henderson 
286459d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary
286559d7c14eSRichard Henderson    registers needs to be allocated to store a constant.  If 'free_or_dead'
286659d7c14eSRichard Henderson    is non-zero, subsequently release the temporary; if it is positive, the
286759d7c14eSRichard Henderson    temp is dead; if it is negative, the temp is free.  */
286859d7c14eSRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts,
286959d7c14eSRichard Henderson                       TCGRegSet allocated_regs, int free_or_dead)
287059d7c14eSRichard Henderson {
287159d7c14eSRichard Henderson     if (ts->fixed_reg) {
287259d7c14eSRichard Henderson         return;
287359d7c14eSRichard Henderson     }
287459d7c14eSRichard Henderson     if (!ts->mem_coherent) {
28757f6ceedfSAurelien Jarno         if (!ts->mem_allocated) {
28762272e4a7SRichard Henderson             temp_allocate_frame(s, ts);
287759d7c14eSRichard Henderson         }
287859d7c14eSRichard Henderson         switch (ts->val_type) {
287959d7c14eSRichard Henderson         case TEMP_VAL_CONST:
288059d7c14eSRichard Henderson             /* If we're going to free the temp immediately, then we won't
288159d7c14eSRichard Henderson                require it later in a register, so attempt to store the
288259d7c14eSRichard Henderson                constant to memory directly.  */
288359d7c14eSRichard Henderson             if (free_or_dead
288459d7c14eSRichard Henderson                 && tcg_out_sti(s, ts->type, ts->val,
288559d7c14eSRichard Henderson                                ts->mem_base->reg, ts->mem_offset)) {
288659d7c14eSRichard Henderson                 break;
288759d7c14eSRichard Henderson             }
288859d7c14eSRichard Henderson             temp_load(s, ts, tcg_target_available_regs[ts->type],
288959d7c14eSRichard Henderson                       allocated_regs);
289059d7c14eSRichard Henderson             /* fallthrough */
289159d7c14eSRichard Henderson 
289259d7c14eSRichard Henderson         case TEMP_VAL_REG:
289359d7c14eSRichard Henderson             tcg_out_st(s, ts->type, ts->reg,
289459d7c14eSRichard Henderson                        ts->mem_base->reg, ts->mem_offset);
289559d7c14eSRichard Henderson             break;
289659d7c14eSRichard Henderson 
289759d7c14eSRichard Henderson         case TEMP_VAL_MEM:
289859d7c14eSRichard Henderson             break;
289959d7c14eSRichard Henderson 
290059d7c14eSRichard Henderson         case TEMP_VAL_DEAD:
290159d7c14eSRichard Henderson         default:
290259d7c14eSRichard Henderson             tcg_abort();
2903c896fe29Sbellard         }
29047f6ceedfSAurelien Jarno         ts->mem_coherent = 1;
29057f6ceedfSAurelien Jarno     }
290659d7c14eSRichard Henderson     if (free_or_dead) {
290759d7c14eSRichard Henderson         temp_free_or_dead(s, ts, free_or_dead);
290859d7c14eSRichard Henderson     }
290959d7c14eSRichard Henderson }
29107f6ceedfSAurelien Jarno 
29117f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */
2912b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs)
29137f6ceedfSAurelien Jarno {
2914f8b2f202SRichard Henderson     TCGTemp *ts = s->reg_to_temp[reg];
2915f8b2f202SRichard Henderson     if (ts != NULL) {
291659d7c14eSRichard Henderson         temp_sync(s, ts, allocated_regs, -1);
2917c896fe29Sbellard     }
2918c896fe29Sbellard }
2919c896fe29Sbellard 
2920*b016486eSRichard Henderson /**
2921*b016486eSRichard Henderson  * tcg_reg_alloc:
2922*b016486eSRichard Henderson  * @required_regs: Set of registers in which we must allocate.
2923*b016486eSRichard Henderson  * @allocated_regs: Set of registers which must be avoided.
2924*b016486eSRichard Henderson  * @preferred_regs: Set of registers we should prefer.
2925*b016486eSRichard Henderson  * @rev: True if we search the registers in "indirect" order.
2926*b016486eSRichard Henderson  *
2927*b016486eSRichard Henderson  * The allocated register must be in @required_regs & ~@allocated_regs,
2928*b016486eSRichard Henderson  * but if we can put it in @preferred_regs we may save a move later.
2929*b016486eSRichard Henderson  */
2930*b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs,
2931*b016486eSRichard Henderson                             TCGRegSet allocated_regs,
2932*b016486eSRichard Henderson                             TCGRegSet preferred_regs, bool rev)
2933c896fe29Sbellard {
2934*b016486eSRichard Henderson     int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order);
2935*b016486eSRichard Henderson     TCGRegSet reg_ct[2];
293691478cefSRichard Henderson     const int *order;
2937c896fe29Sbellard 
2938*b016486eSRichard Henderson     reg_ct[1] = required_regs & ~allocated_regs;
2939*b016486eSRichard Henderson     tcg_debug_assert(reg_ct[1] != 0);
2940*b016486eSRichard Henderson     reg_ct[0] = reg_ct[1] & preferred_regs;
2941*b016486eSRichard Henderson 
2942*b016486eSRichard Henderson     /* Skip the preferred_regs option if it cannot be satisfied,
2943*b016486eSRichard Henderson        or if the preference made no difference.  */
2944*b016486eSRichard Henderson     f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1];
2945*b016486eSRichard Henderson 
294691478cefSRichard Henderson     order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order;
2947c896fe29Sbellard 
2948*b016486eSRichard Henderson     /* Try free registers, preferences first.  */
2949*b016486eSRichard Henderson     for (j = f; j < 2; j++) {
2950*b016486eSRichard Henderson         TCGRegSet set = reg_ct[j];
2951*b016486eSRichard Henderson 
2952*b016486eSRichard Henderson         if (tcg_regset_single(set)) {
2953*b016486eSRichard Henderson             /* One register in the set.  */
2954*b016486eSRichard Henderson             TCGReg reg = tcg_regset_first(set);
2955*b016486eSRichard Henderson             if (s->reg_to_temp[reg] == NULL) {
2956c896fe29Sbellard                 return reg;
2957c896fe29Sbellard             }
2958*b016486eSRichard Henderson         } else {
295991478cefSRichard Henderson             for (i = 0; i < n; i++) {
2960*b016486eSRichard Henderson                 TCGReg reg = order[i];
2961*b016486eSRichard Henderson                 if (s->reg_to_temp[reg] == NULL &&
2962*b016486eSRichard Henderson                     tcg_regset_test_reg(set, reg)) {
2963*b016486eSRichard Henderson                     return reg;
2964*b016486eSRichard Henderson                 }
2965*b016486eSRichard Henderson             }
2966*b016486eSRichard Henderson         }
2967*b016486eSRichard Henderson     }
2968*b016486eSRichard Henderson 
2969*b016486eSRichard Henderson     /* We must spill something.  */
2970*b016486eSRichard Henderson     for (j = f; j < 2; j++) {
2971*b016486eSRichard Henderson         TCGRegSet set = reg_ct[j];
2972*b016486eSRichard Henderson 
2973*b016486eSRichard Henderson         if (tcg_regset_single(set)) {
2974*b016486eSRichard Henderson             /* One register in the set.  */
2975*b016486eSRichard Henderson             TCGReg reg = tcg_regset_first(set);
2976b3915dbbSRichard Henderson             tcg_reg_free(s, reg, allocated_regs);
2977c896fe29Sbellard             return reg;
2978*b016486eSRichard Henderson         } else {
2979*b016486eSRichard Henderson             for (i = 0; i < n; i++) {
2980*b016486eSRichard Henderson                 TCGReg reg = order[i];
2981*b016486eSRichard Henderson                 if (tcg_regset_test_reg(set, reg)) {
2982*b016486eSRichard Henderson                     tcg_reg_free(s, reg, allocated_regs);
2983*b016486eSRichard Henderson                     return reg;
2984*b016486eSRichard Henderson                 }
2985*b016486eSRichard Henderson             }
2986c896fe29Sbellard         }
2987c896fe29Sbellard     }
2988c896fe29Sbellard 
2989c896fe29Sbellard     tcg_abort();
2990c896fe29Sbellard }
2991c896fe29Sbellard 
299240ae5c62SRichard Henderson /* Make sure the temporary is in a register.  If needed, allocate the register
299340ae5c62SRichard Henderson    from DESIRED while avoiding ALLOCATED.  */
299440ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs,
299540ae5c62SRichard Henderson                       TCGRegSet allocated_regs)
299640ae5c62SRichard Henderson {
299740ae5c62SRichard Henderson     TCGReg reg;
299840ae5c62SRichard Henderson 
299940ae5c62SRichard Henderson     switch (ts->val_type) {
300040ae5c62SRichard Henderson     case TEMP_VAL_REG:
300140ae5c62SRichard Henderson         return;
300240ae5c62SRichard Henderson     case TEMP_VAL_CONST:
3003*b016486eSRichard Henderson         reg = tcg_reg_alloc(s, desired_regs, allocated_regs,
3004*b016486eSRichard Henderson                             0, ts->indirect_base);
300540ae5c62SRichard Henderson         tcg_out_movi(s, ts->type, reg, ts->val);
300640ae5c62SRichard Henderson         ts->mem_coherent = 0;
300740ae5c62SRichard Henderson         break;
300840ae5c62SRichard Henderson     case TEMP_VAL_MEM:
3009*b016486eSRichard Henderson         reg = tcg_reg_alloc(s, desired_regs, allocated_regs,
3010*b016486eSRichard Henderson                             0, ts->indirect_base);
301140ae5c62SRichard Henderson         tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset);
301240ae5c62SRichard Henderson         ts->mem_coherent = 1;
301340ae5c62SRichard Henderson         break;
301440ae5c62SRichard Henderson     case TEMP_VAL_DEAD:
301540ae5c62SRichard Henderson     default:
301640ae5c62SRichard Henderson         tcg_abort();
301740ae5c62SRichard Henderson     }
301840ae5c62SRichard Henderson     ts->reg = reg;
301940ae5c62SRichard Henderson     ts->val_type = TEMP_VAL_REG;
302040ae5c62SRichard Henderson     s->reg_to_temp[reg] = ts;
302140ae5c62SRichard Henderson }
302240ae5c62SRichard Henderson 
302359d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a
3024e8996ee0Sbellard    temporary registers needs to be allocated to store a constant.  */
302559d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs)
30261ad80729SAurelien Jarno {
30272c0366f0SAurelien Jarno     /* The liveness analysis already ensures that globals are back
3028eabb7b91SAurelien Jarno        in memory. Keep an tcg_debug_assert for safety. */
3029f8bf00f1SRichard Henderson     tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg);
30301ad80729SAurelien Jarno }
30311ad80729SAurelien Jarno 
30329814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be
3033641d5fbeSbellard    modified be the following code. 'allocated_regs' is used in case a
3034641d5fbeSbellard    temporary registers needs to be allocated to store a constant. */
3035641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs)
3036641d5fbeSbellard {
3037ac3b8891SRichard Henderson     int i, n;
3038641d5fbeSbellard 
3039ac3b8891SRichard Henderson     for (i = 0, n = s->nb_globals; i < n; i++) {
3040b13eb728SRichard Henderson         temp_save(s, &s->temps[i], allocated_regs);
3041641d5fbeSbellard     }
3042e5097dc8Sbellard }
3043e5097dc8Sbellard 
30443d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be
30453d5c5f87SAurelien Jarno    read by the following code. 'allocated_regs' is used in case a
30463d5c5f87SAurelien Jarno    temporary registers needs to be allocated to store a constant. */
30473d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs)
30483d5c5f87SAurelien Jarno {
3049ac3b8891SRichard Henderson     int i, n;
30503d5c5f87SAurelien Jarno 
3051ac3b8891SRichard Henderson     for (i = 0, n = s->nb_globals; i < n; i++) {
305212b9b11aSRichard Henderson         TCGTemp *ts = &s->temps[i];
305312b9b11aSRichard Henderson         tcg_debug_assert(ts->val_type != TEMP_VAL_REG
305412b9b11aSRichard Henderson                          || ts->fixed_reg
305512b9b11aSRichard Henderson                          || ts->mem_coherent);
30563d5c5f87SAurelien Jarno     }
30573d5c5f87SAurelien Jarno }
30583d5c5f87SAurelien Jarno 
3059e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and
3060e8996ee0Sbellard    all globals are stored at their canonical location. */
3061e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs)
3062e5097dc8Sbellard {
3063e5097dc8Sbellard     int i;
3064e5097dc8Sbellard 
3065c896fe29Sbellard     for (i = s->nb_globals; i < s->nb_temps; i++) {
3066b13eb728SRichard Henderson         TCGTemp *ts = &s->temps[i];
3067641d5fbeSbellard         if (ts->temp_local) {
3068b13eb728SRichard Henderson             temp_save(s, ts, allocated_regs);
3069641d5fbeSbellard         } else {
30702c0366f0SAurelien Jarno             /* The liveness analysis already ensures that temps are dead.
3071eabb7b91SAurelien Jarno                Keep an tcg_debug_assert for safety. */
3072eabb7b91SAurelien Jarno             tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD);
3073c896fe29Sbellard         }
3074641d5fbeSbellard     }
3075e8996ee0Sbellard 
3076e8996ee0Sbellard     save_globals(s, allocated_regs);
3077c896fe29Sbellard }
3078c896fe29Sbellard 
30790fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots,
30800fe4fca4SPaolo Bonzini                                   tcg_target_ulong val, TCGLifeData arg_life)
3081e8996ee0Sbellard {
3082e8996ee0Sbellard     if (ots->fixed_reg) {
308359d7c14eSRichard Henderson         /* For fixed registers, we do not do any constant propagation.  */
3084e8996ee0Sbellard         tcg_out_movi(s, ots->type, ots->reg, val);
308559d7c14eSRichard Henderson         return;
308659d7c14eSRichard Henderson     }
308759d7c14eSRichard Henderson 
308859d7c14eSRichard Henderson     /* The movi is not explicitly generated here.  */
3089f8b2f202SRichard Henderson     if (ots->val_type == TEMP_VAL_REG) {
3090f8b2f202SRichard Henderson         s->reg_to_temp[ots->reg] = NULL;
3091f8b2f202SRichard Henderson     }
3092e8996ee0Sbellard     ots->val_type = TEMP_VAL_CONST;
3093e8996ee0Sbellard     ots->val = val;
309459d7c14eSRichard Henderson     ots->mem_coherent = 0;
3095ec7a869dSAurelien Jarno     if (NEED_SYNC_ARG(0)) {
309659d7c14eSRichard Henderson         temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0));
309759d7c14eSRichard Henderson     } else if (IS_DEAD_ARG(0)) {
3098f8bf00f1SRichard Henderson         temp_dead(s, ots);
30994c4e1ab2SAurelien Jarno     }
3100e8996ee0Sbellard }
3101e8996ee0Sbellard 
3102dd186292SRichard Henderson static void tcg_reg_alloc_movi(TCGContext *s, const TCGOp *op)
31030fe4fca4SPaolo Bonzini {
310443439139SRichard Henderson     TCGTemp *ots = arg_temp(op->args[0]);
3105dd186292SRichard Henderson     tcg_target_ulong val = op->args[1];
31060fe4fca4SPaolo Bonzini 
3107dd186292SRichard Henderson     tcg_reg_alloc_do_movi(s, ots, val, op->life);
31080fe4fca4SPaolo Bonzini }
31090fe4fca4SPaolo Bonzini 
3110dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op)
3111c896fe29Sbellard {
3112dd186292SRichard Henderson     const TCGLifeData arg_life = op->life;
3113c29c1d7eSAurelien Jarno     TCGRegSet allocated_regs;
3114c896fe29Sbellard     TCGTemp *ts, *ots;
3115450445d5SRichard Henderson     TCGType otype, itype;
3116c896fe29Sbellard 
3117d21369f5SRichard Henderson     allocated_regs = s->reserved_regs;
311843439139SRichard Henderson     ots = arg_temp(op->args[0]);
311943439139SRichard Henderson     ts = arg_temp(op->args[1]);
3120450445d5SRichard Henderson 
3121450445d5SRichard Henderson     /* Note that otype != itype for no-op truncation.  */
3122450445d5SRichard Henderson     otype = ots->type;
3123450445d5SRichard Henderson     itype = ts->type;
3124c896fe29Sbellard 
31250fe4fca4SPaolo Bonzini     if (ts->val_type == TEMP_VAL_CONST) {
31260fe4fca4SPaolo Bonzini         /* propagate constant or generate sti */
31270fe4fca4SPaolo Bonzini         tcg_target_ulong val = ts->val;
31280fe4fca4SPaolo Bonzini         if (IS_DEAD_ARG(1)) {
31290fe4fca4SPaolo Bonzini             temp_dead(s, ts);
31300fe4fca4SPaolo Bonzini         }
31310fe4fca4SPaolo Bonzini         tcg_reg_alloc_do_movi(s, ots, val, arg_life);
31320fe4fca4SPaolo Bonzini         return;
31330fe4fca4SPaolo Bonzini     }
31340fe4fca4SPaolo Bonzini 
31350fe4fca4SPaolo Bonzini     /* If the source value is in memory we're going to be forced
31360fe4fca4SPaolo Bonzini        to have it in a register in order to perform the copy.  Copy
31370fe4fca4SPaolo Bonzini        the SOURCE value into its own register first, that way we
31380fe4fca4SPaolo Bonzini        don't have to reload SOURCE the next time it is used. */
31390fe4fca4SPaolo Bonzini     if (ts->val_type == TEMP_VAL_MEM) {
314040ae5c62SRichard Henderson         temp_load(s, ts, tcg_target_available_regs[itype], allocated_regs);
3141c29c1d7eSAurelien Jarno     }
3142c29c1d7eSAurelien Jarno 
31430fe4fca4SPaolo Bonzini     tcg_debug_assert(ts->val_type == TEMP_VAL_REG);
3144c29c1d7eSAurelien Jarno     if (IS_DEAD_ARG(0) && !ots->fixed_reg) {
3145c29c1d7eSAurelien Jarno         /* mov to a non-saved dead register makes no sense (even with
3146c29c1d7eSAurelien Jarno            liveness analysis disabled). */
3147eabb7b91SAurelien Jarno         tcg_debug_assert(NEED_SYNC_ARG(0));
3148c29c1d7eSAurelien Jarno         if (!ots->mem_allocated) {
31492272e4a7SRichard Henderson             temp_allocate_frame(s, ots);
3150c29c1d7eSAurelien Jarno         }
3151b3a62939SRichard Henderson         tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset);
3152c29c1d7eSAurelien Jarno         if (IS_DEAD_ARG(1)) {
3153f8bf00f1SRichard Henderson             temp_dead(s, ts);
3154c29c1d7eSAurelien Jarno         }
3155f8bf00f1SRichard Henderson         temp_dead(s, ots);
3156e8996ee0Sbellard     } else {
3157c29c1d7eSAurelien Jarno         if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) {
3158c29c1d7eSAurelien Jarno             /* the mov can be suppressed */
3159c29c1d7eSAurelien Jarno             if (ots->val_type == TEMP_VAL_REG) {
3160f8b2f202SRichard Henderson                 s->reg_to_temp[ots->reg] = NULL;
3161c896fe29Sbellard             }
3162c29c1d7eSAurelien Jarno             ots->reg = ts->reg;
3163f8bf00f1SRichard Henderson             temp_dead(s, ts);
3164c29c1d7eSAurelien Jarno         } else {
3165c29c1d7eSAurelien Jarno             if (ots->val_type != TEMP_VAL_REG) {
3166c29c1d7eSAurelien Jarno                 /* When allocating a new register, make sure to not spill the
3167c29c1d7eSAurelien Jarno                    input one. */
3168c29c1d7eSAurelien Jarno                 tcg_regset_set_reg(allocated_regs, ts->reg);
3169450445d5SRichard Henderson                 ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype],
3170*b016486eSRichard Henderson                                          allocated_regs, 0,
3171*b016486eSRichard Henderson                                          ots->indirect_base);
3172c29c1d7eSAurelien Jarno             }
3173450445d5SRichard Henderson             tcg_out_mov(s, otype, ots->reg, ts->reg);
3174c29c1d7eSAurelien Jarno         }
3175c896fe29Sbellard         ots->val_type = TEMP_VAL_REG;
3176c896fe29Sbellard         ots->mem_coherent = 0;
3177f8b2f202SRichard Henderson         s->reg_to_temp[ots->reg] = ots;
3178ec7a869dSAurelien Jarno         if (NEED_SYNC_ARG(0)) {
317959d7c14eSRichard Henderson             temp_sync(s, ots, allocated_regs, 0);
3180c29c1d7eSAurelien Jarno         }
3181ec7a869dSAurelien Jarno     }
3182c896fe29Sbellard }
3183c896fe29Sbellard 
3184dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op)
3185c896fe29Sbellard {
3186dd186292SRichard Henderson     const TCGLifeData arg_life = op->life;
3187dd186292SRichard Henderson     const TCGOpDef * const def = &tcg_op_defs[op->opc];
318882790a87SRichard Henderson     TCGRegSet i_allocated_regs;
318982790a87SRichard Henderson     TCGRegSet o_allocated_regs;
3190b6638662SRichard Henderson     int i, k, nb_iargs, nb_oargs;
3191b6638662SRichard Henderson     TCGReg reg;
3192c896fe29Sbellard     TCGArg arg;
3193c896fe29Sbellard     const TCGArgConstraint *arg_ct;
3194c896fe29Sbellard     TCGTemp *ts;
3195c896fe29Sbellard     TCGArg new_args[TCG_MAX_OP_ARGS];
3196c896fe29Sbellard     int const_args[TCG_MAX_OP_ARGS];
3197c896fe29Sbellard 
3198c896fe29Sbellard     nb_oargs = def->nb_oargs;
3199c896fe29Sbellard     nb_iargs = def->nb_iargs;
3200c896fe29Sbellard 
3201c896fe29Sbellard     /* copy constants */
3202c896fe29Sbellard     memcpy(new_args + nb_oargs + nb_iargs,
3203dd186292SRichard Henderson            op->args + nb_oargs + nb_iargs,
3204c896fe29Sbellard            sizeof(TCGArg) * def->nb_cargs);
3205c896fe29Sbellard 
3206d21369f5SRichard Henderson     i_allocated_regs = s->reserved_regs;
3207d21369f5SRichard Henderson     o_allocated_regs = s->reserved_regs;
320882790a87SRichard Henderson 
3209c896fe29Sbellard     /* satisfy input constraints */
3210c896fe29Sbellard     for (k = 0; k < nb_iargs; k++) {
3211c896fe29Sbellard         i = def->sorted_args[nb_oargs + k];
3212dd186292SRichard Henderson         arg = op->args[i];
3213c896fe29Sbellard         arg_ct = &def->args_ct[i];
321443439139SRichard Henderson         ts = arg_temp(arg);
321540ae5c62SRichard Henderson 
321640ae5c62SRichard Henderson         if (ts->val_type == TEMP_VAL_CONST
321740ae5c62SRichard Henderson             && tcg_target_const_match(ts->val, ts->type, arg_ct)) {
3218c896fe29Sbellard             /* constant is OK for instruction */
3219c896fe29Sbellard             const_args[i] = 1;
3220c896fe29Sbellard             new_args[i] = ts->val;
3221c896fe29Sbellard             goto iarg_end;
3222c896fe29Sbellard         }
322340ae5c62SRichard Henderson 
322482790a87SRichard Henderson         temp_load(s, ts, arg_ct->u.regs, i_allocated_regs);
322540ae5c62SRichard Henderson 
32265ff9d6a4Sbellard         if (arg_ct->ct & TCG_CT_IALIAS) {
32275ff9d6a4Sbellard             if (ts->fixed_reg) {
32285ff9d6a4Sbellard                 /* if fixed register, we must allocate a new register
32295ff9d6a4Sbellard                    if the alias is not the same register */
3230dd186292SRichard Henderson                 if (arg != op->args[arg_ct->alias_index])
32315ff9d6a4Sbellard                     goto allocate_in_reg;
32325ff9d6a4Sbellard             } else {
3233c896fe29Sbellard                 /* if the input is aliased to an output and if it is
3234c896fe29Sbellard                    not dead after the instruction, we must allocate
3235c896fe29Sbellard                    a new register and move it */
3236866cb6cbSAurelien Jarno                 if (!IS_DEAD_ARG(i)) {
3237c896fe29Sbellard                     goto allocate_in_reg;
3238c896fe29Sbellard                 }
32397e1df267SAurelien Jarno                 /* check if the current register has already been allocated
32407e1df267SAurelien Jarno                    for another input aliased to an output */
32417e1df267SAurelien Jarno                 int k2, i2;
32427e1df267SAurelien Jarno                 for (k2 = 0 ; k2 < k ; k2++) {
32437e1df267SAurelien Jarno                     i2 = def->sorted_args[nb_oargs + k2];
32447e1df267SAurelien Jarno                     if ((def->args_ct[i2].ct & TCG_CT_IALIAS) &&
32457e1df267SAurelien Jarno                         (new_args[i2] == ts->reg)) {
32467e1df267SAurelien Jarno                         goto allocate_in_reg;
32477e1df267SAurelien Jarno                     }
32487e1df267SAurelien Jarno                 }
32495ff9d6a4Sbellard             }
3250866cb6cbSAurelien Jarno         }
3251c896fe29Sbellard         reg = ts->reg;
3252c896fe29Sbellard         if (tcg_regset_test_reg(arg_ct->u.regs, reg)) {
3253c896fe29Sbellard             /* nothing to do : the constraint is satisfied */
3254c896fe29Sbellard         } else {
3255c896fe29Sbellard         allocate_in_reg:
3256c896fe29Sbellard             /* allocate a new register matching the constraint
3257c896fe29Sbellard                and move the temporary register into it */
325882790a87SRichard Henderson             reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs,
3259*b016486eSRichard Henderson                                 0, ts->indirect_base);
32603b6dac34SRichard Henderson             tcg_out_mov(s, ts->type, reg, ts->reg);
3261c896fe29Sbellard         }
3262c896fe29Sbellard         new_args[i] = reg;
3263c896fe29Sbellard         const_args[i] = 0;
326482790a87SRichard Henderson         tcg_regset_set_reg(i_allocated_regs, reg);
3265c896fe29Sbellard     iarg_end: ;
3266c896fe29Sbellard     }
3267c896fe29Sbellard 
3268c896fe29Sbellard     /* mark dead temporaries and free the associated registers */
3269866cb6cbSAurelien Jarno     for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
3270866cb6cbSAurelien Jarno         if (IS_DEAD_ARG(i)) {
327143439139SRichard Henderson             temp_dead(s, arg_temp(op->args[i]));
3272c896fe29Sbellard         }
3273c896fe29Sbellard     }
3274c896fe29Sbellard 
3275a52ad07eSAurelien Jarno     if (def->flags & TCG_OPF_BB_END) {
327682790a87SRichard Henderson         tcg_reg_alloc_bb_end(s, i_allocated_regs);
3277a52ad07eSAurelien Jarno     } else {
3278c896fe29Sbellard         if (def->flags & TCG_OPF_CALL_CLOBBER) {
3279b03cce8eSbellard             /* XXX: permit generic clobber register list ? */
3280c8074023SRichard Henderson             for (i = 0; i < TCG_TARGET_NB_REGS; i++) {
3281c8074023SRichard Henderson                 if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) {
328282790a87SRichard Henderson                     tcg_reg_free(s, i, i_allocated_regs);
3283c896fe29Sbellard                 }
3284c896fe29Sbellard             }
32853d5c5f87SAurelien Jarno         }
32863d5c5f87SAurelien Jarno         if (def->flags & TCG_OPF_SIDE_EFFECTS) {
32873d5c5f87SAurelien Jarno             /* sync globals if the op has side effects and might trigger
32883d5c5f87SAurelien Jarno                an exception. */
328982790a87SRichard Henderson             sync_globals(s, i_allocated_regs);
3290c896fe29Sbellard         }
3291c896fe29Sbellard 
3292c896fe29Sbellard         /* satisfy the output constraints */
3293c896fe29Sbellard         for(k = 0; k < nb_oargs; k++) {
3294c896fe29Sbellard             i = def->sorted_args[k];
3295dd186292SRichard Henderson             arg = op->args[i];
3296c896fe29Sbellard             arg_ct = &def->args_ct[i];
329743439139SRichard Henderson             ts = arg_temp(arg);
329817280ff4SRichard Henderson             if ((arg_ct->ct & TCG_CT_ALIAS)
329917280ff4SRichard Henderson                 && !const_args[arg_ct->alias_index]) {
33005ff9d6a4Sbellard                 reg = new_args[arg_ct->alias_index];
330182790a87SRichard Henderson             } else if (arg_ct->ct & TCG_CT_NEWREG) {
330282790a87SRichard Henderson                 reg = tcg_reg_alloc(s, arg_ct->u.regs,
330382790a87SRichard Henderson                                     i_allocated_regs | o_allocated_regs,
3304*b016486eSRichard Henderson                                     0, ts->indirect_base);
3305c896fe29Sbellard             } else {
3306c896fe29Sbellard                 /* if fixed register, we try to use it */
3307c896fe29Sbellard                 reg = ts->reg;
3308c896fe29Sbellard                 if (ts->fixed_reg &&
3309c896fe29Sbellard                     tcg_regset_test_reg(arg_ct->u.regs, reg)) {
3310c896fe29Sbellard                     goto oarg_end;
3311c896fe29Sbellard                 }
331282790a87SRichard Henderson                 reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs,
3313*b016486eSRichard Henderson                                     0, ts->indirect_base);
3314c896fe29Sbellard             }
331582790a87SRichard Henderson             tcg_regset_set_reg(o_allocated_regs, reg);
3316c896fe29Sbellard             /* if a fixed register is used, then a move will be done afterwards */
3317c896fe29Sbellard             if (!ts->fixed_reg) {
3318639368ddSAurelien Jarno                 if (ts->val_type == TEMP_VAL_REG) {
3319f8b2f202SRichard Henderson                     s->reg_to_temp[ts->reg] = NULL;
3320639368ddSAurelien Jarno                 }
3321c896fe29Sbellard                 ts->val_type = TEMP_VAL_REG;
3322c896fe29Sbellard                 ts->reg = reg;
3323c896fe29Sbellard                 /* temp value is modified, so the value kept in memory is
3324c896fe29Sbellard                    potentially not the same */
3325c896fe29Sbellard                 ts->mem_coherent = 0;
3326f8b2f202SRichard Henderson                 s->reg_to_temp[reg] = ts;
3327c896fe29Sbellard             }
3328c896fe29Sbellard         oarg_end:
3329c896fe29Sbellard             new_args[i] = reg;
3330c896fe29Sbellard         }
3331e8996ee0Sbellard     }
3332c896fe29Sbellard 
3333c896fe29Sbellard     /* emit instruction */
3334d2fd745fSRichard Henderson     if (def->flags & TCG_OPF_VECTOR) {
3335d2fd745fSRichard Henderson         tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op),
3336d2fd745fSRichard Henderson                        new_args, const_args);
3337d2fd745fSRichard Henderson     } else {
3338dd186292SRichard Henderson         tcg_out_op(s, op->opc, new_args, const_args);
3339d2fd745fSRichard Henderson     }
3340c896fe29Sbellard 
3341c896fe29Sbellard     /* move the outputs in the correct register if needed */
3342c896fe29Sbellard     for(i = 0; i < nb_oargs; i++) {
334343439139SRichard Henderson         ts = arg_temp(op->args[i]);
3344c896fe29Sbellard         reg = new_args[i];
3345c896fe29Sbellard         if (ts->fixed_reg && ts->reg != reg) {
33463b6dac34SRichard Henderson             tcg_out_mov(s, ts->type, ts->reg, reg);
3347c896fe29Sbellard         }
3348ec7a869dSAurelien Jarno         if (NEED_SYNC_ARG(i)) {
334982790a87SRichard Henderson             temp_sync(s, ts, o_allocated_regs, IS_DEAD_ARG(i));
335059d7c14eSRichard Henderson         } else if (IS_DEAD_ARG(i)) {
3351f8bf00f1SRichard Henderson             temp_dead(s, ts);
3352ec7a869dSAurelien Jarno         }
3353c896fe29Sbellard     }
3354c896fe29Sbellard }
3355c896fe29Sbellard 
/*
 * STACK_DIR(x): expands to the negation of x when
 * TCG_TARGET_STACK_GROWSUP is defined, and to x unchanged otherwise.
 */
3356b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP
3357b03cce8eSbellard #define STACK_DIR(x) (-(x))
3358b03cce8eSbellard #else
3359b03cce8eSbellard #define STACK_DIR(x) (x)
3360b03cce8eSbellard #endif
3361b03cce8eSbellard 
3362dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op)
3363c896fe29Sbellard {
3364cd9090aaSRichard Henderson     const int nb_oargs = TCGOP_CALLO(op);
3365cd9090aaSRichard Henderson     const int nb_iargs = TCGOP_CALLI(op);
3366dd186292SRichard Henderson     const TCGLifeData arg_life = op->life;
3367b6638662SRichard Henderson     int flags, nb_regs, i;
3368b6638662SRichard Henderson     TCGReg reg;
3369cf066674SRichard Henderson     TCGArg arg;
3370c896fe29Sbellard     TCGTemp *ts;
3371d3452f1fSRichard Henderson     intptr_t stack_offset;
3372d3452f1fSRichard Henderson     size_t call_stack_size;
3373cf066674SRichard Henderson     tcg_insn_unit *func_addr;
3374cf066674SRichard Henderson     int allocate_args;
3375c896fe29Sbellard     TCGRegSet allocated_regs;
3376c896fe29Sbellard 
3377dd186292SRichard Henderson     func_addr = (tcg_insn_unit *)(intptr_t)op->args[nb_oargs + nb_iargs];
3378dd186292SRichard Henderson     flags = op->args[nb_oargs + nb_iargs + 1];
3379c896fe29Sbellard 
33806e17d0c5SStefan Weil     nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs);
3381c45cb8bbSRichard Henderson     if (nb_regs > nb_iargs) {
3382c45cb8bbSRichard Henderson         nb_regs = nb_iargs;
3383cf066674SRichard Henderson     }
3384c896fe29Sbellard 
3385c896fe29Sbellard     /* assign stack slots first */
3386c45cb8bbSRichard Henderson     call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long);
3387c896fe29Sbellard     call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) &
3388c896fe29Sbellard         ~(TCG_TARGET_STACK_ALIGN - 1);
3389b03cce8eSbellard     allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE);
3390b03cce8eSbellard     if (allocate_args) {
3391345649c0SBlue Swirl         /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed,
3392345649c0SBlue Swirl            preallocate call stack */
3393345649c0SBlue Swirl         tcg_abort();
3394b03cce8eSbellard     }
339539cf05d3Sbellard 
339639cf05d3Sbellard     stack_offset = TCG_TARGET_CALL_STACK_OFFSET;
3397c45cb8bbSRichard Henderson     for (i = nb_regs; i < nb_iargs; i++) {
3398dd186292SRichard Henderson         arg = op->args[nb_oargs + i];
339939cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP
340039cf05d3Sbellard         stack_offset -= sizeof(tcg_target_long);
340139cf05d3Sbellard #endif
340239cf05d3Sbellard         if (arg != TCG_CALL_DUMMY_ARG) {
340343439139SRichard Henderson             ts = arg_temp(arg);
340440ae5c62SRichard Henderson             temp_load(s, ts, tcg_target_available_regs[ts->type],
340540ae5c62SRichard Henderson                       s->reserved_regs);
3406e4d5434cSblueswir1             tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset);
340739cf05d3Sbellard         }
340839cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP
340939cf05d3Sbellard         stack_offset += sizeof(tcg_target_long);
341039cf05d3Sbellard #endif
3411c896fe29Sbellard     }
3412c896fe29Sbellard 
3413c896fe29Sbellard     /* assign input registers */
3414d21369f5SRichard Henderson     allocated_regs = s->reserved_regs;
3415c896fe29Sbellard     for (i = 0; i < nb_regs; i++) {
3416dd186292SRichard Henderson         arg = op->args[nb_oargs + i];
341739cf05d3Sbellard         if (arg != TCG_CALL_DUMMY_ARG) {
341843439139SRichard Henderson             ts = arg_temp(arg);
3419c896fe29Sbellard             reg = tcg_target_call_iarg_regs[i];
3420b3915dbbSRichard Henderson             tcg_reg_free(s, reg, allocated_regs);
342140ae5c62SRichard Henderson 
3422c896fe29Sbellard             if (ts->val_type == TEMP_VAL_REG) {
3423c896fe29Sbellard                 if (ts->reg != reg) {
34243b6dac34SRichard Henderson                     tcg_out_mov(s, ts->type, reg, ts->reg);
3425c896fe29Sbellard                 }
3426c896fe29Sbellard             } else {
3427ccb1bb66SRichard Henderson                 TCGRegSet arg_set = 0;
342840ae5c62SRichard Henderson 
342940ae5c62SRichard Henderson                 tcg_regset_set_reg(arg_set, reg);
343040ae5c62SRichard Henderson                 temp_load(s, ts, arg_set, allocated_regs);
3431c896fe29Sbellard             }
343240ae5c62SRichard Henderson 
3433c896fe29Sbellard             tcg_regset_set_reg(allocated_regs, reg);
3434c896fe29Sbellard         }
343539cf05d3Sbellard     }
3436c896fe29Sbellard 
3437c896fe29Sbellard     /* mark dead temporaries and free the associated registers */
3438866cb6cbSAurelien Jarno     for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
3439866cb6cbSAurelien Jarno         if (IS_DEAD_ARG(i)) {
344043439139SRichard Henderson             temp_dead(s, arg_temp(op->args[i]));
3441c896fe29Sbellard         }
3442c896fe29Sbellard     }
3443c896fe29Sbellard 
3444c896fe29Sbellard     /* clobber call registers */
3445c8074023SRichard Henderson     for (i = 0; i < TCG_TARGET_NB_REGS; i++) {
3446c8074023SRichard Henderson         if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) {
3447b3915dbbSRichard Henderson             tcg_reg_free(s, i, allocated_regs);
3448c896fe29Sbellard         }
3449c896fe29Sbellard     }
3450c896fe29Sbellard 
345178505279SAurelien Jarno     /* Save globals if they might be written by the helper, sync them if
345278505279SAurelien Jarno        they might be read. */
345378505279SAurelien Jarno     if (flags & TCG_CALL_NO_READ_GLOBALS) {
345478505279SAurelien Jarno         /* Nothing to do */
345578505279SAurelien Jarno     } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) {
345678505279SAurelien Jarno         sync_globals(s, allocated_regs);
345778505279SAurelien Jarno     } else {
3458e8996ee0Sbellard         save_globals(s, allocated_regs);
3459b9c18f56Saurel32     }
3460c896fe29Sbellard 
3461cf066674SRichard Henderson     tcg_out_call(s, func_addr);
3462c896fe29Sbellard 
3463c896fe29Sbellard     /* assign output registers and emit moves if needed */
3464c896fe29Sbellard     for(i = 0; i < nb_oargs; i++) {
3465dd186292SRichard Henderson         arg = op->args[i];
346643439139SRichard Henderson         ts = arg_temp(arg);
3467c896fe29Sbellard         reg = tcg_target_call_oarg_regs[i];
3468eabb7b91SAurelien Jarno         tcg_debug_assert(s->reg_to_temp[reg] == NULL);
346934b1a49cSRichard Henderson 
3470c896fe29Sbellard         if (ts->fixed_reg) {
3471c896fe29Sbellard             if (ts->reg != reg) {
34723b6dac34SRichard Henderson                 tcg_out_mov(s, ts->type, ts->reg, reg);
3473c896fe29Sbellard             }
3474c896fe29Sbellard         } else {
3475639368ddSAurelien Jarno             if (ts->val_type == TEMP_VAL_REG) {
3476f8b2f202SRichard Henderson                 s->reg_to_temp[ts->reg] = NULL;
3477639368ddSAurelien Jarno             }
3478c896fe29Sbellard             ts->val_type = TEMP_VAL_REG;
3479c896fe29Sbellard             ts->reg = reg;
3480c896fe29Sbellard             ts->mem_coherent = 0;
3481f8b2f202SRichard Henderson             s->reg_to_temp[reg] = ts;
3482ec7a869dSAurelien Jarno             if (NEED_SYNC_ARG(i)) {
348359d7c14eSRichard Henderson                 temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i));
348459d7c14eSRichard Henderson             } else if (IS_DEAD_ARG(i)) {
3485f8bf00f1SRichard Henderson                 temp_dead(s, ts);
3486c896fe29Sbellard             }
3487c896fe29Sbellard         }
34888c11ad25SAurelien Jarno     }
3489c896fe29Sbellard }
3490c896fe29Sbellard 
3491c896fe29Sbellard #ifdef CONFIG_PROFILER
3492c896fe29Sbellard 
3493c3fac113SEmilio G. Cota /* avoid copy/paste errors */
3494c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field)                       \
3495c3fac113SEmilio G. Cota     do {                                                \
3496c3fac113SEmilio G. Cota         (to)->field += atomic_read(&((from)->field));   \
3497c3fac113SEmilio G. Cota     } while (0)
3498c896fe29Sbellard 
3499c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field)                                       \
3500c3fac113SEmilio G. Cota     do {                                                                \
3501c3fac113SEmilio G. Cota         typeof((from)->field) val__ = atomic_read(&((from)->field));    \
3502c3fac113SEmilio G. Cota         if (val__ > (to)->field) {                                      \
3503c3fac113SEmilio G. Cota             (to)->field = val__;                                        \
3504c3fac113SEmilio G. Cota         }                                                               \
3505c3fac113SEmilio G. Cota     } while (0)
3506c3fac113SEmilio G. Cota 
3507c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */
3508c3fac113SEmilio G. Cota static inline
3509c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table)
3510c896fe29Sbellard {
35113468b59eSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
3512c3fac113SEmilio G. Cota     unsigned int i;
3513c3fac113SEmilio G. Cota 
35143468b59eSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
35153468b59eSEmilio G. Cota         TCGContext *s = atomic_read(&tcg_ctxs[i]);
35163468b59eSEmilio G. Cota         const TCGProfile *orig = &s->prof;
3517c3fac113SEmilio G. Cota 
3518c3fac113SEmilio G. Cota         if (counters) {
351972fd2efbSEmilio G. Cota             PROF_ADD(prof, orig, cpu_exec_time);
3520c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, tb_count1);
3521c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, tb_count);
3522c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, op_count);
3523c3fac113SEmilio G. Cota             PROF_MAX(prof, orig, op_count_max);
3524c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, temp_count);
3525c3fac113SEmilio G. Cota             PROF_MAX(prof, orig, temp_count_max);
3526c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, del_op_count);
3527c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, code_in_len);
3528c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, code_out_len);
3529c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, search_out_len);
3530c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, interm_time);
3531c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, code_time);
3532c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, la_time);
3533c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, opt_time);
3534c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, restore_count);
3535c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, restore_time);
3536c3fac113SEmilio G. Cota         }
3537c3fac113SEmilio G. Cota         if (table) {
3538c896fe29Sbellard             int i;
3539d70724ceSzhanghailiang 
354015fc7daaSRichard Henderson             for (i = 0; i < NB_OPS; i++) {
3541c3fac113SEmilio G. Cota                 PROF_ADD(prof, orig, table_op_count[i]);
3542c3fac113SEmilio G. Cota             }
3543c3fac113SEmilio G. Cota         }
3544c3fac113SEmilio G. Cota     }
3545c3fac113SEmilio G. Cota }
3546c3fac113SEmilio G. Cota 
3547c3fac113SEmilio G. Cota #undef PROF_ADD
3548c3fac113SEmilio G. Cota #undef PROF_MAX
3549c3fac113SEmilio G. Cota 
/*
 * Snapshot only the scalar counters into @prof: calls
 * tcg_profile_snapshot() with counters=true and table=false.
 */
3550c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof)
3551c3fac113SEmilio G. Cota {
3552c3fac113SEmilio G. Cota     tcg_profile_snapshot(prof, true, false);
3553c3fac113SEmilio G. Cota }
3554c3fac113SEmilio G. Cota 
/*
 * Snapshot only the per-opcode table into @prof: calls
 * tcg_profile_snapshot() with counters=false and table=true.
 */
3555c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof)
3556c3fac113SEmilio G. Cota {
3557c3fac113SEmilio G. Cota     tcg_profile_snapshot(prof, false, true);
3558c3fac113SEmilio G. Cota }
3559c3fac113SEmilio G. Cota 
3560c3fac113SEmilio G. Cota void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf)
3561c3fac113SEmilio G. Cota {
3562c3fac113SEmilio G. Cota     TCGProfile prof = {};
3563c3fac113SEmilio G. Cota     int i;
3564c3fac113SEmilio G. Cota 
3565c3fac113SEmilio G. Cota     tcg_profile_snapshot_table(&prof);
3566c3fac113SEmilio G. Cota     for (i = 0; i < NB_OPS; i++) {
3567246ae24dSMax Filippov         cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name,
3568c3fac113SEmilio G. Cota                     prof.table_op_count[i]);
3569c896fe29Sbellard     }
3570c896fe29Sbellard }
357172fd2efbSEmilio G. Cota 
357272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void)
357372fd2efbSEmilio G. Cota {
357472fd2efbSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
357572fd2efbSEmilio G. Cota     unsigned int i;
357672fd2efbSEmilio G. Cota     int64_t ret = 0;
357772fd2efbSEmilio G. Cota 
357872fd2efbSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
357972fd2efbSEmilio G. Cota         const TCGContext *s = atomic_read(&tcg_ctxs[i]);
358072fd2efbSEmilio G. Cota         const TCGProfile *prof = &s->prof;
358172fd2efbSEmilio G. Cota 
358272fd2efbSEmilio G. Cota         ret += atomic_read(&prof->cpu_exec_time);
358372fd2efbSEmilio G. Cota     }
358472fd2efbSEmilio G. Cota     return ret;
358572fd2efbSEmilio G. Cota }
3586246ae24dSMax Filippov #else
/*
 * Variant built when CONFIG_PROFILER is not defined: there is no table
 * to dump, so only a fixed notice is written to @f via @cpu_fprintf.
 */
3587246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf)
3588246ae24dSMax Filippov {
3589246ae24dSMax Filippov     cpu_fprintf(f, "[TCG profiler not compiled]\n");
3590246ae24dSMax Filippov }
359172fd2efbSEmilio G. Cota 
/*
 * Variant built when CONFIG_PROFILER is not defined: no execution time
 * is recorded, so this reports an error and terminates the process with
 * EXIT_FAILURE instead of returning a value.
 */
359272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void)
359372fd2efbSEmilio G. Cota {
359472fd2efbSEmilio G. Cota     error_report("%s: TCG profiler not compiled", __func__);
359572fd2efbSEmilio G. Cota     exit(EXIT_FAILURE);
359672fd2efbSEmilio G. Cota }
3597c896fe29Sbellard #endif
3598c896fe29Sbellard 
3599c896fe29Sbellard 
36005bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb)
3601c896fe29Sbellard {
3602c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER
3603c3fac113SEmilio G. Cota     TCGProfile *prof = &s->prof;
3604c3fac113SEmilio G. Cota #endif
360515fa08f8SRichard Henderson     int i, num_insns;
360615fa08f8SRichard Henderson     TCGOp *op;
3607c896fe29Sbellard 
360804fe6400SRichard Henderson #ifdef CONFIG_PROFILER
360904fe6400SRichard Henderson     {
3610c1f543b7SEmilio G. Cota         int n = 0;
361104fe6400SRichard Henderson 
361215fa08f8SRichard Henderson         QTAILQ_FOREACH(op, &s->ops, link) {
361315fa08f8SRichard Henderson             n++;
361415fa08f8SRichard Henderson         }
3615c3fac113SEmilio G. Cota         atomic_set(&prof->op_count, prof->op_count + n);
3616c3fac113SEmilio G. Cota         if (n > prof->op_count_max) {
3617c3fac113SEmilio G. Cota             atomic_set(&prof->op_count_max, n);
361804fe6400SRichard Henderson         }
361904fe6400SRichard Henderson 
362004fe6400SRichard Henderson         n = s->nb_temps;
3621c3fac113SEmilio G. Cota         atomic_set(&prof->temp_count, prof->temp_count + n);
3622c3fac113SEmilio G. Cota         if (n > prof->temp_count_max) {
3623c3fac113SEmilio G. Cota             atomic_set(&prof->temp_count_max, n);
362404fe6400SRichard Henderson         }
362504fe6400SRichard Henderson     }
362604fe6400SRichard Henderson #endif
362704fe6400SRichard Henderson 
3628c896fe29Sbellard #ifdef DEBUG_DISAS
3629d977e1c2SAlex Bennée     if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP)
3630d977e1c2SAlex Bennée                  && qemu_log_in_addr_range(tb->pc))) {
36311ee73216SRichard Henderson         qemu_log_lock();
363293fcfe39Saliguori         qemu_log("OP:\n");
3633eeacee4dSBlue Swirl         tcg_dump_ops(s);
363493fcfe39Saliguori         qemu_log("\n");
36351ee73216SRichard Henderson         qemu_log_unlock();
3636c896fe29Sbellard     }
3637c896fe29Sbellard #endif
3638c896fe29Sbellard 
3639c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER
3640c3fac113SEmilio G. Cota     atomic_set(&prof->opt_time, prof->opt_time - profile_getclock());
3641c5cc28ffSAurelien Jarno #endif
3642c5cc28ffSAurelien Jarno 
36438f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS
3644c45cb8bbSRichard Henderson     tcg_optimize(s);
36458f2e8c07SKirill Batuzov #endif
36468f2e8c07SKirill Batuzov 
3647a23a9ec6Sbellard #ifdef CONFIG_PROFILER
3648c3fac113SEmilio G. Cota     atomic_set(&prof->opt_time, prof->opt_time + profile_getclock());
3649c3fac113SEmilio G. Cota     atomic_set(&prof->la_time, prof->la_time - profile_getclock());
3650a23a9ec6Sbellard #endif
3651c5cc28ffSAurelien Jarno 
3652b4fc67c7SRichard Henderson     reachable_code_pass(s);
3653b83eabeaSRichard Henderson     liveness_pass_1(s);
36545a18407fSRichard Henderson 
36555a18407fSRichard Henderson     if (s->nb_indirects > 0) {
36565a18407fSRichard Henderson #ifdef DEBUG_DISAS
36575a18407fSRichard Henderson         if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND)
36585a18407fSRichard Henderson                      && qemu_log_in_addr_range(tb->pc))) {
36591ee73216SRichard Henderson             qemu_log_lock();
36605a18407fSRichard Henderson             qemu_log("OP before indirect lowering:\n");
36615a18407fSRichard Henderson             tcg_dump_ops(s);
36625a18407fSRichard Henderson             qemu_log("\n");
36631ee73216SRichard Henderson             qemu_log_unlock();
36645a18407fSRichard Henderson         }
36655a18407fSRichard Henderson #endif
36665a18407fSRichard Henderson         /* Replace indirect temps with direct temps.  */
3667b83eabeaSRichard Henderson         if (liveness_pass_2(s)) {
36685a18407fSRichard Henderson             /* If changes were made, re-run liveness.  */
3669b83eabeaSRichard Henderson             liveness_pass_1(s);
36705a18407fSRichard Henderson         }
36715a18407fSRichard Henderson     }
3672c5cc28ffSAurelien Jarno 
3673a23a9ec6Sbellard #ifdef CONFIG_PROFILER
3674c3fac113SEmilio G. Cota     atomic_set(&prof->la_time, prof->la_time + profile_getclock());
3675a23a9ec6Sbellard #endif
3676c896fe29Sbellard 
3677c896fe29Sbellard #ifdef DEBUG_DISAS
3678d977e1c2SAlex Bennée     if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT)
3679d977e1c2SAlex Bennée                  && qemu_log_in_addr_range(tb->pc))) {
36801ee73216SRichard Henderson         qemu_log_lock();
3681c5cc28ffSAurelien Jarno         qemu_log("OP after optimization and liveness analysis:\n");
3682eeacee4dSBlue Swirl         tcg_dump_ops(s);
368393fcfe39Saliguori         qemu_log("\n");
36841ee73216SRichard Henderson         qemu_log_unlock();
3685c896fe29Sbellard     }
3686c896fe29Sbellard #endif
3687c896fe29Sbellard 
3688c896fe29Sbellard     tcg_reg_alloc_start(s);
3689c896fe29Sbellard 
3690e7e168f4SEmilio G. Cota     s->code_buf = tb->tc.ptr;
3691e7e168f4SEmilio G. Cota     s->code_ptr = tb->tc.ptr;
3692c896fe29Sbellard 
3693659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS
36946001f772SLaurent Vivier     QSIMPLEQ_INIT(&s->ldst_labels);
3695659ef5cbSRichard Henderson #endif
369657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
369757a26946SRichard Henderson     s->pool_labels = NULL;
369857a26946SRichard Henderson #endif
36999ecefc84SRichard Henderson 
3700fca8a500SRichard Henderson     num_insns = -1;
370115fa08f8SRichard Henderson     QTAILQ_FOREACH(op, &s->ops, link) {
3702c45cb8bbSRichard Henderson         TCGOpcode opc = op->opc;
3703b3db8758Sblueswir1 
3704c896fe29Sbellard #ifdef CONFIG_PROFILER
3705c3fac113SEmilio G. Cota         atomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1);
3706c896fe29Sbellard #endif
3707c45cb8bbSRichard Henderson 
3708c896fe29Sbellard         switch (opc) {
3709c896fe29Sbellard         case INDEX_op_mov_i32:
3710c896fe29Sbellard         case INDEX_op_mov_i64:
3711d2fd745fSRichard Henderson         case INDEX_op_mov_vec:
3712dd186292SRichard Henderson             tcg_reg_alloc_mov(s, op);
3713c896fe29Sbellard             break;
3714e8996ee0Sbellard         case INDEX_op_movi_i32:
3715e8996ee0Sbellard         case INDEX_op_movi_i64:
3716d2fd745fSRichard Henderson         case INDEX_op_dupi_vec:
3717dd186292SRichard Henderson             tcg_reg_alloc_movi(s, op);
3718e8996ee0Sbellard             break;
3719765b842aSRichard Henderson         case INDEX_op_insn_start:
3720fca8a500SRichard Henderson             if (num_insns >= 0) {
37219f754620SRichard Henderson                 size_t off = tcg_current_code_size(s);
37229f754620SRichard Henderson                 s->gen_insn_end_off[num_insns] = off;
37239f754620SRichard Henderson                 /* Assert that we do not overflow our stored offset.  */
37249f754620SRichard Henderson                 assert(s->gen_insn_end_off[num_insns] == off);
3725fca8a500SRichard Henderson             }
3726fca8a500SRichard Henderson             num_insns++;
3727bad729e2SRichard Henderson             for (i = 0; i < TARGET_INSN_START_WORDS; ++i) {
3728bad729e2SRichard Henderson                 target_ulong a;
3729bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
3730efee3746SRichard Henderson                 a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]);
3731bad729e2SRichard Henderson #else
3732efee3746SRichard Henderson                 a = op->args[i];
3733bad729e2SRichard Henderson #endif
3734fca8a500SRichard Henderson                 s->gen_insn_data[num_insns][i] = a;
3735bad729e2SRichard Henderson             }
3736c896fe29Sbellard             break;
37375ff9d6a4Sbellard         case INDEX_op_discard:
373843439139SRichard Henderson             temp_dead(s, arg_temp(op->args[0]));
37395ff9d6a4Sbellard             break;
3740c896fe29Sbellard         case INDEX_op_set_label:
3741e8996ee0Sbellard             tcg_reg_alloc_bb_end(s, s->reserved_regs);
3742efee3746SRichard Henderson             tcg_out_label(s, arg_label(op->args[0]), s->code_ptr);
3743c896fe29Sbellard             break;
3744c896fe29Sbellard         case INDEX_op_call:
3745dd186292SRichard Henderson             tcg_reg_alloc_call(s, op);
3746c45cb8bbSRichard Henderson             break;
3747c896fe29Sbellard         default:
374825c4d9ccSRichard Henderson             /* Sanity check that we've not introduced any unhandled opcodes. */
3749be0f34b5SRichard Henderson             tcg_debug_assert(tcg_op_supported(opc));
3750c896fe29Sbellard             /* Note: in order to speed up the code, it would be much
3751c896fe29Sbellard                faster to have specialized register allocator functions for
3752c896fe29Sbellard                some common argument patterns */
3753dd186292SRichard Henderson             tcg_reg_alloc_op(s, op);
3754c896fe29Sbellard             break;
3755c896fe29Sbellard         }
37568d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG
3757c896fe29Sbellard         check_regs(s);
3758c896fe29Sbellard #endif
3759b125f9dcSRichard Henderson         /* Test for (pending) buffer overflow.  The assumption is that any
3760b125f9dcSRichard Henderson            one operation beginning below the high water mark cannot overrun
3761b125f9dcSRichard Henderson            the buffer completely.  Thus we can test for overflow after
3762b125f9dcSRichard Henderson            generating code without having to check during generation.  */
3763644da9b3SJohn Clarke         if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) {
3764b125f9dcSRichard Henderson             return -1;
3765b125f9dcSRichard Henderson         }
3766c896fe29Sbellard     }
3767fca8a500SRichard Henderson     tcg_debug_assert(num_insns >= 0);
3768fca8a500SRichard Henderson     s->gen_insn_end_off[num_insns] = tcg_current_code_size(s);
3769c45cb8bbSRichard Henderson 
3770b76f0d8cSYeongkyoon Lee     /* Generate TB finalization at the end of block */
3771659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS
3772659ef5cbSRichard Henderson     if (!tcg_out_ldst_finalize(s)) {
377323dceda6SRichard Henderson         return -1;
377423dceda6SRichard Henderson     }
3775659ef5cbSRichard Henderson #endif
377657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
377757a26946SRichard Henderson     if (!tcg_out_pool_finalize(s)) {
377857a26946SRichard Henderson         return -1;
377957a26946SRichard Henderson     }
378057a26946SRichard Henderson #endif
3781c896fe29Sbellard 
3782c896fe29Sbellard     /* flush instruction cache */
37831813e175SRichard Henderson     flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr);
37842aeabc08SStefan Weil 
37851813e175SRichard Henderson     return tcg_current_code_size(s);
3786c896fe29Sbellard }
3787c896fe29Sbellard 
3788a23a9ec6Sbellard #ifdef CONFIG_PROFILER
3789405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
3790a23a9ec6Sbellard {
3791c3fac113SEmilio G. Cota     TCGProfile prof = {};
3792c3fac113SEmilio G. Cota     const TCGProfile *s;
3793c3fac113SEmilio G. Cota     int64_t tb_count;
3794c3fac113SEmilio G. Cota     int64_t tb_div_count;
3795c3fac113SEmilio G. Cota     int64_t tot;
3796c3fac113SEmilio G. Cota 
3797c3fac113SEmilio G. Cota     tcg_profile_snapshot_counters(&prof);
3798c3fac113SEmilio G. Cota     s = &prof;
3799c3fac113SEmilio G. Cota     tb_count = s->tb_count;
3800c3fac113SEmilio G. Cota     tb_div_count = tb_count ? tb_count : 1;
3801c3fac113SEmilio G. Cota     tot = s->interm_time + s->code_time;
3802a23a9ec6Sbellard 
3803a23a9ec6Sbellard     cpu_fprintf(f, "JIT cycles          %" PRId64 " (%0.3f s at 2.4 GHz)\n",
3804a23a9ec6Sbellard                 tot, tot / 2.4e9);
3805a23a9ec6Sbellard     cpu_fprintf(f, "translated TBs      %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n",
3806fca8a500SRichard Henderson                 tb_count, s->tb_count1 - tb_count,
3807fca8a500SRichard Henderson                 (double)(s->tb_count1 - s->tb_count)
3808fca8a500SRichard Henderson                 / (s->tb_count1 ? s->tb_count1 : 1) * 100.0);
3809a23a9ec6Sbellard     cpu_fprintf(f, "avg ops/TB          %0.1f max=%d\n",
3810fca8a500SRichard Henderson                 (double)s->op_count / tb_div_count, s->op_count_max);
3811a23a9ec6Sbellard     cpu_fprintf(f, "deleted ops/TB      %0.2f\n",
3812fca8a500SRichard Henderson                 (double)s->del_op_count / tb_div_count);
3813a23a9ec6Sbellard     cpu_fprintf(f, "avg temps/TB        %0.2f max=%d\n",
3814fca8a500SRichard Henderson                 (double)s->temp_count / tb_div_count, s->temp_count_max);
3815fca8a500SRichard Henderson     cpu_fprintf(f, "avg host code/TB    %0.1f\n",
3816fca8a500SRichard Henderson                 (double)s->code_out_len / tb_div_count);
3817fca8a500SRichard Henderson     cpu_fprintf(f, "avg search data/TB  %0.1f\n",
3818fca8a500SRichard Henderson                 (double)s->search_out_len / tb_div_count);
3819a23a9ec6Sbellard 
3820a23a9ec6Sbellard     cpu_fprintf(f, "cycles/op           %0.1f\n",
3821a23a9ec6Sbellard                 s->op_count ? (double)tot / s->op_count : 0);
3822a23a9ec6Sbellard     cpu_fprintf(f, "cycles/in byte      %0.1f\n",
3823a23a9ec6Sbellard                 s->code_in_len ? (double)tot / s->code_in_len : 0);
3824a23a9ec6Sbellard     cpu_fprintf(f, "cycles/out byte     %0.1f\n",
3825a23a9ec6Sbellard                 s->code_out_len ? (double)tot / s->code_out_len : 0);
3826fca8a500SRichard Henderson     cpu_fprintf(f, "cycles/search byte     %0.1f\n",
3827fca8a500SRichard Henderson                 s->search_out_len ? (double)tot / s->search_out_len : 0);
3828fca8a500SRichard Henderson     if (tot == 0) {
3829a23a9ec6Sbellard         tot = 1;
3830fca8a500SRichard Henderson     }
3831a23a9ec6Sbellard     cpu_fprintf(f, "  gen_interm time   %0.1f%%\n",
3832a23a9ec6Sbellard                 (double)s->interm_time / tot * 100.0);
3833a23a9ec6Sbellard     cpu_fprintf(f, "  gen_code time     %0.1f%%\n",
3834a23a9ec6Sbellard                 (double)s->code_time / tot * 100.0);
3835c5cc28ffSAurelien Jarno     cpu_fprintf(f, "optim./code time    %0.1f%%\n",
3836c5cc28ffSAurelien Jarno                 (double)s->opt_time / (s->code_time ? s->code_time : 1)
3837c5cc28ffSAurelien Jarno                 * 100.0);
3838a23a9ec6Sbellard     cpu_fprintf(f, "liveness/code time  %0.1f%%\n",
3839a23a9ec6Sbellard                 (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0);
3840a23a9ec6Sbellard     cpu_fprintf(f, "cpu_restore count   %" PRId64 "\n",
3841a23a9ec6Sbellard                 s->restore_count);
3842a23a9ec6Sbellard     cpu_fprintf(f, "  avg cycles        %0.1f\n",
3843a23a9ec6Sbellard                 s->restore_count ? (double)s->restore_time / s->restore_count : 0);
3844a23a9ec6Sbellard }
3845a23a9ec6Sbellard #else
3846405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
3847a23a9ec6Sbellard {
384824bf7b3aSbellard     cpu_fprintf(f, "[TCG profiler not compiled]\n");
3849a23a9ec6Sbellard }
3850a23a9ec6Sbellard #endif
3851813da627SRichard Henderson 
3852813da627SRichard Henderson #ifdef ELF_HOST_MACHINE
38535872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things:
38545872bbf2SRichard Henderson 
38555872bbf2SRichard Henderson    (1) Define ELF_HOST_MACHINE to indicate both what value to
38565872bbf2SRichard Henderson        put into the ELF image and to indicate support for the feature.
38575872bbf2SRichard Henderson 
38585872bbf2SRichard Henderson    (2) Define tcg_register_jit.  This should create a buffer containing
38595872bbf2SRichard Henderson        the contents of a .debug_frame section that describes the post-
38605872bbf2SRichard Henderson        prologue unwind info for the tcg machine.
38615872bbf2SRichard Henderson 
38625872bbf2SRichard Henderson    (3) Call tcg_register_jit_int, with the constructed .debug_frame.
38635872bbf2SRichard Henderson */
3864813da627SRichard Henderson 
3865813da627SRichard Henderson /* Begin GDB interface.  THE FOLLOWING MUST MATCH GDB DOCS.  */
/* Values stored in jit_descriptor.action_flag. */
typedef enum {
    JIT_NOACTION      = 0,
    JIT_REGISTER_FN   = 1,
    JIT_UNREGISTER_FN = 2
} jit_actions_t;

/* One registered symbol file, linked to its neighbours in both directions. */
struct jit_code_entry {
    struct jit_code_entry *next_entry;
    struct jit_code_entry *prev_entry;
    const void *symfile_addr;   /* start of the in-memory symbol file */
    uint64_t symfile_size;      /* size of that symbol file in bytes */
};

/* The single descriptor object exported to the debugger. */
struct jit_descriptor {
    uint32_t version;
    uint32_t action_flag;       /* holds a jit_actions_t value */
    struct jit_code_entry *relevant_entry;
    struct jit_code_entry *first_entry;
};

/*
 * Notification hook called after the descriptor has been updated.
 * It is declared noinline and its body is an empty asm statement only;
 * see the GDB JIT interface documentation for how the debugger uses it.
 */
void __jit_debug_register_code(void) __attribute__((noinline));
void __jit_debug_register_code(void)
{
    __asm__("");
}

/* The version must be initialized statically, because GDB may check
   it before any code here has had a chance to set it.  */
struct jit_descriptor __jit_debug_descriptor = {
    .version = 1,
    .action_flag = JIT_NOACTION,
    .relevant_entry = NULL,
    .first_entry = NULL,
};
3895813da627SRichard Henderson 
3896813da627SRichard Henderson /* End GDB interface.  */
3897813da627SRichard Henderson 
/*
 * Return the byte offset of @str inside the ELF-style string table @strtab.
 *
 * @strtab is a sequence of NUL-terminated strings.  Offset 0 is skipped
 * (it holds the leading empty string), so the search starts at offset 1.
 *
 * The table must be followed by at least one additional NUL byte, such as
 * the zero padding of a fixed-size array: the empty entry this produces is
 * taken as the end of the table.  If @str is not present, 0 (the offset of
 * the empty name) is returned instead of scanning past the end of the
 * table.
 */
static int find_string(const char *strtab, const char *str)
{
    const char *p;

    for (p = strtab + 1; *p != '\0'; p += strlen(p) + 1) {
        if (strcmp(p, str) == 0) {
            return (int)(p - strtab);
        }
    }

    /* Reached the terminating empty entry without a match.  */
    return 0;
}
3909813da627SRichard Henderson 
39105872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size,
39112c90784aSRichard Henderson                                  const void *debug_frame,
39122c90784aSRichard Henderson                                  size_t debug_frame_size)
3913813da627SRichard Henderson {
39145872bbf2SRichard Henderson     struct __attribute__((packed)) DebugInfo {
39155872bbf2SRichard Henderson         uint32_t  len;
39165872bbf2SRichard Henderson         uint16_t  version;
39175872bbf2SRichard Henderson         uint32_t  abbrev;
39185872bbf2SRichard Henderson         uint8_t   ptr_size;
39195872bbf2SRichard Henderson         uint8_t   cu_die;
39205872bbf2SRichard Henderson         uint16_t  cu_lang;
39215872bbf2SRichard Henderson         uintptr_t cu_low_pc;
39225872bbf2SRichard Henderson         uintptr_t cu_high_pc;
39235872bbf2SRichard Henderson         uint8_t   fn_die;
39245872bbf2SRichard Henderson         char      fn_name[16];
39255872bbf2SRichard Henderson         uintptr_t fn_low_pc;
39265872bbf2SRichard Henderson         uintptr_t fn_high_pc;
39275872bbf2SRichard Henderson         uint8_t   cu_eoc;
39285872bbf2SRichard Henderson     };
3929813da627SRichard Henderson 
3930813da627SRichard Henderson     struct ElfImage {
3931813da627SRichard Henderson         ElfW(Ehdr) ehdr;
3932813da627SRichard Henderson         ElfW(Phdr) phdr;
39335872bbf2SRichard Henderson         ElfW(Shdr) shdr[7];
39345872bbf2SRichard Henderson         ElfW(Sym)  sym[2];
39355872bbf2SRichard Henderson         struct DebugInfo di;
39365872bbf2SRichard Henderson         uint8_t    da[24];
39375872bbf2SRichard Henderson         char       str[80];
39385872bbf2SRichard Henderson     };
39395872bbf2SRichard Henderson 
39405872bbf2SRichard Henderson     struct ElfImage *img;
39415872bbf2SRichard Henderson 
39425872bbf2SRichard Henderson     static const struct ElfImage img_template = {
39435872bbf2SRichard Henderson         .ehdr = {
39445872bbf2SRichard Henderson             .e_ident[EI_MAG0] = ELFMAG0,
39455872bbf2SRichard Henderson             .e_ident[EI_MAG1] = ELFMAG1,
39465872bbf2SRichard Henderson             .e_ident[EI_MAG2] = ELFMAG2,
39475872bbf2SRichard Henderson             .e_ident[EI_MAG3] = ELFMAG3,
39485872bbf2SRichard Henderson             .e_ident[EI_CLASS] = ELF_CLASS,
39495872bbf2SRichard Henderson             .e_ident[EI_DATA] = ELF_DATA,
39505872bbf2SRichard Henderson             .e_ident[EI_VERSION] = EV_CURRENT,
39515872bbf2SRichard Henderson             .e_type = ET_EXEC,
39525872bbf2SRichard Henderson             .e_machine = ELF_HOST_MACHINE,
39535872bbf2SRichard Henderson             .e_version = EV_CURRENT,
39545872bbf2SRichard Henderson             .e_phoff = offsetof(struct ElfImage, phdr),
39555872bbf2SRichard Henderson             .e_shoff = offsetof(struct ElfImage, shdr),
39565872bbf2SRichard Henderson             .e_ehsize = sizeof(ElfW(Shdr)),
39575872bbf2SRichard Henderson             .e_phentsize = sizeof(ElfW(Phdr)),
39585872bbf2SRichard Henderson             .e_phnum = 1,
39595872bbf2SRichard Henderson             .e_shentsize = sizeof(ElfW(Shdr)),
39605872bbf2SRichard Henderson             .e_shnum = ARRAY_SIZE(img->shdr),
39615872bbf2SRichard Henderson             .e_shstrndx = ARRAY_SIZE(img->shdr) - 1,
3962abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS
3963abbb3eaeSRichard Henderson             .e_flags = ELF_HOST_FLAGS,
3964abbb3eaeSRichard Henderson #endif
3965abbb3eaeSRichard Henderson #ifdef ELF_OSABI
3966abbb3eaeSRichard Henderson             .e_ident[EI_OSABI] = ELF_OSABI,
3967abbb3eaeSRichard Henderson #endif
39685872bbf2SRichard Henderson         },
39695872bbf2SRichard Henderson         .phdr = {
39705872bbf2SRichard Henderson             .p_type = PT_LOAD,
39715872bbf2SRichard Henderson             .p_flags = PF_X,
39725872bbf2SRichard Henderson         },
39735872bbf2SRichard Henderson         .shdr = {
39745872bbf2SRichard Henderson             [0] = { .sh_type = SHT_NULL },
39755872bbf2SRichard Henderson             /* Trick: The contents of code_gen_buffer are not present in
39765872bbf2SRichard Henderson                this fake ELF file; that got allocated elsewhere.  Therefore
39775872bbf2SRichard Henderson                we mark .text as SHT_NOBITS (similar to .bss) so that readers
39785872bbf2SRichard Henderson                will not look for contents.  We can record any address.  */
39795872bbf2SRichard Henderson             [1] = { /* .text */
39805872bbf2SRichard Henderson                 .sh_type = SHT_NOBITS,
39815872bbf2SRichard Henderson                 .sh_flags = SHF_EXECINSTR | SHF_ALLOC,
39825872bbf2SRichard Henderson             },
39835872bbf2SRichard Henderson             [2] = { /* .debug_info */
39845872bbf2SRichard Henderson                 .sh_type = SHT_PROGBITS,
39855872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, di),
39865872bbf2SRichard Henderson                 .sh_size = sizeof(struct DebugInfo),
39875872bbf2SRichard Henderson             },
39885872bbf2SRichard Henderson             [3] = { /* .debug_abbrev */
39895872bbf2SRichard Henderson                 .sh_type = SHT_PROGBITS,
39905872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, da),
39915872bbf2SRichard Henderson                 .sh_size = sizeof(img->da),
39925872bbf2SRichard Henderson             },
39935872bbf2SRichard Henderson             [4] = { /* .debug_frame */
39945872bbf2SRichard Henderson                 .sh_type = SHT_PROGBITS,
39955872bbf2SRichard Henderson                 .sh_offset = sizeof(struct ElfImage),
39965872bbf2SRichard Henderson             },
39975872bbf2SRichard Henderson             [5] = { /* .symtab */
39985872bbf2SRichard Henderson                 .sh_type = SHT_SYMTAB,
39995872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, sym),
40005872bbf2SRichard Henderson                 .sh_size = sizeof(img->sym),
40015872bbf2SRichard Henderson                 .sh_info = 1,
40025872bbf2SRichard Henderson                 .sh_link = ARRAY_SIZE(img->shdr) - 1,
40035872bbf2SRichard Henderson                 .sh_entsize = sizeof(ElfW(Sym)),
40045872bbf2SRichard Henderson             },
40055872bbf2SRichard Henderson             [6] = { /* .strtab */
40065872bbf2SRichard Henderson                 .sh_type = SHT_STRTAB,
40075872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, str),
40085872bbf2SRichard Henderson                 .sh_size = sizeof(img->str),
40095872bbf2SRichard Henderson             }
40105872bbf2SRichard Henderson         },
40115872bbf2SRichard Henderson         .sym = {
40125872bbf2SRichard Henderson             [1] = { /* code_gen_buffer */
40135872bbf2SRichard Henderson                 .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC),
40145872bbf2SRichard Henderson                 .st_shndx = 1,
40155872bbf2SRichard Henderson             }
40165872bbf2SRichard Henderson         },
40175872bbf2SRichard Henderson         .di = {
40185872bbf2SRichard Henderson             .len = sizeof(struct DebugInfo) - 4,
40195872bbf2SRichard Henderson             .version = 2,
40205872bbf2SRichard Henderson             .ptr_size = sizeof(void *),
40215872bbf2SRichard Henderson             .cu_die = 1,
40225872bbf2SRichard Henderson             .cu_lang = 0x8001,  /* DW_LANG_Mips_Assembler */
40235872bbf2SRichard Henderson             .fn_die = 2,
40245872bbf2SRichard Henderson             .fn_name = "code_gen_buffer"
40255872bbf2SRichard Henderson         },
40265872bbf2SRichard Henderson         .da = {
40275872bbf2SRichard Henderson             1,          /* abbrev number (the cu) */
40285872bbf2SRichard Henderson             0x11, 1,    /* DW_TAG_compile_unit, has children */
40295872bbf2SRichard Henderson             0x13, 0x5,  /* DW_AT_language, DW_FORM_data2 */
40305872bbf2SRichard Henderson             0x11, 0x1,  /* DW_AT_low_pc, DW_FORM_addr */
40315872bbf2SRichard Henderson             0x12, 0x1,  /* DW_AT_high_pc, DW_FORM_addr */
40325872bbf2SRichard Henderson             0, 0,       /* end of abbrev */
40335872bbf2SRichard Henderson             2,          /* abbrev number (the fn) */
40345872bbf2SRichard Henderson             0x2e, 0,    /* DW_TAG_subprogram, no children */
40355872bbf2SRichard Henderson             0x3, 0x8,   /* DW_AT_name, DW_FORM_string */
40365872bbf2SRichard Henderson             0x11, 0x1,  /* DW_AT_low_pc, DW_FORM_addr */
40375872bbf2SRichard Henderson             0x12, 0x1,  /* DW_AT_high_pc, DW_FORM_addr */
40385872bbf2SRichard Henderson             0, 0,       /* end of abbrev */
40395872bbf2SRichard Henderson             0           /* no more abbrev */
40405872bbf2SRichard Henderson         },
40415872bbf2SRichard Henderson         .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0"
40425872bbf2SRichard Henderson                ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer",
4043813da627SRichard Henderson     };
4044813da627SRichard Henderson 
4045813da627SRichard Henderson     /* We only need a single jit entry; statically allocate it.  */
4046813da627SRichard Henderson     static struct jit_code_entry one_entry;
4047813da627SRichard Henderson 
40485872bbf2SRichard Henderson     uintptr_t buf = (uintptr_t)buf_ptr;
4049813da627SRichard Henderson     size_t img_size = sizeof(struct ElfImage) + debug_frame_size;
40502c90784aSRichard Henderson     DebugFrameHeader *dfh;
4051813da627SRichard Henderson 
40525872bbf2SRichard Henderson     img = g_malloc(img_size);
40535872bbf2SRichard Henderson     *img = img_template;
4054813da627SRichard Henderson 
40555872bbf2SRichard Henderson     img->phdr.p_vaddr = buf;
40565872bbf2SRichard Henderson     img->phdr.p_paddr = buf;
40575872bbf2SRichard Henderson     img->phdr.p_memsz = buf_size;
4058813da627SRichard Henderson 
40595872bbf2SRichard Henderson     img->shdr[1].sh_name = find_string(img->str, ".text");
40605872bbf2SRichard Henderson     img->shdr[1].sh_addr = buf;
40615872bbf2SRichard Henderson     img->shdr[1].sh_size = buf_size;
4062813da627SRichard Henderson 
40635872bbf2SRichard Henderson     img->shdr[2].sh_name = find_string(img->str, ".debug_info");
40645872bbf2SRichard Henderson     img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev");
40655872bbf2SRichard Henderson 
40665872bbf2SRichard Henderson     img->shdr[4].sh_name = find_string(img->str, ".debug_frame");
40675872bbf2SRichard Henderson     img->shdr[4].sh_size = debug_frame_size;
40685872bbf2SRichard Henderson 
40695872bbf2SRichard Henderson     img->shdr[5].sh_name = find_string(img->str, ".symtab");
40705872bbf2SRichard Henderson     img->shdr[6].sh_name = find_string(img->str, ".strtab");
40715872bbf2SRichard Henderson 
40725872bbf2SRichard Henderson     img->sym[1].st_name = find_string(img->str, "code_gen_buffer");
40735872bbf2SRichard Henderson     img->sym[1].st_value = buf;
40745872bbf2SRichard Henderson     img->sym[1].st_size = buf_size;
40755872bbf2SRichard Henderson 
40765872bbf2SRichard Henderson     img->di.cu_low_pc = buf;
407745aba097SRichard Henderson     img->di.cu_high_pc = buf + buf_size;
40785872bbf2SRichard Henderson     img->di.fn_low_pc = buf;
407945aba097SRichard Henderson     img->di.fn_high_pc = buf + buf_size;
4080813da627SRichard Henderson 
40812c90784aSRichard Henderson     dfh = (DebugFrameHeader *)(img + 1);
40822c90784aSRichard Henderson     memcpy(dfh, debug_frame, debug_frame_size);
40832c90784aSRichard Henderson     dfh->fde.func_start = buf;
40842c90784aSRichard Henderson     dfh->fde.func_len = buf_size;
40852c90784aSRichard Henderson 
4086813da627SRichard Henderson #ifdef DEBUG_JIT
4087813da627SRichard Henderson     /* Enable this block to be able to debug the ELF image file creation.
4088813da627SRichard Henderson        One can use readelf, objdump, or other inspection utilities.  */
4089813da627SRichard Henderson     {
4090813da627SRichard Henderson         FILE *f = fopen("/tmp/qemu.jit", "w+b");
4091813da627SRichard Henderson         if (f) {
40925872bbf2SRichard Henderson             if (fwrite(img, img_size, 1, f) != img_size) {
4093813da627SRichard Henderson                 /* Avoid stupid unused return value warning for fwrite.  */
4094813da627SRichard Henderson             }
4095813da627SRichard Henderson             fclose(f);
4096813da627SRichard Henderson         }
4097813da627SRichard Henderson     }
4098813da627SRichard Henderson #endif
4099813da627SRichard Henderson 
4100813da627SRichard Henderson     one_entry.symfile_addr = img;
4101813da627SRichard Henderson     one_entry.symfile_size = img_size;
4102813da627SRichard Henderson 
4103813da627SRichard Henderson     __jit_debug_descriptor.action_flag = JIT_REGISTER_FN;
4104813da627SRichard Henderson     __jit_debug_descriptor.relevant_entry = &one_entry;
4105813da627SRichard Henderson     __jit_debug_descriptor.first_entry = &one_entry;
4106813da627SRichard Henderson     __jit_debug_register_code();
4107813da627SRichard Henderson }
4108813da627SRichard Henderson #else
41095872bbf2SRichard Henderson /* No support for the feature.  Provide the entry point expected by exec.c,
41105872bbf2SRichard Henderson    and implement the internal function we declared earlier.  */
4111813da627SRichard Henderson 
/*
 * Variant used when ELF_HOST_MACHINE is not defined: nothing is built or
 * registered, and every argument is ignored.
 */
static void tcg_register_jit_int(void *buf, size_t size,
                                 const void *debug_frame,
                                 size_t debug_frame_size)
{
    /* Intentionally empty.  */
}
4117813da627SRichard Henderson 
/*
 * Entry point provided when ELF_HOST_MACHINE is not defined; it does
 * nothing with @buf or @buf_size.
 */
void tcg_register_jit(void *buf, size_t buf_size)
{
    /* Intentionally empty.  */
}
4121813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */
4122db432672SRichard Henderson 
4123db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec
4124db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...)
4125db432672SRichard Henderson {
4126db432672SRichard Henderson     g_assert_not_reached();
4127db432672SRichard Henderson }
4128db432672SRichard Henderson #endif
4129