xref: /qemu/tcg/tcg.c (revision 152c35aab43213335e1ae8b865d259c0222dd110)
1c896fe29Sbellard /*
2c896fe29Sbellard  * Tiny Code Generator for QEMU
3c896fe29Sbellard  *
4c896fe29Sbellard  * Copyright (c) 2008 Fabrice Bellard
5c896fe29Sbellard  *
6c896fe29Sbellard  * Permission is hereby granted, free of charge, to any person obtaining a copy
7c896fe29Sbellard  * of this software and associated documentation files (the "Software"), to deal
8c896fe29Sbellard  * in the Software without restriction, including without limitation the rights
9c896fe29Sbellard  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10c896fe29Sbellard  * copies of the Software, and to permit persons to whom the Software is
11c896fe29Sbellard  * furnished to do so, subject to the following conditions:
12c896fe29Sbellard  *
13c896fe29Sbellard  * The above copyright notice and this permission notice shall be included in
14c896fe29Sbellard  * all copies or substantial portions of the Software.
15c896fe29Sbellard  *
16c896fe29Sbellard  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17c896fe29Sbellard  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18c896fe29Sbellard  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19c896fe29Sbellard  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20c896fe29Sbellard  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21c896fe29Sbellard  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22c896fe29Sbellard  * THE SOFTWARE.
23c896fe29Sbellard  */
24c896fe29Sbellard 
25c896fe29Sbellard /* define it to use liveness analysis (better code) */
268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS
27c896fe29Sbellard 
28757e725bSPeter Maydell #include "qemu/osdep.h"
29cca82982Saurel32 
30813da627SRichard Henderson /* Define to dump the ELF file used to communicate with GDB.  */
31813da627SRichard Henderson #undef DEBUG_JIT
32813da627SRichard Henderson 
3372fd2efbSEmilio G. Cota #include "qemu/error-report.h"
34f348b6d1SVeronia Bahaa #include "qemu/cutils.h"
351de7afc9SPaolo Bonzini #include "qemu/host-utils.h"
361de7afc9SPaolo Bonzini #include "qemu/timer.h"
37c896fe29Sbellard 
38c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU
39c896fe29Sbellard    CPU definitions. Currently they are used for qemu_ld/st
40c896fe29Sbellard    instructions */
41c896fe29Sbellard #define NO_CPU_IO_DEFS
42c896fe29Sbellard #include "cpu.h"
43c896fe29Sbellard 
4463c91552SPaolo Bonzini #include "exec/cpu-common.h"
4563c91552SPaolo Bonzini #include "exec/exec-all.h"
4663c91552SPaolo Bonzini 
47c896fe29Sbellard #include "tcg-op.h"
48813da627SRichard Henderson 
49edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX
50813da627SRichard Henderson # define ELF_CLASS  ELFCLASS32
51edee2579SRichard Henderson #else
52edee2579SRichard Henderson # define ELF_CLASS  ELFCLASS64
53813da627SRichard Henderson #endif
54813da627SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN
55813da627SRichard Henderson # define ELF_DATA   ELFDATA2MSB
56813da627SRichard Henderson #else
57813da627SRichard Henderson # define ELF_DATA   ELFDATA2LSB
58813da627SRichard Henderson #endif
59813da627SRichard Henderson 
60c896fe29Sbellard #include "elf.h"
61508127e2SPaolo Bonzini #include "exec/log.h"
623468b59eSEmilio G. Cota #include "sysemu/sysemu.h"
63c896fe29Sbellard 
64ce151109SPeter Maydell /* Forward declarations for functions defined in tcg-target.inc.c and
65ce151109SPeter Maydell    used here. */
66e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s);
67f69d277eSRichard Henderson static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode);
68e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s);
696ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type,
702ba7fae2SRichard Henderson                         intptr_t value, intptr_t addend);
71c896fe29Sbellard 
72497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts.  */
/*
 * Leading fields of the debug-frame CIE record.  The first member is
 * forced to pointer-size alignment, which also fixes the alignment of
 * the structure as a whole.
 * NOTE(review): field names follow the DWARF .debug_frame CIE layout --
 * confirm against the DWARF specification before changing any of them.
 */
73497a22ebSRichard Henderson typedef struct {
74497a22ebSRichard Henderson     uint32_t len __attribute__((aligned((sizeof(void *)))));
75497a22ebSRichard Henderson     uint32_t id;
76497a22ebSRichard Henderson     uint8_t version;
77497a22ebSRichard Henderson     char augmentation[1];
78497a22ebSRichard Henderson     uint8_t code_align;
79497a22ebSRichard Henderson     uint8_t data_align;
80497a22ebSRichard Henderson     uint8_t return_column;
81497a22ebSRichard Henderson } DebugFrameCIE;
82497a22ebSRichard Henderson 
/*
 * Leading fields of the debug-frame FDE record.  The structure is packed,
 * but its first member is still aligned to pointer size.  func_start and
 * func_len are pointer-sized integers.
 * NOTE(review): presumably func_start/func_len describe the generated-code
 * buffer being registered -- confirm against tcg_register_jit_int().
 */
83497a22ebSRichard Henderson typedef struct QEMU_PACKED {
84497a22ebSRichard Henderson     uint32_t len __attribute__((aligned((sizeof(void *)))));
85497a22ebSRichard Henderson     uint32_t cie_offset;
86edee2579SRichard Henderson     uintptr_t func_start;
87edee2579SRichard Henderson     uintptr_t func_len;
88497a22ebSRichard Henderson } DebugFrameFDEHeader;
89497a22ebSRichard Henderson 
/* A CIE immediately followed by an FDE header, laid out without padding
   inserted by the compiler between members (packed). */
902c90784aSRichard Henderson typedef struct QEMU_PACKED {
912c90784aSRichard Henderson     DebugFrameCIE cie;
922c90784aSRichard Henderson     DebugFrameFDEHeader fde;
932c90784aSRichard Henderson } DebugFrameHeader;
942c90784aSRichard Henderson 
95813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size,
962c90784aSRichard Henderson                                  const void *debug_frame,
972c90784aSRichard Henderson                                  size_t debug_frame_size)
98813da627SRichard Henderson     __attribute__((unused));
99813da627SRichard Henderson 
100ce151109SPeter Maydell /* Forward declarations for functions defined and used in tcg-target.inc.c. */
101069ea736SRichard Henderson static const char *target_parse_constraint(TCGArgConstraint *ct,
102069ea736SRichard Henderson                                            const char *ct_str, TCGType type);
1032a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1,
104a05b5b9bSRichard Henderson                        intptr_t arg2);
1052a534affSRichard Henderson static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg);
106c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type,
1072a534affSRichard Henderson                          TCGReg ret, tcg_target_long arg);
108c0ad3001SStefan Weil static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
109c0ad3001SStefan Weil                        const int *const_args);
110d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec
111d2fd745fSRichard Henderson static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl,
112d2fd745fSRichard Henderson                            unsigned vece, const TCGArg *args,
113d2fd745fSRichard Henderson                            const int *const_args);
114d2fd745fSRichard Henderson #else
/* Stub compiled when TCG_TARGET_MAYBE_vec is zero: it keeps callers
   compiling, and asserts if it is ever actually reached. */
115d2fd745fSRichard Henderson static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl,
116d2fd745fSRichard Henderson                                   unsigned vece, const TCGArg *args,
117d2fd745fSRichard Henderson                                   const int *const_args)
118d2fd745fSRichard Henderson {
119d2fd745fSRichard Henderson     g_assert_not_reached();
120d2fd745fSRichard Henderson }
121d2fd745fSRichard Henderson #endif
1222a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
123a05b5b9bSRichard Henderson                        intptr_t arg2);
12459d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
12559d7c14eSRichard Henderson                         TCGReg base, intptr_t ofs);
126cf066674SRichard Henderson static void tcg_out_call(TCGContext *s, tcg_insn_unit *target);
127f6c6afc1SRichard Henderson static int tcg_target_const_match(tcg_target_long val, TCGType type,
128c0ad3001SStefan Weil                                   const TCGArgConstraint *arg_ct);
129659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS
130659ef5cbSRichard Henderson static bool tcg_out_ldst_finalize(TCGContext *s);
131659ef5cbSRichard Henderson #endif
132c896fe29Sbellard 
133a505785cSEmilio G. Cota #define TCG_HIGHWATER 1024
134a505785cSEmilio G. Cota 
135df2cce29SEmilio G. Cota static TCGContext **tcg_ctxs;
136df2cce29SEmilio G. Cota static unsigned int n_tcg_ctxs;
1371c2adb95SRichard Henderson TCGv_env cpu_env = 0;
138df2cce29SEmilio G. Cota 
/*
 * Per-region index of translation blocks.  @tree is a GTree ordered by
 * tb_tc_cmp(); every access to it in this file is made with @lock held.
 */
139be2cdc5eSEmilio G. Cota struct tcg_region_tree {
140be2cdc5eSEmilio G. Cota     QemuMutex lock;
141be2cdc5eSEmilio G. Cota     GTree *tree;
142be2cdc5eSEmilio G. Cota     /* padding to avoid false sharing is computed at run-time */
143be2cdc5eSEmilio G. Cota };
144be2cdc5eSEmilio G. Cota 
145e8feb96fSEmilio G. Cota /*
146e8feb96fSEmilio G. Cota  * We divide code_gen_buffer into equally-sized "regions" that TCG threads
147e8feb96fSEmilio G. Cota  * dynamically allocate from as demand dictates. Given appropriate region
148e8feb96fSEmilio G. Cota  * sizing, this minimizes flushes even when some TCG threads generate a lot
149e8feb96fSEmilio G. Cota  * more code than others.
150e8feb96fSEmilio G. Cota  */
/*
 * Global bookkeeping for the region partitioning of code_gen_buffer.
 * Region i nominally spans [start_aligned + i * stride,
 * start_aligned + i * stride + size); the first region instead begins at
 * @start and the last one instead ends at @end (see tcg_region_bounds()).
 */
151e8feb96fSEmilio G. Cota struct tcg_region_state {
152e8feb96fSEmilio G. Cota     QemuMutex lock;
153e8feb96fSEmilio G. Cota 
154e8feb96fSEmilio G. Cota     /* fields set at init time */
155e8feb96fSEmilio G. Cota     void *start;
156e8feb96fSEmilio G. Cota     void *start_aligned;
157e8feb96fSEmilio G. Cota     void *end;
    /* number of regions */
158e8feb96fSEmilio G. Cota     size_t n;
159e8feb96fSEmilio G. Cota     size_t size; /* size of one region */
160e8feb96fSEmilio G. Cota     size_t stride; /* .size + guard size */
161e8feb96fSEmilio G. Cota 
162e8feb96fSEmilio G. Cota     /* fields protected by the lock */
163e8feb96fSEmilio G. Cota     size_t current; /* current region index */
164e8feb96fSEmilio G. Cota     size_t agg_size_full; /* aggregate size of full regions */
165e8feb96fSEmilio G. Cota };
166e8feb96fSEmilio G. Cota 
167e8feb96fSEmilio G. Cota static struct tcg_region_state region;
168be2cdc5eSEmilio G. Cota /*
169be2cdc5eSEmilio G. Cota  * This is an array of struct tcg_region_tree's, with padding.
170be2cdc5eSEmilio G. Cota  * We use void * to simplify the computation of region_trees[i]; each
171be2cdc5eSEmilio G. Cota  * struct is found every tree_size bytes.
172be2cdc5eSEmilio G. Cota  */
173be2cdc5eSEmilio G. Cota static void *region_trees;
174be2cdc5eSEmilio G. Cota static size_t tree_size;
175d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT];
176b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs;
177c896fe29Sbellard 
1781813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1
1794196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v)
180c896fe29Sbellard {
181c896fe29Sbellard     *s->code_ptr++ = v;
182c896fe29Sbellard }
183c896fe29Sbellard 
1844196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p,
1854196dca6SPeter Maydell                                                       uint8_t v)
1865c53bb81SPeter Maydell {
1871813e175SRichard Henderson     *p = v;
1885c53bb81SPeter Maydell }
1891813e175SRichard Henderson #endif
1905c53bb81SPeter Maydell 
1911813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2
1924196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v)
193c896fe29Sbellard {
1941813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 2) {
1951813e175SRichard Henderson         *s->code_ptr++ = v;
1961813e175SRichard Henderson     } else {
1971813e175SRichard Henderson         tcg_insn_unit *p = s->code_ptr;
1984387345aSPeter Maydell         memcpy(p, &v, sizeof(v));
1991813e175SRichard Henderson         s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE);
2001813e175SRichard Henderson     }
201c896fe29Sbellard }
202c896fe29Sbellard 
2034196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p,
2044196dca6SPeter Maydell                                                        uint16_t v)
2055c53bb81SPeter Maydell {
2061813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 2) {
2071813e175SRichard Henderson         *p = v;
2081813e175SRichard Henderson     } else {
2095c53bb81SPeter Maydell         memcpy(p, &v, sizeof(v));
2105c53bb81SPeter Maydell     }
2111813e175SRichard Henderson }
2121813e175SRichard Henderson #endif
2135c53bb81SPeter Maydell 
2141813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4
2154196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v)
216c896fe29Sbellard {
2171813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 4) {
2181813e175SRichard Henderson         *s->code_ptr++ = v;
2191813e175SRichard Henderson     } else {
2201813e175SRichard Henderson         tcg_insn_unit *p = s->code_ptr;
2214387345aSPeter Maydell         memcpy(p, &v, sizeof(v));
2221813e175SRichard Henderson         s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE);
2231813e175SRichard Henderson     }
224c896fe29Sbellard }
225c896fe29Sbellard 
2264196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p,
2274196dca6SPeter Maydell                                                        uint32_t v)
2285c53bb81SPeter Maydell {
2291813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 4) {
2301813e175SRichard Henderson         *p = v;
2311813e175SRichard Henderson     } else {
2325c53bb81SPeter Maydell         memcpy(p, &v, sizeof(v));
2335c53bb81SPeter Maydell     }
2341813e175SRichard Henderson }
2351813e175SRichard Henderson #endif
2365c53bb81SPeter Maydell 
2371813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8
2384196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v)
239ac26eb69SRichard Henderson {
2401813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 8) {
2411813e175SRichard Henderson         *s->code_ptr++ = v;
2421813e175SRichard Henderson     } else {
2431813e175SRichard Henderson         tcg_insn_unit *p = s->code_ptr;
2444387345aSPeter Maydell         memcpy(p, &v, sizeof(v));
2451813e175SRichard Henderson         s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE);
2461813e175SRichard Henderson     }
247ac26eb69SRichard Henderson }
248ac26eb69SRichard Henderson 
2494196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p,
2504196dca6SPeter Maydell                                                        uint64_t v)
2515c53bb81SPeter Maydell {
2521813e175SRichard Henderson     if (TCG_TARGET_INSN_UNIT_SIZE == 8) {
2531813e175SRichard Henderson         *p = v;
2541813e175SRichard Henderson     } else {
2555c53bb81SPeter Maydell         memcpy(p, &v, sizeof(v));
2565c53bb81SPeter Maydell     }
2571813e175SRichard Henderson }
2581813e175SRichard Henderson #endif
2595c53bb81SPeter Maydell 
260c896fe29Sbellard /* label relocation processing */
261c896fe29Sbellard 
2621813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type,
263bec16311SRichard Henderson                           TCGLabel *l, intptr_t addend)
264c896fe29Sbellard {
265c896fe29Sbellard     TCGRelocation *r;
266c896fe29Sbellard 
267c896fe29Sbellard     if (l->has_value) {
268623e265cSpbrook         /* FIXME: This may break relocations on RISC targets that
269623e265cSpbrook            modify instruction fields in place.  The caller may not have
270623e265cSpbrook            written the initial value.  */
2716ac17786SRichard Henderson         bool ok = patch_reloc(code_ptr, type, l->u.value, addend);
2726ac17786SRichard Henderson         tcg_debug_assert(ok);
273c896fe29Sbellard     } else {
274c896fe29Sbellard         /* add a new relocation entry */
275c896fe29Sbellard         r = tcg_malloc(sizeof(TCGRelocation));
276c896fe29Sbellard         r->type = type;
277c896fe29Sbellard         r->ptr = code_ptr;
278c896fe29Sbellard         r->addend = addend;
279c896fe29Sbellard         r->next = l->u.first_reloc;
280c896fe29Sbellard         l->u.first_reloc = r;
281c896fe29Sbellard     }
282c896fe29Sbellard }
283c896fe29Sbellard 
284bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr)
285c896fe29Sbellard {
2862ba7fae2SRichard Henderson     intptr_t value = (intptr_t)ptr;
2871813e175SRichard Henderson     TCGRelocation *r;
288c896fe29Sbellard 
289eabb7b91SAurelien Jarno     tcg_debug_assert(!l->has_value);
2901813e175SRichard Henderson 
2911813e175SRichard Henderson     for (r = l->u.first_reloc; r != NULL; r = r->next) {
2926ac17786SRichard Henderson         bool ok = patch_reloc(r->ptr, r->type, value, r->addend);
2936ac17786SRichard Henderson         tcg_debug_assert(ok);
294c896fe29Sbellard     }
2951813e175SRichard Henderson 
296c896fe29Sbellard     l->has_value = 1;
2971813e175SRichard Henderson     l->u.value_ptr = ptr;
298c896fe29Sbellard }
299c896fe29Sbellard 
30042a268c2SRichard Henderson TCGLabel *gen_new_label(void)
301c896fe29Sbellard {
302b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
30351e3972cSRichard Henderson     TCGLabel *l = tcg_malloc(sizeof(TCGLabel));
304c896fe29Sbellard 
30551e3972cSRichard Henderson     *l = (TCGLabel){
30651e3972cSRichard Henderson         .id = s->nb_labels++
30751e3972cSRichard Henderson     };
30842a268c2SRichard Henderson 
30942a268c2SRichard Henderson     return l;
310c896fe29Sbellard }
311c896fe29Sbellard 
3129f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which)
3139f754620SRichard Henderson {
3149f754620SRichard Henderson     size_t off = tcg_current_code_size(s);
3159f754620SRichard Henderson     s->tb_jmp_reset_offset[which] = off;
3169f754620SRichard Henderson     /* Make sure that we didn't overflow the stored offset.  */
3179f754620SRichard Henderson     assert(s->tb_jmp_reset_offset[which] == off);
3189f754620SRichard Henderson }
3199f754620SRichard Henderson 
320ce151109SPeter Maydell #include "tcg-target.inc.c"
321c896fe29Sbellard 
322be2cdc5eSEmilio G. Cota /* compare a pointer @ptr and a tb_tc @s */
323be2cdc5eSEmilio G. Cota static int ptr_cmp_tb_tc(const void *ptr, const struct tb_tc *s)
324be2cdc5eSEmilio G. Cota {
325be2cdc5eSEmilio G. Cota     if (ptr >= s->ptr + s->size) {
326be2cdc5eSEmilio G. Cota         return 1;
327be2cdc5eSEmilio G. Cota     } else if (ptr < s->ptr) {
328be2cdc5eSEmilio G. Cota         return -1;
329be2cdc5eSEmilio G. Cota     }
330be2cdc5eSEmilio G. Cota     return 0;
331be2cdc5eSEmilio G. Cota }
332be2cdc5eSEmilio G. Cota 
333be2cdc5eSEmilio G. Cota static gint tb_tc_cmp(gconstpointer ap, gconstpointer bp)
334be2cdc5eSEmilio G. Cota {
335be2cdc5eSEmilio G. Cota     const struct tb_tc *a = ap;
336be2cdc5eSEmilio G. Cota     const struct tb_tc *b = bp;
337be2cdc5eSEmilio G. Cota 
338be2cdc5eSEmilio G. Cota     /*
339be2cdc5eSEmilio G. Cota      * When both sizes are set, we know this isn't a lookup.
340be2cdc5eSEmilio G. Cota      * This is the most likely case: every TB must be inserted; lookups
341be2cdc5eSEmilio G. Cota      * are a lot less frequent.
342be2cdc5eSEmilio G. Cota      */
343be2cdc5eSEmilio G. Cota     if (likely(a->size && b->size)) {
344be2cdc5eSEmilio G. Cota         if (a->ptr > b->ptr) {
345be2cdc5eSEmilio G. Cota             return 1;
346be2cdc5eSEmilio G. Cota         } else if (a->ptr < b->ptr) {
347be2cdc5eSEmilio G. Cota             return -1;
348be2cdc5eSEmilio G. Cota         }
349be2cdc5eSEmilio G. Cota         /* a->ptr == b->ptr should happen only on deletions */
350be2cdc5eSEmilio G. Cota         g_assert(a->size == b->size);
351be2cdc5eSEmilio G. Cota         return 0;
352be2cdc5eSEmilio G. Cota     }
353be2cdc5eSEmilio G. Cota     /*
354be2cdc5eSEmilio G. Cota      * All lookups have either .size field set to 0.
355be2cdc5eSEmilio G. Cota      * From the glib sources we see that @ap is always the lookup key. However
356be2cdc5eSEmilio G. Cota      * the docs provide no guarantee, so we just mark this case as likely.
357be2cdc5eSEmilio G. Cota      */
358be2cdc5eSEmilio G. Cota     if (likely(a->size == 0)) {
359be2cdc5eSEmilio G. Cota         return ptr_cmp_tb_tc(a->ptr, b);
360be2cdc5eSEmilio G. Cota     }
361be2cdc5eSEmilio G. Cota     return ptr_cmp_tb_tc(b->ptr, a);
362be2cdc5eSEmilio G. Cota }
363be2cdc5eSEmilio G. Cota 
364be2cdc5eSEmilio G. Cota static void tcg_region_trees_init(void)
365be2cdc5eSEmilio G. Cota {
366be2cdc5eSEmilio G. Cota     size_t i;
367be2cdc5eSEmilio G. Cota 
368be2cdc5eSEmilio G. Cota     tree_size = ROUND_UP(sizeof(struct tcg_region_tree), qemu_dcache_linesize);
369be2cdc5eSEmilio G. Cota     region_trees = qemu_memalign(qemu_dcache_linesize, region.n * tree_size);
370be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
371be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
372be2cdc5eSEmilio G. Cota 
373be2cdc5eSEmilio G. Cota         qemu_mutex_init(&rt->lock);
374be2cdc5eSEmilio G. Cota         rt->tree = g_tree_new(tb_tc_cmp);
375be2cdc5eSEmilio G. Cota     }
376be2cdc5eSEmilio G. Cota }
377be2cdc5eSEmilio G. Cota 
378be2cdc5eSEmilio G. Cota static struct tcg_region_tree *tc_ptr_to_region_tree(void *p)
379be2cdc5eSEmilio G. Cota {
380be2cdc5eSEmilio G. Cota     size_t region_idx;
381be2cdc5eSEmilio G. Cota 
382be2cdc5eSEmilio G. Cota     if (p < region.start_aligned) {
383be2cdc5eSEmilio G. Cota         region_idx = 0;
384be2cdc5eSEmilio G. Cota     } else {
385be2cdc5eSEmilio G. Cota         ptrdiff_t offset = p - region.start_aligned;
386be2cdc5eSEmilio G. Cota 
387be2cdc5eSEmilio G. Cota         if (offset > region.stride * (region.n - 1)) {
388be2cdc5eSEmilio G. Cota             region_idx = region.n - 1;
389be2cdc5eSEmilio G. Cota         } else {
390be2cdc5eSEmilio G. Cota             region_idx = offset / region.stride;
391be2cdc5eSEmilio G. Cota         }
392be2cdc5eSEmilio G. Cota     }
393be2cdc5eSEmilio G. Cota     return region_trees + region_idx * tree_size;
394be2cdc5eSEmilio G. Cota }
395be2cdc5eSEmilio G. Cota 
396be2cdc5eSEmilio G. Cota void tcg_tb_insert(TranslationBlock *tb)
397be2cdc5eSEmilio G. Cota {
398be2cdc5eSEmilio G. Cota     struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr);
399be2cdc5eSEmilio G. Cota 
400be2cdc5eSEmilio G. Cota     qemu_mutex_lock(&rt->lock);
401be2cdc5eSEmilio G. Cota     g_tree_insert(rt->tree, &tb->tc, tb);
402be2cdc5eSEmilio G. Cota     qemu_mutex_unlock(&rt->lock);
403be2cdc5eSEmilio G. Cota }
404be2cdc5eSEmilio G. Cota 
405be2cdc5eSEmilio G. Cota void tcg_tb_remove(TranslationBlock *tb)
406be2cdc5eSEmilio G. Cota {
407be2cdc5eSEmilio G. Cota     struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr);
408be2cdc5eSEmilio G. Cota 
409be2cdc5eSEmilio G. Cota     qemu_mutex_lock(&rt->lock);
410be2cdc5eSEmilio G. Cota     g_tree_remove(rt->tree, &tb->tc);
411be2cdc5eSEmilio G. Cota     qemu_mutex_unlock(&rt->lock);
412be2cdc5eSEmilio G. Cota }
413be2cdc5eSEmilio G. Cota 
414be2cdc5eSEmilio G. Cota /*
415be2cdc5eSEmilio G. Cota  * Find the TB 'tb' such that
416be2cdc5eSEmilio G. Cota  * tb->tc.ptr <= tc_ptr < tb->tc.ptr + tb->tc.size
417be2cdc5eSEmilio G. Cota  * Return NULL if not found.
418be2cdc5eSEmilio G. Cota  */
419be2cdc5eSEmilio G. Cota TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr)
420be2cdc5eSEmilio G. Cota {
421be2cdc5eSEmilio G. Cota     struct tcg_region_tree *rt = tc_ptr_to_region_tree((void *)tc_ptr);
422be2cdc5eSEmilio G. Cota     TranslationBlock *tb;
423be2cdc5eSEmilio G. Cota     struct tb_tc s = { .ptr = (void *)tc_ptr };
424be2cdc5eSEmilio G. Cota 
425be2cdc5eSEmilio G. Cota     qemu_mutex_lock(&rt->lock);
426be2cdc5eSEmilio G. Cota     tb = g_tree_lookup(rt->tree, &s);
427be2cdc5eSEmilio G. Cota     qemu_mutex_unlock(&rt->lock);
428be2cdc5eSEmilio G. Cota     return tb;
429be2cdc5eSEmilio G. Cota }
430be2cdc5eSEmilio G. Cota 
431be2cdc5eSEmilio G. Cota static void tcg_region_tree_lock_all(void)
432be2cdc5eSEmilio G. Cota {
433be2cdc5eSEmilio G. Cota     size_t i;
434be2cdc5eSEmilio G. Cota 
435be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
436be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
437be2cdc5eSEmilio G. Cota 
438be2cdc5eSEmilio G. Cota         qemu_mutex_lock(&rt->lock);
439be2cdc5eSEmilio G. Cota     }
440be2cdc5eSEmilio G. Cota }
441be2cdc5eSEmilio G. Cota 
442be2cdc5eSEmilio G. Cota static void tcg_region_tree_unlock_all(void)
443be2cdc5eSEmilio G. Cota {
444be2cdc5eSEmilio G. Cota     size_t i;
445be2cdc5eSEmilio G. Cota 
446be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
447be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
448be2cdc5eSEmilio G. Cota 
449be2cdc5eSEmilio G. Cota         qemu_mutex_unlock(&rt->lock);
450be2cdc5eSEmilio G. Cota     }
451be2cdc5eSEmilio G. Cota }
452be2cdc5eSEmilio G. Cota 
453be2cdc5eSEmilio G. Cota void tcg_tb_foreach(GTraverseFunc func, gpointer user_data)
454be2cdc5eSEmilio G. Cota {
455be2cdc5eSEmilio G. Cota     size_t i;
456be2cdc5eSEmilio G. Cota 
457be2cdc5eSEmilio G. Cota     tcg_region_tree_lock_all();
458be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
459be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
460be2cdc5eSEmilio G. Cota 
461be2cdc5eSEmilio G. Cota         g_tree_foreach(rt->tree, func, user_data);
462be2cdc5eSEmilio G. Cota     }
463be2cdc5eSEmilio G. Cota     tcg_region_tree_unlock_all();
464be2cdc5eSEmilio G. Cota }
465be2cdc5eSEmilio G. Cota 
466be2cdc5eSEmilio G. Cota size_t tcg_nb_tbs(void)
467be2cdc5eSEmilio G. Cota {
468be2cdc5eSEmilio G. Cota     size_t nb_tbs = 0;
469be2cdc5eSEmilio G. Cota     size_t i;
470be2cdc5eSEmilio G. Cota 
471be2cdc5eSEmilio G. Cota     tcg_region_tree_lock_all();
472be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
473be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
474be2cdc5eSEmilio G. Cota 
475be2cdc5eSEmilio G. Cota         nb_tbs += g_tree_nnodes(rt->tree);
476be2cdc5eSEmilio G. Cota     }
477be2cdc5eSEmilio G. Cota     tcg_region_tree_unlock_all();
478be2cdc5eSEmilio G. Cota     return nb_tbs;
479be2cdc5eSEmilio G. Cota }
480be2cdc5eSEmilio G. Cota 
481be2cdc5eSEmilio G. Cota static void tcg_region_tree_reset_all(void)
482be2cdc5eSEmilio G. Cota {
483be2cdc5eSEmilio G. Cota     size_t i;
484be2cdc5eSEmilio G. Cota 
485be2cdc5eSEmilio G. Cota     tcg_region_tree_lock_all();
486be2cdc5eSEmilio G. Cota     for (i = 0; i < region.n; i++) {
487be2cdc5eSEmilio G. Cota         struct tcg_region_tree *rt = region_trees + i * tree_size;
488be2cdc5eSEmilio G. Cota 
489be2cdc5eSEmilio G. Cota         /* Increment the refcount first so that destroy acts as a reset */
490be2cdc5eSEmilio G. Cota         g_tree_ref(rt->tree);
491be2cdc5eSEmilio G. Cota         g_tree_destroy(rt->tree);
492be2cdc5eSEmilio G. Cota     }
493be2cdc5eSEmilio G. Cota     tcg_region_tree_unlock_all();
494be2cdc5eSEmilio G. Cota }
495be2cdc5eSEmilio G. Cota 
496e8feb96fSEmilio G. Cota static void tcg_region_bounds(size_t curr_region, void **pstart, void **pend)
497e8feb96fSEmilio G. Cota {
498e8feb96fSEmilio G. Cota     void *start, *end;
499e8feb96fSEmilio G. Cota 
500e8feb96fSEmilio G. Cota     start = region.start_aligned + curr_region * region.stride;
501e8feb96fSEmilio G. Cota     end = start + region.size;
502e8feb96fSEmilio G. Cota 
503e8feb96fSEmilio G. Cota     if (curr_region == 0) {
504e8feb96fSEmilio G. Cota         start = region.start;
505e8feb96fSEmilio G. Cota     }
506e8feb96fSEmilio G. Cota     if (curr_region == region.n - 1) {
507e8feb96fSEmilio G. Cota         end = region.end;
508e8feb96fSEmilio G. Cota     }
509e8feb96fSEmilio G. Cota 
510e8feb96fSEmilio G. Cota     *pstart = start;
511e8feb96fSEmilio G. Cota     *pend = end;
512e8feb96fSEmilio G. Cota }
513e8feb96fSEmilio G. Cota 
514e8feb96fSEmilio G. Cota static void tcg_region_assign(TCGContext *s, size_t curr_region)
515e8feb96fSEmilio G. Cota {
516e8feb96fSEmilio G. Cota     void *start, *end;
517e8feb96fSEmilio G. Cota 
518e8feb96fSEmilio G. Cota     tcg_region_bounds(curr_region, &start, &end);
519e8feb96fSEmilio G. Cota 
520e8feb96fSEmilio G. Cota     s->code_gen_buffer = start;
521e8feb96fSEmilio G. Cota     s->code_gen_ptr = start;
522e8feb96fSEmilio G. Cota     s->code_gen_buffer_size = end - start;
523e8feb96fSEmilio G. Cota     s->code_gen_highwater = end - TCG_HIGHWATER;
524e8feb96fSEmilio G. Cota }
525e8feb96fSEmilio G. Cota 
526e8feb96fSEmilio G. Cota static bool tcg_region_alloc__locked(TCGContext *s)
527e8feb96fSEmilio G. Cota {
528e8feb96fSEmilio G. Cota     if (region.current == region.n) {
529e8feb96fSEmilio G. Cota         return true;
530e8feb96fSEmilio G. Cota     }
531e8feb96fSEmilio G. Cota     tcg_region_assign(s, region.current);
532e8feb96fSEmilio G. Cota     region.current++;
533e8feb96fSEmilio G. Cota     return false;
534e8feb96fSEmilio G. Cota }
535e8feb96fSEmilio G. Cota 
536e8feb96fSEmilio G. Cota /*
537e8feb96fSEmilio G. Cota  * Request a new region once the one in use has filled up.
538e8feb96fSEmilio G. Cota  * Returns true on error.
539e8feb96fSEmilio G. Cota  */
540e8feb96fSEmilio G. Cota static bool tcg_region_alloc(TCGContext *s)
541e8feb96fSEmilio G. Cota {
542e8feb96fSEmilio G. Cota     bool err;
543e8feb96fSEmilio G. Cota     /* read the region size now; alloc__locked will overwrite it on success */
544e8feb96fSEmilio G. Cota     size_t size_full = s->code_gen_buffer_size;
545e8feb96fSEmilio G. Cota 
546e8feb96fSEmilio G. Cota     qemu_mutex_lock(&region.lock);
547e8feb96fSEmilio G. Cota     err = tcg_region_alloc__locked(s);
548e8feb96fSEmilio G. Cota     if (!err) {
549e8feb96fSEmilio G. Cota         region.agg_size_full += size_full - TCG_HIGHWATER;
550e8feb96fSEmilio G. Cota     }
551e8feb96fSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
552e8feb96fSEmilio G. Cota     return err;
553e8feb96fSEmilio G. Cota }
554e8feb96fSEmilio G. Cota 
555e8feb96fSEmilio G. Cota /*
556e8feb96fSEmilio G. Cota  * Perform a context's first region allocation.
557e8feb96fSEmilio G. Cota  * This function does _not_ increment region.agg_size_full.
558e8feb96fSEmilio G. Cota  */
559e8feb96fSEmilio G. Cota static inline bool tcg_region_initial_alloc__locked(TCGContext *s)
560e8feb96fSEmilio G. Cota {
561e8feb96fSEmilio G. Cota     return tcg_region_alloc__locked(s);
562e8feb96fSEmilio G. Cota }
563e8feb96fSEmilio G. Cota 
564e8feb96fSEmilio G. Cota /* Call from a safe-work context */
565e8feb96fSEmilio G. Cota void tcg_region_reset_all(void)
566e8feb96fSEmilio G. Cota {
5673468b59eSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
568e8feb96fSEmilio G. Cota     unsigned int i;
569e8feb96fSEmilio G. Cota 
570e8feb96fSEmilio G. Cota     qemu_mutex_lock(&region.lock);
571e8feb96fSEmilio G. Cota     region.current = 0;
572e8feb96fSEmilio G. Cota     region.agg_size_full = 0;
573e8feb96fSEmilio G. Cota 
5743468b59eSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
5753468b59eSEmilio G. Cota         TCGContext *s = atomic_read(&tcg_ctxs[i]);
5763468b59eSEmilio G. Cota         bool err = tcg_region_initial_alloc__locked(s);
577e8feb96fSEmilio G. Cota 
578e8feb96fSEmilio G. Cota         g_assert(!err);
579e8feb96fSEmilio G. Cota     }
580e8feb96fSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
581be2cdc5eSEmilio G. Cota 
582be2cdc5eSEmilio G. Cota     tcg_region_tree_reset_all();
583e8feb96fSEmilio G. Cota }
584e8feb96fSEmilio G. Cota 
5853468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
/* CONFIG_USER_ONLY variant: always use a single region. */
5863468b59eSEmilio G. Cota static size_t tcg_n_regions(void)
5873468b59eSEmilio G. Cota {
5883468b59eSEmilio G. Cota     return 1;
5893468b59eSEmilio G. Cota }
5903468b59eSEmilio G. Cota #else
5913468b59eSEmilio G. Cota /*
5923468b59eSEmilio G. Cota  * It is likely that some vCPUs will translate more code than others, so we
5933468b59eSEmilio G. Cota  * first try to set more regions than max_cpus, with those regions being of
5943468b59eSEmilio G. Cota  * reasonable size. If that's not possible we make do by evenly dividing
5953468b59eSEmilio G. Cota  * the code_gen_buffer among the vCPUs.
5963468b59eSEmilio G. Cota  */
5973468b59eSEmilio G. Cota static size_t tcg_n_regions(void)
5983468b59eSEmilio G. Cota {
5993468b59eSEmilio G. Cota     size_t i;
6003468b59eSEmilio G. Cota 
6013468b59eSEmilio G. Cota     /* Use a single region if all we have is one vCPU thread */
6023468b59eSEmilio G. Cota     if (max_cpus == 1 || !qemu_tcg_mttcg_enabled()) {
6033468b59eSEmilio G. Cota         return 1;
6043468b59eSEmilio G. Cota     }
6053468b59eSEmilio G. Cota 
6063468b59eSEmilio G. Cota     /* Try to have more regions than max_cpus, with each region being >= 2 MB */
6073468b59eSEmilio G. Cota     for (i = 8; i > 0; i--) {
6083468b59eSEmilio G. Cota         size_t regions_per_thread = i;
6093468b59eSEmilio G. Cota         size_t region_size;
6103468b59eSEmilio G. Cota 
6113468b59eSEmilio G. Cota         region_size = tcg_init_ctx.code_gen_buffer_size;
6123468b59eSEmilio G. Cota         region_size /= max_cpus * regions_per_thread;
6133468b59eSEmilio G. Cota 
6143468b59eSEmilio G. Cota         if (region_size >= 2 * 1024u * 1024) {
6153468b59eSEmilio G. Cota             return max_cpus * regions_per_thread;
6163468b59eSEmilio G. Cota         }
6173468b59eSEmilio G. Cota     }
6183468b59eSEmilio G. Cota     /* If we can't, then just allocate one region per vCPU thread */
6193468b59eSEmilio G. Cota     return max_cpus;
6203468b59eSEmilio G. Cota }
6213468b59eSEmilio G. Cota #endif
6223468b59eSEmilio G. Cota 
623e8feb96fSEmilio G. Cota /*
624e8feb96fSEmilio G. Cota  * Initializes region partitioning.
625e8feb96fSEmilio G. Cota  *
626e8feb96fSEmilio G. Cota  * Called at init time from the parent thread (i.e. the one calling
627e8feb96fSEmilio G. Cota  * tcg_context_init), after the target's TCG globals have been set.
6283468b59eSEmilio G. Cota  *
6293468b59eSEmilio G. Cota  * Region partitioning works by splitting code_gen_buffer into separate regions,
6303468b59eSEmilio G. Cota  * and then assigning regions to TCG threads so that the threads can translate
6313468b59eSEmilio G. Cota  * code in parallel without synchronization.
6323468b59eSEmilio G. Cota  *
6333468b59eSEmilio G. Cota  * In softmmu the number of TCG threads is bounded by max_cpus, so we use at
6343468b59eSEmilio G. Cota  * least max_cpus regions in MTTCG. In !MTTCG we use a single region.
6353468b59eSEmilio G. Cota  * Note that the TCG options from the command-line (i.e. -accel accel=tcg,[...])
6363468b59eSEmilio G. Cota  * must have been parsed before calling this function, since it calls
6373468b59eSEmilio G. Cota  * qemu_tcg_mttcg_enabled().
6383468b59eSEmilio G. Cota  *
6393468b59eSEmilio G. Cota  * In user-mode we use a single region.  Having multiple regions in user-mode
6403468b59eSEmilio G. Cota  * is not supported, because the number of vCPU threads (recall that each thread
6413468b59eSEmilio G. Cota  * spawned by the guest corresponds to a vCPU thread) is only bounded by the
6423468b59eSEmilio G. Cota  * OS, and usually this number is huge (tens of thousands is not uncommon).
6433468b59eSEmilio G. Cota  * Thus, given this large bound on the number of vCPU threads and the fact
6443468b59eSEmilio G. Cota  * that code_gen_buffer is allocated at compile-time, we cannot guarantee
6453468b59eSEmilio G. Cota  * that the availability of at least one region per vCPU thread.
6463468b59eSEmilio G. Cota  *
6473468b59eSEmilio G. Cota  * However, this user-mode limitation is unlikely to be a significant problem
6483468b59eSEmilio G. Cota  * in practice. Multi-threaded guests share most if not all of their translated
6493468b59eSEmilio G. Cota  * code, which makes parallel code generation less appealing than in softmmu.
650e8feb96fSEmilio G. Cota  */
651e8feb96fSEmilio G. Cota void tcg_region_init(void)
652e8feb96fSEmilio G. Cota {
653e8feb96fSEmilio G. Cota     void *buf = tcg_init_ctx.code_gen_buffer;
654e8feb96fSEmilio G. Cota     void *aligned;
655e8feb96fSEmilio G. Cota     size_t size = tcg_init_ctx.code_gen_buffer_size;
656e8feb96fSEmilio G. Cota     size_t page_size = qemu_real_host_page_size;
657e8feb96fSEmilio G. Cota     size_t region_size;
658e8feb96fSEmilio G. Cota     size_t n_regions;
659e8feb96fSEmilio G. Cota     size_t i;
660e8feb96fSEmilio G. Cota 
6613468b59eSEmilio G. Cota     n_regions = tcg_n_regions();
662e8feb96fSEmilio G. Cota 
663e8feb96fSEmilio G. Cota     /* The first region will be 'aligned - buf' bytes larger than the others */
664e8feb96fSEmilio G. Cota     aligned = QEMU_ALIGN_PTR_UP(buf, page_size);
665e8feb96fSEmilio G. Cota     g_assert(aligned < tcg_init_ctx.code_gen_buffer + size);
666e8feb96fSEmilio G. Cota     /*
667e8feb96fSEmilio G. Cota      * Make region_size a multiple of page_size, using aligned as the start.
668e8feb96fSEmilio G. Cota      * As a result of this we might end up with a few extra pages at the end of
669e8feb96fSEmilio G. Cota      * the buffer; we will assign those to the last region.
670e8feb96fSEmilio G. Cota      */
671e8feb96fSEmilio G. Cota     region_size = (size - (aligned - buf)) / n_regions;
672e8feb96fSEmilio G. Cota     region_size = QEMU_ALIGN_DOWN(region_size, page_size);
673e8feb96fSEmilio G. Cota 
674e8feb96fSEmilio G. Cota     /* A region must have at least 2 pages; one code, one guard */
675e8feb96fSEmilio G. Cota     g_assert(region_size >= 2 * page_size);
676e8feb96fSEmilio G. Cota 
677e8feb96fSEmilio G. Cota     /* init the region struct */
678e8feb96fSEmilio G. Cota     qemu_mutex_init(&region.lock);
679e8feb96fSEmilio G. Cota     region.n = n_regions;
680e8feb96fSEmilio G. Cota     region.size = region_size - page_size;
681e8feb96fSEmilio G. Cota     region.stride = region_size;
682e8feb96fSEmilio G. Cota     region.start = buf;
683e8feb96fSEmilio G. Cota     region.start_aligned = aligned;
684e8feb96fSEmilio G. Cota     /* page-align the end, since its last page will be a guard page */
685e8feb96fSEmilio G. Cota     region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size);
686e8feb96fSEmilio G. Cota     /* account for that last guard page */
687e8feb96fSEmilio G. Cota     region.end -= page_size;
688e8feb96fSEmilio G. Cota 
689e8feb96fSEmilio G. Cota     /* set guard pages */
690e8feb96fSEmilio G. Cota     for (i = 0; i < region.n; i++) {
691e8feb96fSEmilio G. Cota         void *start, *end;
692e8feb96fSEmilio G. Cota         int rc;
693e8feb96fSEmilio G. Cota 
694e8feb96fSEmilio G. Cota         tcg_region_bounds(i, &start, &end);
695e8feb96fSEmilio G. Cota         rc = qemu_mprotect_none(end, page_size);
696e8feb96fSEmilio G. Cota         g_assert(!rc);
697e8feb96fSEmilio G. Cota     }
698e8feb96fSEmilio G. Cota 
699be2cdc5eSEmilio G. Cota     tcg_region_trees_init();
700be2cdc5eSEmilio G. Cota 
7013468b59eSEmilio G. Cota     /* In user-mode we support only one ctx, so do the initial allocation now */
7023468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
703e8feb96fSEmilio G. Cota     {
704e8feb96fSEmilio G. Cota         bool err = tcg_region_initial_alloc__locked(tcg_ctx);
705e8feb96fSEmilio G. Cota 
706e8feb96fSEmilio G. Cota         g_assert(!err);
707e8feb96fSEmilio G. Cota     }
7083468b59eSEmilio G. Cota #endif
709e8feb96fSEmilio G. Cota }
710e8feb96fSEmilio G. Cota 
711e8feb96fSEmilio G. Cota /*
7123468b59eSEmilio G. Cota  * All TCG threads except the parent (i.e. the one that called tcg_context_init
7133468b59eSEmilio G. Cota  * and registered the target's TCG globals) must register with this function
7143468b59eSEmilio G. Cota  * before initiating translation.
7153468b59eSEmilio G. Cota  *
7163468b59eSEmilio G. Cota  * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation
7173468b59eSEmilio G. Cota  * of tcg_region_init() for the reasoning behind this.
7183468b59eSEmilio G. Cota  *
7193468b59eSEmilio G. Cota  * In softmmu each caller registers its context in tcg_ctxs[]. Note that in
7203468b59eSEmilio G. Cota  * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context
7213468b59eSEmilio G. Cota  * is not used anymore for translation once this function is called.
7223468b59eSEmilio G. Cota  *
7233468b59eSEmilio G. Cota  * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates
7243468b59eSEmilio G. Cota  * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode.
7253468b59eSEmilio G. Cota  */
7263468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
7273468b59eSEmilio G. Cota void tcg_register_thread(void)
7283468b59eSEmilio G. Cota {
7293468b59eSEmilio G. Cota     tcg_ctx = &tcg_init_ctx;
7303468b59eSEmilio G. Cota }
7313468b59eSEmilio G. Cota #else
7323468b59eSEmilio G. Cota void tcg_register_thread(void)
7333468b59eSEmilio G. Cota {
7343468b59eSEmilio G. Cota     TCGContext *s = g_malloc(sizeof(*s));
7353468b59eSEmilio G. Cota     unsigned int i, n;
7363468b59eSEmilio G. Cota     bool err;
7373468b59eSEmilio G. Cota 
7383468b59eSEmilio G. Cota     *s = tcg_init_ctx;
7393468b59eSEmilio G. Cota 
7403468b59eSEmilio G. Cota     /* Relink mem_base.  */
7413468b59eSEmilio G. Cota     for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) {
7423468b59eSEmilio G. Cota         if (tcg_init_ctx.temps[i].mem_base) {
7433468b59eSEmilio G. Cota             ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps;
7443468b59eSEmilio G. Cota             tcg_debug_assert(b >= 0 && b < n);
7453468b59eSEmilio G. Cota             s->temps[i].mem_base = &s->temps[b];
7463468b59eSEmilio G. Cota         }
7473468b59eSEmilio G. Cota     }
7483468b59eSEmilio G. Cota 
7493468b59eSEmilio G. Cota     /* Claim an entry in tcg_ctxs */
7503468b59eSEmilio G. Cota     n = atomic_fetch_inc(&n_tcg_ctxs);
7513468b59eSEmilio G. Cota     g_assert(n < max_cpus);
7523468b59eSEmilio G. Cota     atomic_set(&tcg_ctxs[n], s);
7533468b59eSEmilio G. Cota 
7543468b59eSEmilio G. Cota     tcg_ctx = s;
7553468b59eSEmilio G. Cota     qemu_mutex_lock(&region.lock);
7563468b59eSEmilio G. Cota     err = tcg_region_initial_alloc__locked(tcg_ctx);
7573468b59eSEmilio G. Cota     g_assert(!err);
7583468b59eSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
7593468b59eSEmilio G. Cota }
7603468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */
7613468b59eSEmilio G. Cota 
7623468b59eSEmilio G. Cota /*
763e8feb96fSEmilio G. Cota  * Returns the size (in bytes) of all translated code (i.e. from all regions)
764e8feb96fSEmilio G. Cota  * currently in the cache.
765e8feb96fSEmilio G. Cota  * See also: tcg_code_capacity()
766e8feb96fSEmilio G. Cota  * Do not confuse with tcg_current_code_size(); that one applies to a single
767e8feb96fSEmilio G. Cota  * TCG context.
768e8feb96fSEmilio G. Cota  */
769e8feb96fSEmilio G. Cota size_t tcg_code_size(void)
770e8feb96fSEmilio G. Cota {
7713468b59eSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
772e8feb96fSEmilio G. Cota     unsigned int i;
773e8feb96fSEmilio G. Cota     size_t total;
774e8feb96fSEmilio G. Cota 
775e8feb96fSEmilio G. Cota     qemu_mutex_lock(&region.lock);
776e8feb96fSEmilio G. Cota     total = region.agg_size_full;
7773468b59eSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
7783468b59eSEmilio G. Cota         const TCGContext *s = atomic_read(&tcg_ctxs[i]);
779e8feb96fSEmilio G. Cota         size_t size;
780e8feb96fSEmilio G. Cota 
781e8feb96fSEmilio G. Cota         size = atomic_read(&s->code_gen_ptr) - s->code_gen_buffer;
782e8feb96fSEmilio G. Cota         g_assert(size <= s->code_gen_buffer_size);
783e8feb96fSEmilio G. Cota         total += size;
784e8feb96fSEmilio G. Cota     }
785e8feb96fSEmilio G. Cota     qemu_mutex_unlock(&region.lock);
786e8feb96fSEmilio G. Cota     return total;
787e8feb96fSEmilio G. Cota }
788e8feb96fSEmilio G. Cota 
789e8feb96fSEmilio G. Cota /*
790e8feb96fSEmilio G. Cota  * Returns the code capacity (in bytes) of the entire cache, i.e. including all
791e8feb96fSEmilio G. Cota  * regions.
792e8feb96fSEmilio G. Cota  * See also: tcg_code_size()
793e8feb96fSEmilio G. Cota  */
794e8feb96fSEmilio G. Cota size_t tcg_code_capacity(void)
795e8feb96fSEmilio G. Cota {
796e8feb96fSEmilio G. Cota     size_t guard_size, capacity;
797e8feb96fSEmilio G. Cota 
798e8feb96fSEmilio G. Cota     /* no need for synchronization; these variables are set at init time */
799e8feb96fSEmilio G. Cota     guard_size = region.stride - region.size;
800e8feb96fSEmilio G. Cota     capacity = region.end + guard_size - region.start;
801e8feb96fSEmilio G. Cota     capacity -= region.n * (guard_size + TCG_HIGHWATER);
802e8feb96fSEmilio G. Cota     return capacity;
803e8feb96fSEmilio G. Cota }
804e8feb96fSEmilio G. Cota 
805128ed227SEmilio G. Cota size_t tcg_tb_phys_invalidate_count(void)
806128ed227SEmilio G. Cota {
807128ed227SEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
808128ed227SEmilio G. Cota     unsigned int i;
809128ed227SEmilio G. Cota     size_t total = 0;
810128ed227SEmilio G. Cota 
811128ed227SEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
812128ed227SEmilio G. Cota         const TCGContext *s = atomic_read(&tcg_ctxs[i]);
813128ed227SEmilio G. Cota 
814128ed227SEmilio G. Cota         total += atomic_read(&s->tb_phys_invalidate_count);
815128ed227SEmilio G. Cota     }
816128ed227SEmilio G. Cota     return total;
817128ed227SEmilio G. Cota }
818128ed227SEmilio G. Cota 
819c896fe29Sbellard /* pool based memory allocation */
820c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size)
821c896fe29Sbellard {
822c896fe29Sbellard     TCGPool *p;
823c896fe29Sbellard     int pool_size;
824c896fe29Sbellard 
825c896fe29Sbellard     if (size > TCG_POOL_CHUNK_SIZE) {
826c896fe29Sbellard         /* big malloc: insert a new pool (XXX: could optimize) */
8277267c094SAnthony Liguori         p = g_malloc(sizeof(TCGPool) + size);
828c896fe29Sbellard         p->size = size;
8294055299eSKirill Batuzov         p->next = s->pool_first_large;
8304055299eSKirill Batuzov         s->pool_first_large = p;
8314055299eSKirill Batuzov         return p->data;
832c896fe29Sbellard     } else {
833c896fe29Sbellard         p = s->pool_current;
834c896fe29Sbellard         if (!p) {
835c896fe29Sbellard             p = s->pool_first;
836c896fe29Sbellard             if (!p)
837c896fe29Sbellard                 goto new_pool;
838c896fe29Sbellard         } else {
839c896fe29Sbellard             if (!p->next) {
840c896fe29Sbellard             new_pool:
841c896fe29Sbellard                 pool_size = TCG_POOL_CHUNK_SIZE;
8427267c094SAnthony Liguori                 p = g_malloc(sizeof(TCGPool) + pool_size);
843c896fe29Sbellard                 p->size = pool_size;
844c896fe29Sbellard                 p->next = NULL;
845c896fe29Sbellard                 if (s->pool_current)
846c896fe29Sbellard                     s->pool_current->next = p;
847c896fe29Sbellard                 else
848c896fe29Sbellard                     s->pool_first = p;
849c896fe29Sbellard             } else {
850c896fe29Sbellard                 p = p->next;
851c896fe29Sbellard             }
852c896fe29Sbellard         }
853c896fe29Sbellard     }
854c896fe29Sbellard     s->pool_current = p;
855c896fe29Sbellard     s->pool_cur = p->data + size;
856c896fe29Sbellard     s->pool_end = p->data + p->size;
857c896fe29Sbellard     return p->data;
858c896fe29Sbellard }
859c896fe29Sbellard 
860c896fe29Sbellard void tcg_pool_reset(TCGContext *s)
861c896fe29Sbellard {
8624055299eSKirill Batuzov     TCGPool *p, *t;
8634055299eSKirill Batuzov     for (p = s->pool_first_large; p; p = t) {
8644055299eSKirill Batuzov         t = p->next;
8654055299eSKirill Batuzov         g_free(p);
8664055299eSKirill Batuzov     }
8674055299eSKirill Batuzov     s->pool_first_large = NULL;
868c896fe29Sbellard     s->pool_cur = s->pool_end = NULL;
869c896fe29Sbellard     s->pool_current = NULL;
870c896fe29Sbellard }
871c896fe29Sbellard 
/* One entry of the helper table built from exec/helper-tcg.h. */
typedef struct TCGHelperInfo {
    void *func;             /* helper address; used as the helper_table key */
    const char *name;       /* helper name string */
    unsigned int flags;     /* NOTE(review): encoding not visible here */
    unsigned int sizemask;  /* NOTE(review): encoding not visible here */
} TCGHelperInfo;
878100b5e01SRichard Henderson 
8792ef6175aSRichard Henderson #include "exec/helper-proto.h"
8802ef6175aSRichard Henderson 
881100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = {
8822ef6175aSRichard Henderson #include "exec/helper-tcg.h"
883100b5e01SRichard Henderson };
884619205fdSEmilio G. Cota static GHashTable *helper_table;
885100b5e01SRichard Henderson 
88691478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)];
887f69d277eSRichard Henderson static void process_op_defs(TCGContext *s);
8881c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type,
8891c2adb95SRichard Henderson                                             TCGReg reg, const char *name);
89091478cefSRichard Henderson 
891c896fe29Sbellard void tcg_context_init(TCGContext *s)
892c896fe29Sbellard {
893100b5e01SRichard Henderson     int op, total_args, n, i;
894c896fe29Sbellard     TCGOpDef *def;
895c896fe29Sbellard     TCGArgConstraint *args_ct;
896c896fe29Sbellard     int *sorted_args;
8971c2adb95SRichard Henderson     TCGTemp *ts;
898c896fe29Sbellard 
899c896fe29Sbellard     memset(s, 0, sizeof(*s));
900c896fe29Sbellard     s->nb_globals = 0;
901c896fe29Sbellard 
902c896fe29Sbellard     /* Count total number of arguments and allocate the corresponding
903c896fe29Sbellard        space */
904c896fe29Sbellard     total_args = 0;
905c896fe29Sbellard     for(op = 0; op < NB_OPS; op++) {
906c896fe29Sbellard         def = &tcg_op_defs[op];
907c896fe29Sbellard         n = def->nb_iargs + def->nb_oargs;
908c896fe29Sbellard         total_args += n;
909c896fe29Sbellard     }
910c896fe29Sbellard 
9117267c094SAnthony Liguori     args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args);
9127267c094SAnthony Liguori     sorted_args = g_malloc(sizeof(int) * total_args);
913c896fe29Sbellard 
914c896fe29Sbellard     for(op = 0; op < NB_OPS; op++) {
915c896fe29Sbellard         def = &tcg_op_defs[op];
916c896fe29Sbellard         def->args_ct = args_ct;
917c896fe29Sbellard         def->sorted_args = sorted_args;
918c896fe29Sbellard         n = def->nb_iargs + def->nb_oargs;
919c896fe29Sbellard         sorted_args += n;
920c896fe29Sbellard         args_ct += n;
921c896fe29Sbellard     }
922c896fe29Sbellard 
9235cd8f621SRichard Henderson     /* Register helpers.  */
92484fd9dd3SRichard Henderson     /* Use g_direct_hash/equal for direct pointer comparisons on func.  */
925619205fdSEmilio G. Cota     helper_table = g_hash_table_new(NULL, NULL);
92684fd9dd3SRichard Henderson 
927100b5e01SRichard Henderson     for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) {
92884fd9dd3SRichard Henderson         g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func,
92972866e82SRichard Henderson                             (gpointer)&all_helpers[i]);
930100b5e01SRichard Henderson     }
9315cd8f621SRichard Henderson 
932c896fe29Sbellard     tcg_target_init(s);
933f69d277eSRichard Henderson     process_op_defs(s);
93491478cefSRichard Henderson 
93591478cefSRichard Henderson     /* Reverse the order of the saved registers, assuming they're all at
93691478cefSRichard Henderson        the start of tcg_target_reg_alloc_order.  */
93791478cefSRichard Henderson     for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) {
93891478cefSRichard Henderson         int r = tcg_target_reg_alloc_order[n];
93991478cefSRichard Henderson         if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) {
94091478cefSRichard Henderson             break;
94191478cefSRichard Henderson         }
94291478cefSRichard Henderson     }
94391478cefSRichard Henderson     for (i = 0; i < n; ++i) {
94491478cefSRichard Henderson         indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i];
94591478cefSRichard Henderson     }
94691478cefSRichard Henderson     for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) {
94791478cefSRichard Henderson         indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i];
94891478cefSRichard Henderson     }
949b1311c4aSEmilio G. Cota 
950b1311c4aSEmilio G. Cota     tcg_ctx = s;
9513468b59eSEmilio G. Cota     /*
9523468b59eSEmilio G. Cota      * In user-mode we simply share the init context among threads, since we
9533468b59eSEmilio G. Cota      * use a single region. See the documentation tcg_region_init() for the
9543468b59eSEmilio G. Cota      * reasoning behind this.
9553468b59eSEmilio G. Cota      * In softmmu we will have at most max_cpus TCG threads.
9563468b59eSEmilio G. Cota      */
9573468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY
958df2cce29SEmilio G. Cota     tcg_ctxs = &tcg_ctx;
959df2cce29SEmilio G. Cota     n_tcg_ctxs = 1;
9603468b59eSEmilio G. Cota #else
9613468b59eSEmilio G. Cota     tcg_ctxs = g_new(TCGContext *, max_cpus);
9623468b59eSEmilio G. Cota #endif
9631c2adb95SRichard Henderson 
9641c2adb95SRichard Henderson     tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0));
9651c2adb95SRichard Henderson     ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env");
9661c2adb95SRichard Henderson     cpu_env = temp_tcgv_ptr(ts);
9679002ec79SRichard Henderson }
968b03cce8eSbellard 
9696e3b2bfdSEmilio G. Cota /*
9706e3b2bfdSEmilio G. Cota  * Allocate TBs right before their corresponding translated code, making
9716e3b2bfdSEmilio G. Cota  * sure that TBs and code are on different cache lines.
9726e3b2bfdSEmilio G. Cota  */
9736e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s)
9746e3b2bfdSEmilio G. Cota {
9756e3b2bfdSEmilio G. Cota     uintptr_t align = qemu_icache_linesize;
9766e3b2bfdSEmilio G. Cota     TranslationBlock *tb;
9776e3b2bfdSEmilio G. Cota     void *next;
9786e3b2bfdSEmilio G. Cota 
979e8feb96fSEmilio G. Cota  retry:
9806e3b2bfdSEmilio G. Cota     tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align);
9816e3b2bfdSEmilio G. Cota     next = (void *)ROUND_UP((uintptr_t)(tb + 1), align);
9826e3b2bfdSEmilio G. Cota 
9836e3b2bfdSEmilio G. Cota     if (unlikely(next > s->code_gen_highwater)) {
984e8feb96fSEmilio G. Cota         if (tcg_region_alloc(s)) {
9856e3b2bfdSEmilio G. Cota             return NULL;
9866e3b2bfdSEmilio G. Cota         }
987e8feb96fSEmilio G. Cota         goto retry;
988e8feb96fSEmilio G. Cota     }
989e8feb96fSEmilio G. Cota     atomic_set(&s->code_gen_ptr, next);
99057a26946SRichard Henderson     s->data_gen_ptr = NULL;
9916e3b2bfdSEmilio G. Cota     return tb;
9926e3b2bfdSEmilio G. Cota }
9936e3b2bfdSEmilio G. Cota 
9949002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s)
9959002ec79SRichard Henderson {
9968163b749SRichard Henderson     size_t prologue_size, total_size;
9978163b749SRichard Henderson     void *buf0, *buf1;
9988163b749SRichard Henderson 
9998163b749SRichard Henderson     /* Put the prologue at the beginning of code_gen_buffer.  */
10008163b749SRichard Henderson     buf0 = s->code_gen_buffer;
10015b38ee31SRichard Henderson     total_size = s->code_gen_buffer_size;
10028163b749SRichard Henderson     s->code_ptr = buf0;
10038163b749SRichard Henderson     s->code_buf = buf0;
10045b38ee31SRichard Henderson     s->data_gen_ptr = NULL;
10058163b749SRichard Henderson     s->code_gen_prologue = buf0;
10068163b749SRichard Henderson 
10075b38ee31SRichard Henderson     /* Compute a high-water mark, at which we voluntarily flush the buffer
10085b38ee31SRichard Henderson        and start over.  The size here is arbitrary, significantly larger
10095b38ee31SRichard Henderson        than we expect the code generation for any one opcode to require.  */
10105b38ee31SRichard Henderson     s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER);
10115b38ee31SRichard Henderson 
10125b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
10135b38ee31SRichard Henderson     s->pool_labels = NULL;
10145b38ee31SRichard Henderson #endif
10155b38ee31SRichard Henderson 
10168163b749SRichard Henderson     /* Generate the prologue.  */
1017b03cce8eSbellard     tcg_target_qemu_prologue(s);
10185b38ee31SRichard Henderson 
10195b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
10205b38ee31SRichard Henderson     /* Allow the prologue to put e.g. guest_base into a pool entry.  */
10215b38ee31SRichard Henderson     {
10225b38ee31SRichard Henderson         bool ok = tcg_out_pool_finalize(s);
10235b38ee31SRichard Henderson         tcg_debug_assert(ok);
10245b38ee31SRichard Henderson     }
10255b38ee31SRichard Henderson #endif
10265b38ee31SRichard Henderson 
10278163b749SRichard Henderson     buf1 = s->code_ptr;
10288163b749SRichard Henderson     flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1);
10298163b749SRichard Henderson 
10308163b749SRichard Henderson     /* Deduct the prologue from the buffer.  */
10318163b749SRichard Henderson     prologue_size = tcg_current_code_size(s);
10328163b749SRichard Henderson     s->code_gen_ptr = buf1;
10338163b749SRichard Henderson     s->code_gen_buffer = buf1;
10348163b749SRichard Henderson     s->code_buf = buf1;
10355b38ee31SRichard Henderson     total_size -= prologue_size;
10368163b749SRichard Henderson     s->code_gen_buffer_size = total_size;
10378163b749SRichard Henderson 
10388163b749SRichard Henderson     tcg_register_jit(s->code_gen_buffer, total_size);
1039d6b64b2bSRichard Henderson 
1040d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS
1041d6b64b2bSRichard Henderson     if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) {
10421ee73216SRichard Henderson         qemu_log_lock();
10438163b749SRichard Henderson         qemu_log("PROLOGUE: [size=%zu]\n", prologue_size);
10445b38ee31SRichard Henderson         if (s->data_gen_ptr) {
10455b38ee31SRichard Henderson             size_t code_size = s->data_gen_ptr - buf0;
10465b38ee31SRichard Henderson             size_t data_size = prologue_size - code_size;
10475b38ee31SRichard Henderson             size_t i;
10485b38ee31SRichard Henderson 
10495b38ee31SRichard Henderson             log_disas(buf0, code_size);
10505b38ee31SRichard Henderson 
10515b38ee31SRichard Henderson             for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) {
10525b38ee31SRichard Henderson                 if (sizeof(tcg_target_ulong) == 8) {
10535b38ee31SRichard Henderson                     qemu_log("0x%08" PRIxPTR ":  .quad  0x%016" PRIx64 "\n",
10545b38ee31SRichard Henderson                              (uintptr_t)s->data_gen_ptr + i,
10555b38ee31SRichard Henderson                              *(uint64_t *)(s->data_gen_ptr + i));
10565b38ee31SRichard Henderson                 } else {
10575b38ee31SRichard Henderson                     qemu_log("0x%08" PRIxPTR ":  .long  0x%08x\n",
10585b38ee31SRichard Henderson                              (uintptr_t)s->data_gen_ptr + i,
10595b38ee31SRichard Henderson                              *(uint32_t *)(s->data_gen_ptr + i));
10605b38ee31SRichard Henderson                 }
10615b38ee31SRichard Henderson             }
10625b38ee31SRichard Henderson         } else {
10638163b749SRichard Henderson             log_disas(buf0, prologue_size);
10645b38ee31SRichard Henderson         }
1065d6b64b2bSRichard Henderson         qemu_log("\n");
1066d6b64b2bSRichard Henderson         qemu_log_flush();
10671ee73216SRichard Henderson         qemu_log_unlock();
1068d6b64b2bSRichard Henderson     }
1069d6b64b2bSRichard Henderson #endif
1070cedbcb01SEmilio G. Cota 
1071cedbcb01SEmilio G. Cota     /* Assert that goto_ptr is implemented completely.  */
1072cedbcb01SEmilio G. Cota     if (TCG_TARGET_HAS_goto_ptr) {
1073cedbcb01SEmilio G. Cota         tcg_debug_assert(s->code_gen_epilogue != NULL);
1074cedbcb01SEmilio G. Cota     }
1075c896fe29Sbellard }
1076c896fe29Sbellard 
1077c896fe29Sbellard void tcg_func_start(TCGContext *s)
1078c896fe29Sbellard {
1079c896fe29Sbellard     tcg_pool_reset(s);
1080c896fe29Sbellard     s->nb_temps = s->nb_globals;
10810ec9eabcSRichard Henderson 
10820ec9eabcSRichard Henderson     /* No temps have been previously allocated for size or locality.  */
10830ec9eabcSRichard Henderson     memset(s->free_temps, 0, sizeof(s->free_temps));
10840ec9eabcSRichard Henderson 
1085abebf925SRichard Henderson     s->nb_ops = 0;
1086c896fe29Sbellard     s->nb_labels = 0;
1087c896fe29Sbellard     s->current_frame_offset = s->frame_start;
1088c896fe29Sbellard 
10890a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG
10900a209d4bSRichard Henderson     s->goto_tb_issue_mask = 0;
10910a209d4bSRichard Henderson #endif
10920a209d4bSRichard Henderson 
109315fa08f8SRichard Henderson     QTAILQ_INIT(&s->ops);
109415fa08f8SRichard Henderson     QTAILQ_INIT(&s->free_ops);
1095c896fe29Sbellard }
1096c896fe29Sbellard 
10977ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s)
10987ca4b752SRichard Henderson {
10997ca4b752SRichard Henderson     int n = s->nb_temps++;
11007ca4b752SRichard Henderson     tcg_debug_assert(n < TCG_MAX_TEMPS);
11017ca4b752SRichard Henderson     return memset(&s->temps[n], 0, sizeof(TCGTemp));
11027ca4b752SRichard Henderson }
11037ca4b752SRichard Henderson 
11047ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s)
11057ca4b752SRichard Henderson {
1106fa477d25SRichard Henderson     TCGTemp *ts;
1107fa477d25SRichard Henderson 
11087ca4b752SRichard Henderson     tcg_debug_assert(s->nb_globals == s->nb_temps);
11097ca4b752SRichard Henderson     s->nb_globals++;
1110fa477d25SRichard Henderson     ts = tcg_temp_alloc(s);
1111fa477d25SRichard Henderson     ts->temp_global = 1;
1112fa477d25SRichard Henderson 
1113fa477d25SRichard Henderson     return ts;
1114c896fe29Sbellard }
1115c896fe29Sbellard 
1116085272b3SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type,
1117b6638662SRichard Henderson                                             TCGReg reg, const char *name)
1118c896fe29Sbellard {
1119c896fe29Sbellard     TCGTemp *ts;
1120c896fe29Sbellard 
1121b3a62939SRichard Henderson     if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) {
1122c896fe29Sbellard         tcg_abort();
1123b3a62939SRichard Henderson     }
11247ca4b752SRichard Henderson 
11257ca4b752SRichard Henderson     ts = tcg_global_alloc(s);
1126c896fe29Sbellard     ts->base_type = type;
1127c896fe29Sbellard     ts->type = type;
1128c896fe29Sbellard     ts->fixed_reg = 1;
1129c896fe29Sbellard     ts->reg = reg;
1130c896fe29Sbellard     ts->name = name;
1131c896fe29Sbellard     tcg_regset_set_reg(s->reserved_regs, reg);
11327ca4b752SRichard Henderson 
1133085272b3SRichard Henderson     return ts;
1134a7812ae4Spbrook }
1135a7812ae4Spbrook 
1136b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size)
1137a7812ae4Spbrook {
1138b3a62939SRichard Henderson     s->frame_start = start;
1139b3a62939SRichard Henderson     s->frame_end = start + size;
1140085272b3SRichard Henderson     s->frame_temp
1141085272b3SRichard Henderson         = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame");
1142b3a62939SRichard Henderson }
1143a7812ae4Spbrook 
1144085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base,
1145e1ccc054SRichard Henderson                                      intptr_t offset, const char *name)
1146c896fe29Sbellard {
1147b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
1148dc41aa7dSRichard Henderson     TCGTemp *base_ts = tcgv_ptr_temp(base);
11497ca4b752SRichard Henderson     TCGTemp *ts = tcg_global_alloc(s);
1150b3915dbbSRichard Henderson     int indirect_reg = 0, bigendian = 0;
11517ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN
11527ca4b752SRichard Henderson     bigendian = 1;
11537ca4b752SRichard Henderson #endif
1154c896fe29Sbellard 
1155b3915dbbSRichard Henderson     if (!base_ts->fixed_reg) {
11565a18407fSRichard Henderson         /* We do not support double-indirect registers.  */
11575a18407fSRichard Henderson         tcg_debug_assert(!base_ts->indirect_reg);
1158b3915dbbSRichard Henderson         base_ts->indirect_base = 1;
11595a18407fSRichard Henderson         s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64
11605a18407fSRichard Henderson                             ? 2 : 1);
11615a18407fSRichard Henderson         indirect_reg = 1;
1162b3915dbbSRichard Henderson     }
1163b3915dbbSRichard Henderson 
11647ca4b752SRichard Henderson     if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) {
11657ca4b752SRichard Henderson         TCGTemp *ts2 = tcg_global_alloc(s);
1166c896fe29Sbellard         char buf[64];
11677ca4b752SRichard Henderson 
11687ca4b752SRichard Henderson         ts->base_type = TCG_TYPE_I64;
1169c896fe29Sbellard         ts->type = TCG_TYPE_I32;
1170b3915dbbSRichard Henderson         ts->indirect_reg = indirect_reg;
1171c896fe29Sbellard         ts->mem_allocated = 1;
1172b3a62939SRichard Henderson         ts->mem_base = base_ts;
11737ca4b752SRichard Henderson         ts->mem_offset = offset + bigendian * 4;
1174c896fe29Sbellard         pstrcpy(buf, sizeof(buf), name);
1175c896fe29Sbellard         pstrcat(buf, sizeof(buf), "_0");
1176c896fe29Sbellard         ts->name = strdup(buf);
1177c896fe29Sbellard 
11787ca4b752SRichard Henderson         tcg_debug_assert(ts2 == ts + 1);
11797ca4b752SRichard Henderson         ts2->base_type = TCG_TYPE_I64;
11807ca4b752SRichard Henderson         ts2->type = TCG_TYPE_I32;
1181b3915dbbSRichard Henderson         ts2->indirect_reg = indirect_reg;
11827ca4b752SRichard Henderson         ts2->mem_allocated = 1;
11837ca4b752SRichard Henderson         ts2->mem_base = base_ts;
11847ca4b752SRichard Henderson         ts2->mem_offset = offset + (1 - bigendian) * 4;
1185c896fe29Sbellard         pstrcpy(buf, sizeof(buf), name);
1186c896fe29Sbellard         pstrcat(buf, sizeof(buf), "_1");
1187120c1084SRichard Henderson         ts2->name = strdup(buf);
11887ca4b752SRichard Henderson     } else {
1189c896fe29Sbellard         ts->base_type = type;
1190c896fe29Sbellard         ts->type = type;
1191b3915dbbSRichard Henderson         ts->indirect_reg = indirect_reg;
1192c896fe29Sbellard         ts->mem_allocated = 1;
1193b3a62939SRichard Henderson         ts->mem_base = base_ts;
1194c896fe29Sbellard         ts->mem_offset = offset;
1195c896fe29Sbellard         ts->name = name;
1196c896fe29Sbellard     }
1197085272b3SRichard Henderson     return ts;
1198c896fe29Sbellard }
1199c896fe29Sbellard 
12005bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local)
1201c896fe29Sbellard {
1202b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
1203c896fe29Sbellard     TCGTemp *ts;
1204641d5fbeSbellard     int idx, k;
1205c896fe29Sbellard 
12060ec9eabcSRichard Henderson     k = type + (temp_local ? TCG_TYPE_COUNT : 0);
12070ec9eabcSRichard Henderson     idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS);
12080ec9eabcSRichard Henderson     if (idx < TCG_MAX_TEMPS) {
12090ec9eabcSRichard Henderson         /* There is already an available temp with the right type.  */
12100ec9eabcSRichard Henderson         clear_bit(idx, s->free_temps[k].l);
12110ec9eabcSRichard Henderson 
1212e8996ee0Sbellard         ts = &s->temps[idx];
1213e8996ee0Sbellard         ts->temp_allocated = 1;
12147ca4b752SRichard Henderson         tcg_debug_assert(ts->base_type == type);
12157ca4b752SRichard Henderson         tcg_debug_assert(ts->temp_local == temp_local);
1216e8996ee0Sbellard     } else {
12177ca4b752SRichard Henderson         ts = tcg_temp_alloc(s);
12187ca4b752SRichard Henderson         if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) {
12197ca4b752SRichard Henderson             TCGTemp *ts2 = tcg_temp_alloc(s);
12207ca4b752SRichard Henderson 
1221c896fe29Sbellard             ts->base_type = type;
1222c896fe29Sbellard             ts->type = TCG_TYPE_I32;
1223e8996ee0Sbellard             ts->temp_allocated = 1;
1224641d5fbeSbellard             ts->temp_local = temp_local;
12257ca4b752SRichard Henderson 
12267ca4b752SRichard Henderson             tcg_debug_assert(ts2 == ts + 1);
12277ca4b752SRichard Henderson             ts2->base_type = TCG_TYPE_I64;
12287ca4b752SRichard Henderson             ts2->type = TCG_TYPE_I32;
12297ca4b752SRichard Henderson             ts2->temp_allocated = 1;
12307ca4b752SRichard Henderson             ts2->temp_local = temp_local;
12317ca4b752SRichard Henderson         } else {
1232c896fe29Sbellard             ts->base_type = type;
1233c896fe29Sbellard             ts->type = type;
1234e8996ee0Sbellard             ts->temp_allocated = 1;
1235641d5fbeSbellard             ts->temp_local = temp_local;
1236c896fe29Sbellard         }
1237e8996ee0Sbellard     }
123827bfd83cSPeter Maydell 
123927bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG)
124027bfd83cSPeter Maydell     s->temps_in_use++;
124127bfd83cSPeter Maydell #endif
1242085272b3SRichard Henderson     return ts;
1243c896fe29Sbellard }
1244c896fe29Sbellard 
1245d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type)
1246d2fd745fSRichard Henderson {
1247d2fd745fSRichard Henderson     TCGTemp *t;
1248d2fd745fSRichard Henderson 
1249d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG
1250d2fd745fSRichard Henderson     switch (type) {
1251d2fd745fSRichard Henderson     case TCG_TYPE_V64:
1252d2fd745fSRichard Henderson         assert(TCG_TARGET_HAS_v64);
1253d2fd745fSRichard Henderson         break;
1254d2fd745fSRichard Henderson     case TCG_TYPE_V128:
1255d2fd745fSRichard Henderson         assert(TCG_TARGET_HAS_v128);
1256d2fd745fSRichard Henderson         break;
1257d2fd745fSRichard Henderson     case TCG_TYPE_V256:
1258d2fd745fSRichard Henderson         assert(TCG_TARGET_HAS_v256);
1259d2fd745fSRichard Henderson         break;
1260d2fd745fSRichard Henderson     default:
1261d2fd745fSRichard Henderson         g_assert_not_reached();
1262d2fd745fSRichard Henderson     }
1263d2fd745fSRichard Henderson #endif
1264d2fd745fSRichard Henderson 
1265d2fd745fSRichard Henderson     t = tcg_temp_new_internal(type, 0);
1266d2fd745fSRichard Henderson     return temp_tcgv_vec(t);
1267d2fd745fSRichard Henderson }
1268d2fd745fSRichard Henderson 
1269d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp.  */
1270d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match)
1271d2fd745fSRichard Henderson {
1272d2fd745fSRichard Henderson     TCGTemp *t = tcgv_vec_temp(match);
1273d2fd745fSRichard Henderson 
1274d2fd745fSRichard Henderson     tcg_debug_assert(t->temp_allocated != 0);
1275d2fd745fSRichard Henderson 
1276d2fd745fSRichard Henderson     t = tcg_temp_new_internal(t->base_type, 0);
1277d2fd745fSRichard Henderson     return temp_tcgv_vec(t);
1278d2fd745fSRichard Henderson }
1279d2fd745fSRichard Henderson 
12805bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts)
1281c896fe29Sbellard {
1282b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
1283085272b3SRichard Henderson     int k, idx;
1284c896fe29Sbellard 
128527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG)
128627bfd83cSPeter Maydell     s->temps_in_use--;
128727bfd83cSPeter Maydell     if (s->temps_in_use < 0) {
128827bfd83cSPeter Maydell         fprintf(stderr, "More temporaries freed than allocated!\n");
128927bfd83cSPeter Maydell     }
129027bfd83cSPeter Maydell #endif
129127bfd83cSPeter Maydell 
1292085272b3SRichard Henderson     tcg_debug_assert(ts->temp_global == 0);
1293eabb7b91SAurelien Jarno     tcg_debug_assert(ts->temp_allocated != 0);
1294e8996ee0Sbellard     ts->temp_allocated = 0;
12950ec9eabcSRichard Henderson 
1296085272b3SRichard Henderson     idx = temp_idx(ts);
129718d13fa2SAlexander Graf     k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0);
12980ec9eabcSRichard Henderson     set_bit(idx, s->free_temps[k].l);
1299e8996ee0Sbellard }
1300e8996ee0Sbellard 
1301a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val)
1302a7812ae4Spbrook {
1303a7812ae4Spbrook     TCGv_i32 t0;
1304a7812ae4Spbrook     t0 = tcg_temp_new_i32();
1305e8996ee0Sbellard     tcg_gen_movi_i32(t0, val);
1306e8996ee0Sbellard     return t0;
1307c896fe29Sbellard }
1308c896fe29Sbellard 
1309a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val)
1310c896fe29Sbellard {
1311a7812ae4Spbrook     TCGv_i64 t0;
1312a7812ae4Spbrook     t0 = tcg_temp_new_i64();
1313e8996ee0Sbellard     tcg_gen_movi_i64(t0, val);
1314e8996ee0Sbellard     return t0;
1315c896fe29Sbellard }
1316c896fe29Sbellard 
1317a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val)
1318bdffd4a9Saurel32 {
1319a7812ae4Spbrook     TCGv_i32 t0;
1320a7812ae4Spbrook     t0 = tcg_temp_local_new_i32();
1321bdffd4a9Saurel32     tcg_gen_movi_i32(t0, val);
1322bdffd4a9Saurel32     return t0;
1323bdffd4a9Saurel32 }
1324bdffd4a9Saurel32 
1325a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val)
1326bdffd4a9Saurel32 {
1327a7812ae4Spbrook     TCGv_i64 t0;
1328a7812ae4Spbrook     t0 = tcg_temp_local_new_i64();
1329bdffd4a9Saurel32     tcg_gen_movi_i64(t0, val);
1330bdffd4a9Saurel32     return t0;
1331bdffd4a9Saurel32 }
1332bdffd4a9Saurel32 
133327bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG)
133427bfd83cSPeter Maydell void tcg_clear_temp_count(void)
133527bfd83cSPeter Maydell {
1336b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
133727bfd83cSPeter Maydell     s->temps_in_use = 0;
133827bfd83cSPeter Maydell }
133927bfd83cSPeter Maydell 
134027bfd83cSPeter Maydell int tcg_check_temp_count(void)
134127bfd83cSPeter Maydell {
1342b1311c4aSEmilio G. Cota     TCGContext *s = tcg_ctx;
134327bfd83cSPeter Maydell     if (s->temps_in_use) {
134427bfd83cSPeter Maydell         /* Clear the count so that we don't give another
134527bfd83cSPeter Maydell          * warning immediately next time around.
134627bfd83cSPeter Maydell          */
134727bfd83cSPeter Maydell         s->temps_in_use = 0;
134827bfd83cSPeter Maydell         return 1;
134927bfd83cSPeter Maydell     }
135027bfd83cSPeter Maydell     return 0;
135127bfd83cSPeter Maydell }
135227bfd83cSPeter Maydell #endif
135327bfd83cSPeter Maydell 
1354be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream.
1355be0f34b5SRichard Henderson    Test the runtime variable that controls each opcode.  */
1356be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op)
1357be0f34b5SRichard Henderson {
1358d2fd745fSRichard Henderson     const bool have_vec
1359d2fd745fSRichard Henderson         = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256;
1360d2fd745fSRichard Henderson 
1361be0f34b5SRichard Henderson     switch (op) {
1362be0f34b5SRichard Henderson     case INDEX_op_discard:
1363be0f34b5SRichard Henderson     case INDEX_op_set_label:
1364be0f34b5SRichard Henderson     case INDEX_op_call:
1365be0f34b5SRichard Henderson     case INDEX_op_br:
1366be0f34b5SRichard Henderson     case INDEX_op_mb:
1367be0f34b5SRichard Henderson     case INDEX_op_insn_start:
1368be0f34b5SRichard Henderson     case INDEX_op_exit_tb:
1369be0f34b5SRichard Henderson     case INDEX_op_goto_tb:
1370be0f34b5SRichard Henderson     case INDEX_op_qemu_ld_i32:
1371be0f34b5SRichard Henderson     case INDEX_op_qemu_st_i32:
1372be0f34b5SRichard Henderson     case INDEX_op_qemu_ld_i64:
1373be0f34b5SRichard Henderson     case INDEX_op_qemu_st_i64:
1374be0f34b5SRichard Henderson         return true;
1375be0f34b5SRichard Henderson 
1376be0f34b5SRichard Henderson     case INDEX_op_goto_ptr:
1377be0f34b5SRichard Henderson         return TCG_TARGET_HAS_goto_ptr;
1378be0f34b5SRichard Henderson 
1379be0f34b5SRichard Henderson     case INDEX_op_mov_i32:
1380be0f34b5SRichard Henderson     case INDEX_op_movi_i32:
1381be0f34b5SRichard Henderson     case INDEX_op_setcond_i32:
1382be0f34b5SRichard Henderson     case INDEX_op_brcond_i32:
1383be0f34b5SRichard Henderson     case INDEX_op_ld8u_i32:
1384be0f34b5SRichard Henderson     case INDEX_op_ld8s_i32:
1385be0f34b5SRichard Henderson     case INDEX_op_ld16u_i32:
1386be0f34b5SRichard Henderson     case INDEX_op_ld16s_i32:
1387be0f34b5SRichard Henderson     case INDEX_op_ld_i32:
1388be0f34b5SRichard Henderson     case INDEX_op_st8_i32:
1389be0f34b5SRichard Henderson     case INDEX_op_st16_i32:
1390be0f34b5SRichard Henderson     case INDEX_op_st_i32:
1391be0f34b5SRichard Henderson     case INDEX_op_add_i32:
1392be0f34b5SRichard Henderson     case INDEX_op_sub_i32:
1393be0f34b5SRichard Henderson     case INDEX_op_mul_i32:
1394be0f34b5SRichard Henderson     case INDEX_op_and_i32:
1395be0f34b5SRichard Henderson     case INDEX_op_or_i32:
1396be0f34b5SRichard Henderson     case INDEX_op_xor_i32:
1397be0f34b5SRichard Henderson     case INDEX_op_shl_i32:
1398be0f34b5SRichard Henderson     case INDEX_op_shr_i32:
1399be0f34b5SRichard Henderson     case INDEX_op_sar_i32:
1400be0f34b5SRichard Henderson         return true;
1401be0f34b5SRichard Henderson 
1402be0f34b5SRichard Henderson     case INDEX_op_movcond_i32:
1403be0f34b5SRichard Henderson         return TCG_TARGET_HAS_movcond_i32;
1404be0f34b5SRichard Henderson     case INDEX_op_div_i32:
1405be0f34b5SRichard Henderson     case INDEX_op_divu_i32:
1406be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div_i32;
1407be0f34b5SRichard Henderson     case INDEX_op_rem_i32:
1408be0f34b5SRichard Henderson     case INDEX_op_remu_i32:
1409be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rem_i32;
1410be0f34b5SRichard Henderson     case INDEX_op_div2_i32:
1411be0f34b5SRichard Henderson     case INDEX_op_divu2_i32:
1412be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div2_i32;
1413be0f34b5SRichard Henderson     case INDEX_op_rotl_i32:
1414be0f34b5SRichard Henderson     case INDEX_op_rotr_i32:
1415be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rot_i32;
1416be0f34b5SRichard Henderson     case INDEX_op_deposit_i32:
1417be0f34b5SRichard Henderson         return TCG_TARGET_HAS_deposit_i32;
1418be0f34b5SRichard Henderson     case INDEX_op_extract_i32:
1419be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extract_i32;
1420be0f34b5SRichard Henderson     case INDEX_op_sextract_i32:
1421be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sextract_i32;
1422be0f34b5SRichard Henderson     case INDEX_op_add2_i32:
1423be0f34b5SRichard Henderson         return TCG_TARGET_HAS_add2_i32;
1424be0f34b5SRichard Henderson     case INDEX_op_sub2_i32:
1425be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sub2_i32;
1426be0f34b5SRichard Henderson     case INDEX_op_mulu2_i32:
1427be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulu2_i32;
1428be0f34b5SRichard Henderson     case INDEX_op_muls2_i32:
1429be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muls2_i32;
1430be0f34b5SRichard Henderson     case INDEX_op_muluh_i32:
1431be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muluh_i32;
1432be0f34b5SRichard Henderson     case INDEX_op_mulsh_i32:
1433be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulsh_i32;
1434be0f34b5SRichard Henderson     case INDEX_op_ext8s_i32:
1435be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8s_i32;
1436be0f34b5SRichard Henderson     case INDEX_op_ext16s_i32:
1437be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16s_i32;
1438be0f34b5SRichard Henderson     case INDEX_op_ext8u_i32:
1439be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8u_i32;
1440be0f34b5SRichard Henderson     case INDEX_op_ext16u_i32:
1441be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16u_i32;
1442be0f34b5SRichard Henderson     case INDEX_op_bswap16_i32:
1443be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap16_i32;
1444be0f34b5SRichard Henderson     case INDEX_op_bswap32_i32:
1445be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap32_i32;
1446be0f34b5SRichard Henderson     case INDEX_op_not_i32:
1447be0f34b5SRichard Henderson         return TCG_TARGET_HAS_not_i32;
1448be0f34b5SRichard Henderson     case INDEX_op_neg_i32:
1449be0f34b5SRichard Henderson         return TCG_TARGET_HAS_neg_i32;
1450be0f34b5SRichard Henderson     case INDEX_op_andc_i32:
1451be0f34b5SRichard Henderson         return TCG_TARGET_HAS_andc_i32;
1452be0f34b5SRichard Henderson     case INDEX_op_orc_i32:
1453be0f34b5SRichard Henderson         return TCG_TARGET_HAS_orc_i32;
1454be0f34b5SRichard Henderson     case INDEX_op_eqv_i32:
1455be0f34b5SRichard Henderson         return TCG_TARGET_HAS_eqv_i32;
1456be0f34b5SRichard Henderson     case INDEX_op_nand_i32:
1457be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nand_i32;
1458be0f34b5SRichard Henderson     case INDEX_op_nor_i32:
1459be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nor_i32;
1460be0f34b5SRichard Henderson     case INDEX_op_clz_i32:
1461be0f34b5SRichard Henderson         return TCG_TARGET_HAS_clz_i32;
1462be0f34b5SRichard Henderson     case INDEX_op_ctz_i32:
1463be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctz_i32;
1464be0f34b5SRichard Henderson     case INDEX_op_ctpop_i32:
1465be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctpop_i32;
1466be0f34b5SRichard Henderson 
1467be0f34b5SRichard Henderson     case INDEX_op_brcond2_i32:
1468be0f34b5SRichard Henderson     case INDEX_op_setcond2_i32:
1469be0f34b5SRichard Henderson         return TCG_TARGET_REG_BITS == 32;
1470be0f34b5SRichard Henderson 
1471be0f34b5SRichard Henderson     case INDEX_op_mov_i64:
1472be0f34b5SRichard Henderson     case INDEX_op_movi_i64:
1473be0f34b5SRichard Henderson     case INDEX_op_setcond_i64:
1474be0f34b5SRichard Henderson     case INDEX_op_brcond_i64:
1475be0f34b5SRichard Henderson     case INDEX_op_ld8u_i64:
1476be0f34b5SRichard Henderson     case INDEX_op_ld8s_i64:
1477be0f34b5SRichard Henderson     case INDEX_op_ld16u_i64:
1478be0f34b5SRichard Henderson     case INDEX_op_ld16s_i64:
1479be0f34b5SRichard Henderson     case INDEX_op_ld32u_i64:
1480be0f34b5SRichard Henderson     case INDEX_op_ld32s_i64:
1481be0f34b5SRichard Henderson     case INDEX_op_ld_i64:
1482be0f34b5SRichard Henderson     case INDEX_op_st8_i64:
1483be0f34b5SRichard Henderson     case INDEX_op_st16_i64:
1484be0f34b5SRichard Henderson     case INDEX_op_st32_i64:
1485be0f34b5SRichard Henderson     case INDEX_op_st_i64:
1486be0f34b5SRichard Henderson     case INDEX_op_add_i64:
1487be0f34b5SRichard Henderson     case INDEX_op_sub_i64:
1488be0f34b5SRichard Henderson     case INDEX_op_mul_i64:
1489be0f34b5SRichard Henderson     case INDEX_op_and_i64:
1490be0f34b5SRichard Henderson     case INDEX_op_or_i64:
1491be0f34b5SRichard Henderson     case INDEX_op_xor_i64:
1492be0f34b5SRichard Henderson     case INDEX_op_shl_i64:
1493be0f34b5SRichard Henderson     case INDEX_op_shr_i64:
1494be0f34b5SRichard Henderson     case INDEX_op_sar_i64:
1495be0f34b5SRichard Henderson     case INDEX_op_ext_i32_i64:
1496be0f34b5SRichard Henderson     case INDEX_op_extu_i32_i64:
1497be0f34b5SRichard Henderson         return TCG_TARGET_REG_BITS == 64;
1498be0f34b5SRichard Henderson 
1499be0f34b5SRichard Henderson     case INDEX_op_movcond_i64:
1500be0f34b5SRichard Henderson         return TCG_TARGET_HAS_movcond_i64;
1501be0f34b5SRichard Henderson     case INDEX_op_div_i64:
1502be0f34b5SRichard Henderson     case INDEX_op_divu_i64:
1503be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div_i64;
1504be0f34b5SRichard Henderson     case INDEX_op_rem_i64:
1505be0f34b5SRichard Henderson     case INDEX_op_remu_i64:
1506be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rem_i64;
1507be0f34b5SRichard Henderson     case INDEX_op_div2_i64:
1508be0f34b5SRichard Henderson     case INDEX_op_divu2_i64:
1509be0f34b5SRichard Henderson         return TCG_TARGET_HAS_div2_i64;
1510be0f34b5SRichard Henderson     case INDEX_op_rotl_i64:
1511be0f34b5SRichard Henderson     case INDEX_op_rotr_i64:
1512be0f34b5SRichard Henderson         return TCG_TARGET_HAS_rot_i64;
1513be0f34b5SRichard Henderson     case INDEX_op_deposit_i64:
1514be0f34b5SRichard Henderson         return TCG_TARGET_HAS_deposit_i64;
1515be0f34b5SRichard Henderson     case INDEX_op_extract_i64:
1516be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extract_i64;
1517be0f34b5SRichard Henderson     case INDEX_op_sextract_i64:
1518be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sextract_i64;
1519be0f34b5SRichard Henderson     case INDEX_op_extrl_i64_i32:
1520be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extrl_i64_i32;
1521be0f34b5SRichard Henderson     case INDEX_op_extrh_i64_i32:
1522be0f34b5SRichard Henderson         return TCG_TARGET_HAS_extrh_i64_i32;
1523be0f34b5SRichard Henderson     case INDEX_op_ext8s_i64:
1524be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8s_i64;
1525be0f34b5SRichard Henderson     case INDEX_op_ext16s_i64:
1526be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16s_i64;
1527be0f34b5SRichard Henderson     case INDEX_op_ext32s_i64:
1528be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext32s_i64;
1529be0f34b5SRichard Henderson     case INDEX_op_ext8u_i64:
1530be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext8u_i64;
1531be0f34b5SRichard Henderson     case INDEX_op_ext16u_i64:
1532be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext16u_i64;
1533be0f34b5SRichard Henderson     case INDEX_op_ext32u_i64:
1534be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ext32u_i64;
1535be0f34b5SRichard Henderson     case INDEX_op_bswap16_i64:
1536be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap16_i64;
1537be0f34b5SRichard Henderson     case INDEX_op_bswap32_i64:
1538be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap32_i64;
1539be0f34b5SRichard Henderson     case INDEX_op_bswap64_i64:
1540be0f34b5SRichard Henderson         return TCG_TARGET_HAS_bswap64_i64;
1541be0f34b5SRichard Henderson     case INDEX_op_not_i64:
1542be0f34b5SRichard Henderson         return TCG_TARGET_HAS_not_i64;
1543be0f34b5SRichard Henderson     case INDEX_op_neg_i64:
1544be0f34b5SRichard Henderson         return TCG_TARGET_HAS_neg_i64;
1545be0f34b5SRichard Henderson     case INDEX_op_andc_i64:
1546be0f34b5SRichard Henderson         return TCG_TARGET_HAS_andc_i64;
1547be0f34b5SRichard Henderson     case INDEX_op_orc_i64:
1548be0f34b5SRichard Henderson         return TCG_TARGET_HAS_orc_i64;
1549be0f34b5SRichard Henderson     case INDEX_op_eqv_i64:
1550be0f34b5SRichard Henderson         return TCG_TARGET_HAS_eqv_i64;
1551be0f34b5SRichard Henderson     case INDEX_op_nand_i64:
1552be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nand_i64;
1553be0f34b5SRichard Henderson     case INDEX_op_nor_i64:
1554be0f34b5SRichard Henderson         return TCG_TARGET_HAS_nor_i64;
1555be0f34b5SRichard Henderson     case INDEX_op_clz_i64:
1556be0f34b5SRichard Henderson         return TCG_TARGET_HAS_clz_i64;
1557be0f34b5SRichard Henderson     case INDEX_op_ctz_i64:
1558be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctz_i64;
1559be0f34b5SRichard Henderson     case INDEX_op_ctpop_i64:
1560be0f34b5SRichard Henderson         return TCG_TARGET_HAS_ctpop_i64;
1561be0f34b5SRichard Henderson     case INDEX_op_add2_i64:
1562be0f34b5SRichard Henderson         return TCG_TARGET_HAS_add2_i64;
1563be0f34b5SRichard Henderson     case INDEX_op_sub2_i64:
1564be0f34b5SRichard Henderson         return TCG_TARGET_HAS_sub2_i64;
1565be0f34b5SRichard Henderson     case INDEX_op_mulu2_i64:
1566be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulu2_i64;
1567be0f34b5SRichard Henderson     case INDEX_op_muls2_i64:
1568be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muls2_i64;
1569be0f34b5SRichard Henderson     case INDEX_op_muluh_i64:
1570be0f34b5SRichard Henderson         return TCG_TARGET_HAS_muluh_i64;
1571be0f34b5SRichard Henderson     case INDEX_op_mulsh_i64:
1572be0f34b5SRichard Henderson         return TCG_TARGET_HAS_mulsh_i64;
1573be0f34b5SRichard Henderson 
1574d2fd745fSRichard Henderson     case INDEX_op_mov_vec:
1575d2fd745fSRichard Henderson     case INDEX_op_dup_vec:
1576d2fd745fSRichard Henderson     case INDEX_op_dupi_vec:
1577d2fd745fSRichard Henderson     case INDEX_op_ld_vec:
1578d2fd745fSRichard Henderson     case INDEX_op_st_vec:
1579d2fd745fSRichard Henderson     case INDEX_op_add_vec:
1580d2fd745fSRichard Henderson     case INDEX_op_sub_vec:
1581d2fd745fSRichard Henderson     case INDEX_op_and_vec:
1582d2fd745fSRichard Henderson     case INDEX_op_or_vec:
1583d2fd745fSRichard Henderson     case INDEX_op_xor_vec:
1584212be173SRichard Henderson     case INDEX_op_cmp_vec:
1585d2fd745fSRichard Henderson         return have_vec;
1586d2fd745fSRichard Henderson     case INDEX_op_dup2_vec:
1587d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_REG_BITS == 32;
1588d2fd745fSRichard Henderson     case INDEX_op_not_vec:
1589d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_not_vec;
1590d2fd745fSRichard Henderson     case INDEX_op_neg_vec:
1591d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_neg_vec;
1592d2fd745fSRichard Henderson     case INDEX_op_andc_vec:
1593d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_andc_vec;
1594d2fd745fSRichard Henderson     case INDEX_op_orc_vec:
1595d2fd745fSRichard Henderson         return have_vec && TCG_TARGET_HAS_orc_vec;
15963774030aSRichard Henderson     case INDEX_op_mul_vec:
15973774030aSRichard Henderson         return have_vec && TCG_TARGET_HAS_mul_vec;
1598d0ec9796SRichard Henderson     case INDEX_op_shli_vec:
1599d0ec9796SRichard Henderson     case INDEX_op_shri_vec:
1600d0ec9796SRichard Henderson     case INDEX_op_sari_vec:
1601d0ec9796SRichard Henderson         return have_vec && TCG_TARGET_HAS_shi_vec;
1602d0ec9796SRichard Henderson     case INDEX_op_shls_vec:
1603d0ec9796SRichard Henderson     case INDEX_op_shrs_vec:
1604d0ec9796SRichard Henderson     case INDEX_op_sars_vec:
1605d0ec9796SRichard Henderson         return have_vec && TCG_TARGET_HAS_shs_vec;
1606d0ec9796SRichard Henderson     case INDEX_op_shlv_vec:
1607d0ec9796SRichard Henderson     case INDEX_op_shrv_vec:
1608d0ec9796SRichard Henderson     case INDEX_op_sarv_vec:
1609d0ec9796SRichard Henderson         return have_vec && TCG_TARGET_HAS_shv_vec;
1610d2fd745fSRichard Henderson 
1611db432672SRichard Henderson     default:
1612db432672SRichard Henderson         tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS);
1613db432672SRichard Henderson         return true;
1614be0f34b5SRichard Henderson     }
1615be0f34b5SRichard Henderson }
1616be0f34b5SRichard Henderson 
161739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment
161839cf05d3Sbellard    and endian swap. Maybe it would be better to do the alignment
161939cf05d3Sbellard    and endian swap in tcg_reg_alloc_call(). */
1620ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args)
1621c896fe29Sbellard {
162275e8b9b7SRichard Henderson     int i, real_args, nb_rets, pi;
1623bbb8a1b4SRichard Henderson     unsigned sizemask, flags;
1624afb49896SRichard Henderson     TCGHelperInfo *info;
162575e8b9b7SRichard Henderson     TCGOp *op;
1626afb49896SRichard Henderson 
1627619205fdSEmilio G. Cota     info = g_hash_table_lookup(helper_table, (gpointer)func);
1628bbb8a1b4SRichard Henderson     flags = info->flags;
1629bbb8a1b4SRichard Henderson     sizemask = info->sizemask;
16302bece2c8SRichard Henderson 
163134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \
163234b1a49cSRichard Henderson     && !defined(CONFIG_TCG_INTERPRETER)
163334b1a49cSRichard Henderson     /* We have 64-bit values in one register, but need to pass as two
163434b1a49cSRichard Henderson        separate parameters.  Split them.  */
163534b1a49cSRichard Henderson     int orig_sizemask = sizemask;
163634b1a49cSRichard Henderson     int orig_nargs = nargs;
163734b1a49cSRichard Henderson     TCGv_i64 retl, reth;
1638ae8b75dcSRichard Henderson     TCGTemp *split_args[MAX_OPC_PARAM];
163934b1a49cSRichard Henderson 
1640f764718dSRichard Henderson     retl = NULL;
1641f764718dSRichard Henderson     reth = NULL;
164234b1a49cSRichard Henderson     if (sizemask != 0) {
164334b1a49cSRichard Henderson         for (i = real_args = 0; i < nargs; ++i) {
164434b1a49cSRichard Henderson             int is_64bit = sizemask & (1 << (i+1)*2);
164534b1a49cSRichard Henderson             if (is_64bit) {
1646085272b3SRichard Henderson                 TCGv_i64 orig = temp_tcgv_i64(args[i]);
164734b1a49cSRichard Henderson                 TCGv_i32 h = tcg_temp_new_i32();
164834b1a49cSRichard Henderson                 TCGv_i32 l = tcg_temp_new_i32();
164934b1a49cSRichard Henderson                 tcg_gen_extr_i64_i32(l, h, orig);
1650ae8b75dcSRichard Henderson                 split_args[real_args++] = tcgv_i32_temp(h);
1651ae8b75dcSRichard Henderson                 split_args[real_args++] = tcgv_i32_temp(l);
165234b1a49cSRichard Henderson             } else {
165334b1a49cSRichard Henderson                 split_args[real_args++] = args[i];
165434b1a49cSRichard Henderson             }
165534b1a49cSRichard Henderson         }
165634b1a49cSRichard Henderson         nargs = real_args;
165734b1a49cSRichard Henderson         args = split_args;
165834b1a49cSRichard Henderson         sizemask = 0;
165934b1a49cSRichard Henderson     }
166034b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
16612bece2c8SRichard Henderson     for (i = 0; i < nargs; ++i) {
16622bece2c8SRichard Henderson         int is_64bit = sizemask & (1 << (i+1)*2);
16632bece2c8SRichard Henderson         int is_signed = sizemask & (2 << (i+1)*2);
16642bece2c8SRichard Henderson         if (!is_64bit) {
16652bece2c8SRichard Henderson             TCGv_i64 temp = tcg_temp_new_i64();
1666085272b3SRichard Henderson             TCGv_i64 orig = temp_tcgv_i64(args[i]);
16672bece2c8SRichard Henderson             if (is_signed) {
16682bece2c8SRichard Henderson                 tcg_gen_ext32s_i64(temp, orig);
16692bece2c8SRichard Henderson             } else {
16702bece2c8SRichard Henderson                 tcg_gen_ext32u_i64(temp, orig);
16712bece2c8SRichard Henderson             }
1672ae8b75dcSRichard Henderson             args[i] = tcgv_i64_temp(temp);
16732bece2c8SRichard Henderson         }
16742bece2c8SRichard Henderson     }
16752bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */
16762bece2c8SRichard Henderson 
167715fa08f8SRichard Henderson     op = tcg_emit_op(INDEX_op_call);
167875e8b9b7SRichard Henderson 
167975e8b9b7SRichard Henderson     pi = 0;
1680ae8b75dcSRichard Henderson     if (ret != NULL) {
168134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \
168234b1a49cSRichard Henderson     && !defined(CONFIG_TCG_INTERPRETER)
168334b1a49cSRichard Henderson         if (orig_sizemask & 1) {
168434b1a49cSRichard Henderson             /* The 32-bit ABI is going to return the 64-bit value in
168534b1a49cSRichard Henderson                the %o0/%o1 register pair.  Prepare for this by using
168634b1a49cSRichard Henderson                two return temporaries, and reassemble below.  */
168734b1a49cSRichard Henderson             retl = tcg_temp_new_i64();
168834b1a49cSRichard Henderson             reth = tcg_temp_new_i64();
1689ae8b75dcSRichard Henderson             op->args[pi++] = tcgv_i64_arg(reth);
1690ae8b75dcSRichard Henderson             op->args[pi++] = tcgv_i64_arg(retl);
169134b1a49cSRichard Henderson             nb_rets = 2;
169234b1a49cSRichard Henderson         } else {
1693ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
169434b1a49cSRichard Henderson             nb_rets = 1;
169534b1a49cSRichard Henderson         }
169634b1a49cSRichard Henderson #else
169734b1a49cSRichard Henderson         if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) {
169802eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN
1699ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret + 1);
1700ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
1701a7812ae4Spbrook #else
1702ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
1703ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret + 1);
1704a7812ae4Spbrook #endif
1705a7812ae4Spbrook             nb_rets = 2;
170634b1a49cSRichard Henderson         } else {
1707ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(ret);
1708a7812ae4Spbrook             nb_rets = 1;
1709a7812ae4Spbrook         }
171034b1a49cSRichard Henderson #endif
1711a7812ae4Spbrook     } else {
1712a7812ae4Spbrook         nb_rets = 0;
1713a7812ae4Spbrook     }
1714cd9090aaSRichard Henderson     TCGOP_CALLO(op) = nb_rets;
171575e8b9b7SRichard Henderson 
1716a7812ae4Spbrook     real_args = 0;
1717a7812ae4Spbrook     for (i = 0; i < nargs; i++) {
17182bece2c8SRichard Henderson         int is_64bit = sizemask & (1 << (i+1)*2);
1719bbb8a1b4SRichard Henderson         if (TCG_TARGET_REG_BITS < 64 && is_64bit) {
172039cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS
172139cf05d3Sbellard             /* some targets want aligned 64 bit args */
1722ebd486d5Smalc             if (real_args & 1) {
172375e8b9b7SRichard Henderson                 op->args[pi++] = TCG_CALL_DUMMY_ARG;
1724ebd486d5Smalc                 real_args++;
172539cf05d3Sbellard             }
172639cf05d3Sbellard #endif
17273f90f252SRichard Henderson            /* If stack grows up, then we will be placing successive
17283f90f252SRichard Henderson               arguments at lower addresses, which means we need to
17293f90f252SRichard Henderson               reverse the order compared to how we would normally
17303f90f252SRichard Henderson               treat either big or little-endian.  For those arguments
17313f90f252SRichard Henderson               that will wind up in registers, this still works for
17323f90f252SRichard Henderson               HPPA (the only current STACK_GROWSUP target) since the
17333f90f252SRichard Henderson               argument registers are *also* allocated in decreasing
17343f90f252SRichard Henderson               order.  If another such target is added, this logic may
17353f90f252SRichard Henderson               have to get more complicated to differentiate between
17363f90f252SRichard Henderson               stack arguments and register arguments.  */
173702eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP)
1738ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i] + 1);
1739ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i]);
1740c896fe29Sbellard #else
1741ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i]);
1742ae8b75dcSRichard Henderson             op->args[pi++] = temp_arg(args[i] + 1);
1743c896fe29Sbellard #endif
1744a7812ae4Spbrook             real_args += 2;
17452bece2c8SRichard Henderson             continue;
17462bece2c8SRichard Henderson         }
17472bece2c8SRichard Henderson 
1748ae8b75dcSRichard Henderson         op->args[pi++] = temp_arg(args[i]);
1749a7812ae4Spbrook         real_args++;
1750c896fe29Sbellard     }
175175e8b9b7SRichard Henderson     op->args[pi++] = (uintptr_t)func;
175275e8b9b7SRichard Henderson     op->args[pi++] = flags;
1753cd9090aaSRichard Henderson     TCGOP_CALLI(op) = real_args;
1754a7812ae4Spbrook 
175575e8b9b7SRichard Henderson     /* Make sure the fields didn't overflow.  */
1756cd9090aaSRichard Henderson     tcg_debug_assert(TCGOP_CALLI(op) == real_args);
175775e8b9b7SRichard Henderson     tcg_debug_assert(pi <= ARRAY_SIZE(op->args));
17582bece2c8SRichard Henderson 
175934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \
176034b1a49cSRichard Henderson     && !defined(CONFIG_TCG_INTERPRETER)
176134b1a49cSRichard Henderson     /* Free all of the parts we allocated above.  */
176234b1a49cSRichard Henderson     for (i = real_args = 0; i < orig_nargs; ++i) {
176334b1a49cSRichard Henderson         int is_64bit = orig_sizemask & (1 << (i+1)*2);
176434b1a49cSRichard Henderson         if (is_64bit) {
1765085272b3SRichard Henderson             tcg_temp_free_internal(args[real_args++]);
1766085272b3SRichard Henderson             tcg_temp_free_internal(args[real_args++]);
176734b1a49cSRichard Henderson         } else {
176834b1a49cSRichard Henderson             real_args++;
176934b1a49cSRichard Henderson         }
177034b1a49cSRichard Henderson     }
177134b1a49cSRichard Henderson     if (orig_sizemask & 1) {
177234b1a49cSRichard Henderson         /* The 32-bit ABI returned two 32-bit pieces.  Re-assemble them.
177334b1a49cSRichard Henderson            Note that describing these as TCGv_i64 eliminates an unnecessary
177434b1a49cSRichard Henderson            zero-extension that tcg_gen_concat_i32_i64 would create.  */
1775085272b3SRichard Henderson         tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth);
177634b1a49cSRichard Henderson         tcg_temp_free_i64(retl);
177734b1a49cSRichard Henderson         tcg_temp_free_i64(reth);
177834b1a49cSRichard Henderson     }
177934b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
17802bece2c8SRichard Henderson     for (i = 0; i < nargs; ++i) {
17812bece2c8SRichard Henderson         int is_64bit = sizemask & (1 << (i+1)*2);
17822bece2c8SRichard Henderson         if (!is_64bit) {
1783085272b3SRichard Henderson             tcg_temp_free_internal(args[i]);
17842bece2c8SRichard Henderson         }
17852bece2c8SRichard Henderson     }
17862bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */
1787a7812ae4Spbrook }
1788c896fe29Sbellard 
17898fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s)
1790c896fe29Sbellard {
1791ac3b8891SRichard Henderson     int i, n;
1792c896fe29Sbellard     TCGTemp *ts;
1793ac3b8891SRichard Henderson 
1794ac3b8891SRichard Henderson     for (i = 0, n = s->nb_globals; i < n; i++) {
1795c896fe29Sbellard         ts = &s->temps[i];
1796ac3b8891SRichard Henderson         ts->val_type = (ts->fixed_reg ? TEMP_VAL_REG : TEMP_VAL_MEM);
1797c896fe29Sbellard     }
1798ac3b8891SRichard Henderson     for (n = s->nb_temps; i < n; i++) {
1799e8996ee0Sbellard         ts = &s->temps[i];
1800ac3b8891SRichard Henderson         ts->val_type = (ts->temp_local ? TEMP_VAL_MEM : TEMP_VAL_DEAD);
1801e8996ee0Sbellard         ts->mem_allocated = 0;
1802e8996ee0Sbellard         ts->fixed_reg = 0;
1803e8996ee0Sbellard     }
1804f8b2f202SRichard Henderson 
1805f8b2f202SRichard Henderson     memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp));
1806c896fe29Sbellard }
1807c896fe29Sbellard 
1808f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size,
1809f8b2f202SRichard Henderson                                  TCGTemp *ts)
1810c896fe29Sbellard {
18111807f4c4SRichard Henderson     int idx = temp_idx(ts);
1812ac56dd48Spbrook 
1813fa477d25SRichard Henderson     if (ts->temp_global) {
1814ac56dd48Spbrook         pstrcpy(buf, buf_size, ts->name);
1815f8b2f202SRichard Henderson     } else if (ts->temp_local) {
1816641d5fbeSbellard         snprintf(buf, buf_size, "loc%d", idx - s->nb_globals);
1817f8b2f202SRichard Henderson     } else {
1818ac56dd48Spbrook         snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals);
1819c896fe29Sbellard     }
1820c896fe29Sbellard     return buf;
1821c896fe29Sbellard }
1822c896fe29Sbellard 
182343439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf,
182443439139SRichard Henderson                              int buf_size, TCGArg arg)
1825f8b2f202SRichard Henderson {
182643439139SRichard Henderson     return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg));
1827f8b2f202SRichard Henderson }
1828f8b2f202SRichard Henderson 
18296e085f72SRichard Henderson /* Find helper name.  */
18306e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val)
1831e8996ee0Sbellard {
18326e085f72SRichard Henderson     const char *ret = NULL;
1833619205fdSEmilio G. Cota     if (helper_table) {
1834619205fdSEmilio G. Cota         TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val);
183572866e82SRichard Henderson         if (info) {
183672866e82SRichard Henderson             ret = info->name;
183772866e82SRichard Henderson         }
1838e8996ee0Sbellard     }
18396e085f72SRichard Henderson     return ret;
18404dc81f28Sbellard }
18414dc81f28Sbellard 
1842f48f3edeSblueswir1 static const char * const cond_name[] =
1843f48f3edeSblueswir1 {
18440aed257fSRichard Henderson     [TCG_COND_NEVER] = "never",
18450aed257fSRichard Henderson     [TCG_COND_ALWAYS] = "always",
1846f48f3edeSblueswir1     [TCG_COND_EQ] = "eq",
1847f48f3edeSblueswir1     [TCG_COND_NE] = "ne",
1848f48f3edeSblueswir1     [TCG_COND_LT] = "lt",
1849f48f3edeSblueswir1     [TCG_COND_GE] = "ge",
1850f48f3edeSblueswir1     [TCG_COND_LE] = "le",
1851f48f3edeSblueswir1     [TCG_COND_GT] = "gt",
1852f48f3edeSblueswir1     [TCG_COND_LTU] = "ltu",
1853f48f3edeSblueswir1     [TCG_COND_GEU] = "geu",
1854f48f3edeSblueswir1     [TCG_COND_LEU] = "leu",
1855f48f3edeSblueswir1     [TCG_COND_GTU] = "gtu"
1856f48f3edeSblueswir1 };
1857f48f3edeSblueswir1 
1858f713d6adSRichard Henderson static const char * const ldst_name[] =
1859f713d6adSRichard Henderson {
1860f713d6adSRichard Henderson     [MO_UB]   = "ub",
1861f713d6adSRichard Henderson     [MO_SB]   = "sb",
1862f713d6adSRichard Henderson     [MO_LEUW] = "leuw",
1863f713d6adSRichard Henderson     [MO_LESW] = "lesw",
1864f713d6adSRichard Henderson     [MO_LEUL] = "leul",
1865f713d6adSRichard Henderson     [MO_LESL] = "lesl",
1866f713d6adSRichard Henderson     [MO_LEQ]  = "leq",
1867f713d6adSRichard Henderson     [MO_BEUW] = "beuw",
1868f713d6adSRichard Henderson     [MO_BESW] = "besw",
1869f713d6adSRichard Henderson     [MO_BEUL] = "beul",
1870f713d6adSRichard Henderson     [MO_BESL] = "besl",
1871f713d6adSRichard Henderson     [MO_BEQ]  = "beq",
1872f713d6adSRichard Henderson };
1873f713d6adSRichard Henderson 
18741f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = {
18751f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY
18761f00b27fSSergey Sorokin     [MO_UNALN >> MO_ASHIFT]    = "un+",
18771f00b27fSSergey Sorokin     [MO_ALIGN >> MO_ASHIFT]    = "",
18781f00b27fSSergey Sorokin #else
18791f00b27fSSergey Sorokin     [MO_UNALN >> MO_ASHIFT]    = "",
18801f00b27fSSergey Sorokin     [MO_ALIGN >> MO_ASHIFT]    = "al+",
18811f00b27fSSergey Sorokin #endif
18821f00b27fSSergey Sorokin     [MO_ALIGN_2 >> MO_ASHIFT]  = "al2+",
18831f00b27fSSergey Sorokin     [MO_ALIGN_4 >> MO_ASHIFT]  = "al4+",
18841f00b27fSSergey Sorokin     [MO_ALIGN_8 >> MO_ASHIFT]  = "al8+",
18851f00b27fSSergey Sorokin     [MO_ALIGN_16 >> MO_ASHIFT] = "al16+",
18861f00b27fSSergey Sorokin     [MO_ALIGN_32 >> MO_ASHIFT] = "al32+",
18871f00b27fSSergey Sorokin     [MO_ALIGN_64 >> MO_ASHIFT] = "al64+",
18881f00b27fSSergey Sorokin };
18891f00b27fSSergey Sorokin 
1890b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d)
1891b016486eSRichard Henderson {
1892b016486eSRichard Henderson     return (d & (d - 1)) == 0;
1893b016486eSRichard Henderson }
1894b016486eSRichard Henderson 
1895b016486eSRichard Henderson static inline TCGReg tcg_regset_first(TCGRegSet d)
1896b016486eSRichard Henderson {
1897b016486eSRichard Henderson     if (TCG_TARGET_NB_REGS <= 32) {
1898b016486eSRichard Henderson         return ctz32(d);
1899b016486eSRichard Henderson     } else {
1900b016486eSRichard Henderson         return ctz64(d);
1901b016486eSRichard Henderson     }
1902b016486eSRichard Henderson }
1903b016486eSRichard Henderson 
19041894f69aSRichard Henderson static void tcg_dump_ops(TCGContext *s, bool have_prefs)
1905c896fe29Sbellard {
1906c896fe29Sbellard     char buf[128];
1907c45cb8bbSRichard Henderson     TCGOp *op;
1908c896fe29Sbellard 
190915fa08f8SRichard Henderson     QTAILQ_FOREACH(op, &s->ops, link) {
1910c45cb8bbSRichard Henderson         int i, k, nb_oargs, nb_iargs, nb_cargs;
1911c45cb8bbSRichard Henderson         const TCGOpDef *def;
1912c45cb8bbSRichard Henderson         TCGOpcode c;
1913bdfb460eSRichard Henderson         int col = 0;
1914c45cb8bbSRichard Henderson 
1915c45cb8bbSRichard Henderson         c = op->opc;
1916c896fe29Sbellard         def = &tcg_op_defs[c];
1917c45cb8bbSRichard Henderson 
1918765b842aSRichard Henderson         if (c == INDEX_op_insn_start) {
1919b016486eSRichard Henderson             nb_oargs = 0;
192015fa08f8SRichard Henderson             col += qemu_log("\n ----");
19219aef40edSRichard Henderson 
19229aef40edSRichard Henderson             for (i = 0; i < TARGET_INSN_START_WORDS; ++i) {
19239aef40edSRichard Henderson                 target_ulong a;
19247e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
1925efee3746SRichard Henderson                 a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]);
19267e4597d7Sbellard #else
1927efee3746SRichard Henderson                 a = op->args[i];
19287e4597d7Sbellard #endif
1929bdfb460eSRichard Henderson                 col += qemu_log(" " TARGET_FMT_lx, a);
1930eeacee4dSBlue Swirl             }
19317e4597d7Sbellard         } else if (c == INDEX_op_call) {
1932c896fe29Sbellard             /* variable number of arguments */
1933cd9090aaSRichard Henderson             nb_oargs = TCGOP_CALLO(op);
1934cd9090aaSRichard Henderson             nb_iargs = TCGOP_CALLI(op);
1935c896fe29Sbellard             nb_cargs = def->nb_cargs;
1936b03cce8eSbellard 
1937cf066674SRichard Henderson             /* function name, flags, out args */
1938bdfb460eSRichard Henderson             col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name,
1939efee3746SRichard Henderson                             tcg_find_helper(s, op->args[nb_oargs + nb_iargs]),
1940efee3746SRichard Henderson                             op->args[nb_oargs + nb_iargs + 1], nb_oargs);
1941b03cce8eSbellard             for (i = 0; i < nb_oargs; i++) {
194243439139SRichard Henderson                 col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf),
1943efee3746SRichard Henderson                                                        op->args[i]));
1944b03cce8eSbellard             }
1945cf066674SRichard Henderson             for (i = 0; i < nb_iargs; i++) {
1946efee3746SRichard Henderson                 TCGArg arg = op->args[nb_oargs + i];
1947cf066674SRichard Henderson                 const char *t = "<dummy>";
1948cf066674SRichard Henderson                 if (arg != TCG_CALL_DUMMY_ARG) {
194943439139SRichard Henderson                     t = tcg_get_arg_str(s, buf, sizeof(buf), arg);
1950b03cce8eSbellard                 }
1951bdfb460eSRichard Henderson                 col += qemu_log(",%s", t);
1952e8996ee0Sbellard             }
1953b03cce8eSbellard         } else {
1954bdfb460eSRichard Henderson             col += qemu_log(" %s ", def->name);
1955c45cb8bbSRichard Henderson 
1956c896fe29Sbellard             nb_oargs = def->nb_oargs;
1957c896fe29Sbellard             nb_iargs = def->nb_iargs;
1958c896fe29Sbellard             nb_cargs = def->nb_cargs;
1959c896fe29Sbellard 
1960d2fd745fSRichard Henderson             if (def->flags & TCG_OPF_VECTOR) {
1961d2fd745fSRichard Henderson                 col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op),
1962d2fd745fSRichard Henderson                                 8 << TCGOP_VECE(op));
1963d2fd745fSRichard Henderson             }
1964d2fd745fSRichard Henderson 
1965c896fe29Sbellard             k = 0;
1966c896fe29Sbellard             for (i = 0; i < nb_oargs; i++) {
1967eeacee4dSBlue Swirl                 if (k != 0) {
1968bdfb460eSRichard Henderson                     col += qemu_log(",");
1969eeacee4dSBlue Swirl                 }
197043439139SRichard Henderson                 col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf),
1971efee3746SRichard Henderson                                                       op->args[k++]));
1972c896fe29Sbellard             }
1973c896fe29Sbellard             for (i = 0; i < nb_iargs; i++) {
1974eeacee4dSBlue Swirl                 if (k != 0) {
1975bdfb460eSRichard Henderson                     col += qemu_log(",");
1976eeacee4dSBlue Swirl                 }
197743439139SRichard Henderson                 col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf),
1978efee3746SRichard Henderson                                                       op->args[k++]));
1979c896fe29Sbellard             }
1980be210acbSRichard Henderson             switch (c) {
1981be210acbSRichard Henderson             case INDEX_op_brcond_i32:
1982ffc5ea09SRichard Henderson             case INDEX_op_setcond_i32:
1983ffc5ea09SRichard Henderson             case INDEX_op_movcond_i32:
1984be210acbSRichard Henderson             case INDEX_op_brcond2_i32:
1985be210acbSRichard Henderson             case INDEX_op_setcond2_i32:
1986ffc5ea09SRichard Henderson             case INDEX_op_brcond_i64:
1987be210acbSRichard Henderson             case INDEX_op_setcond_i64:
1988ffc5ea09SRichard Henderson             case INDEX_op_movcond_i64:
1989212be173SRichard Henderson             case INDEX_op_cmp_vec:
1990efee3746SRichard Henderson                 if (op->args[k] < ARRAY_SIZE(cond_name)
1991efee3746SRichard Henderson                     && cond_name[op->args[k]]) {
1992efee3746SRichard Henderson                     col += qemu_log(",%s", cond_name[op->args[k++]]);
1993eeacee4dSBlue Swirl                 } else {
1994efee3746SRichard Henderson                     col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]);
1995eeacee4dSBlue Swirl                 }
1996f48f3edeSblueswir1                 i = 1;
1997be210acbSRichard Henderson                 break;
1998f713d6adSRichard Henderson             case INDEX_op_qemu_ld_i32:
1999f713d6adSRichard Henderson             case INDEX_op_qemu_st_i32:
2000f713d6adSRichard Henderson             case INDEX_op_qemu_ld_i64:
2001f713d6adSRichard Henderson             case INDEX_op_qemu_st_i64:
200259227d5dSRichard Henderson                 {
2003efee3746SRichard Henderson                     TCGMemOpIdx oi = op->args[k++];
200459227d5dSRichard Henderson                     TCGMemOp op = get_memop(oi);
200559227d5dSRichard Henderson                     unsigned ix = get_mmuidx(oi);
200659227d5dSRichard Henderson 
200759c4b7e8SRichard Henderson                     if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) {
2008bdfb460eSRichard Henderson                         col += qemu_log(",$0x%x,%u", op, ix);
200959c4b7e8SRichard Henderson                     } else {
20101f00b27fSSergey Sorokin                         const char *s_al, *s_op;
20111f00b27fSSergey Sorokin                         s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT];
201259c4b7e8SRichard Henderson                         s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)];
2013bdfb460eSRichard Henderson                         col += qemu_log(",%s%s,%u", s_al, s_op, ix);
2014f713d6adSRichard Henderson                     }
2015f713d6adSRichard Henderson                     i = 1;
201659227d5dSRichard Henderson                 }
2017f713d6adSRichard Henderson                 break;
2018be210acbSRichard Henderson             default:
2019f48f3edeSblueswir1                 i = 0;
2020be210acbSRichard Henderson                 break;
2021be210acbSRichard Henderson             }
202251e3972cSRichard Henderson             switch (c) {
202351e3972cSRichard Henderson             case INDEX_op_set_label:
202451e3972cSRichard Henderson             case INDEX_op_br:
202551e3972cSRichard Henderson             case INDEX_op_brcond_i32:
202651e3972cSRichard Henderson             case INDEX_op_brcond_i64:
202751e3972cSRichard Henderson             case INDEX_op_brcond2_i32:
2028efee3746SRichard Henderson                 col += qemu_log("%s$L%d", k ? "," : "",
2029efee3746SRichard Henderson                                 arg_label(op->args[k])->id);
203051e3972cSRichard Henderson                 i++, k++;
203151e3972cSRichard Henderson                 break;
203251e3972cSRichard Henderson             default:
203351e3972cSRichard Henderson                 break;
2034eeacee4dSBlue Swirl             }
203551e3972cSRichard Henderson             for (; i < nb_cargs; i++, k++) {
2036efee3746SRichard Henderson                 col += qemu_log("%s$0x%" TCG_PRIlx, k ? "," : "", op->args[k]);
2037bdfb460eSRichard Henderson             }
2038bdfb460eSRichard Henderson         }
2039bdfb460eSRichard Henderson 
20401894f69aSRichard Henderson         if (have_prefs || op->life) {
20411894f69aSRichard Henderson             for (; col < 40; ++col) {
2042bdfb460eSRichard Henderson                 putc(' ', qemu_logfile);
2043bdfb460eSRichard Henderson             }
20441894f69aSRichard Henderson         }
20451894f69aSRichard Henderson 
20461894f69aSRichard Henderson         if (op->life) {
20471894f69aSRichard Henderson             unsigned life = op->life;
2048bdfb460eSRichard Henderson 
2049bdfb460eSRichard Henderson             if (life & (SYNC_ARG * 3)) {
2050bdfb460eSRichard Henderson                 qemu_log("  sync:");
2051bdfb460eSRichard Henderson                 for (i = 0; i < 2; ++i) {
2052bdfb460eSRichard Henderson                     if (life & (SYNC_ARG << i)) {
2053bdfb460eSRichard Henderson                         qemu_log(" %d", i);
2054bdfb460eSRichard Henderson                     }
2055bdfb460eSRichard Henderson                 }
2056bdfb460eSRichard Henderson             }
2057bdfb460eSRichard Henderson             life /= DEAD_ARG;
2058bdfb460eSRichard Henderson             if (life) {
2059bdfb460eSRichard Henderson                 qemu_log("  dead:");
2060bdfb460eSRichard Henderson                 for (i = 0; life; ++i, life >>= 1) {
2061bdfb460eSRichard Henderson                     if (life & 1) {
2062bdfb460eSRichard Henderson                         qemu_log(" %d", i);
2063bdfb460eSRichard Henderson                     }
2064bdfb460eSRichard Henderson                 }
2065c896fe29Sbellard             }
2066b03cce8eSbellard         }
20671894f69aSRichard Henderson 
20681894f69aSRichard Henderson         if (have_prefs) {
20691894f69aSRichard Henderson             for (i = 0; i < nb_oargs; ++i) {
20701894f69aSRichard Henderson                 TCGRegSet set = op->output_pref[i];
20711894f69aSRichard Henderson 
20721894f69aSRichard Henderson                 if (i == 0) {
20731894f69aSRichard Henderson                     qemu_log("  pref=");
20741894f69aSRichard Henderson                 } else {
20751894f69aSRichard Henderson                     qemu_log(",");
20761894f69aSRichard Henderson                 }
20771894f69aSRichard Henderson                 if (set == 0) {
20781894f69aSRichard Henderson                     qemu_log("none");
20791894f69aSRichard Henderson                 } else if (set == MAKE_64BIT_MASK(0, TCG_TARGET_NB_REGS)) {
20801894f69aSRichard Henderson                     qemu_log("all");
20811894f69aSRichard Henderson #ifdef CONFIG_DEBUG_TCG
20821894f69aSRichard Henderson                 } else if (tcg_regset_single(set)) {
20831894f69aSRichard Henderson                     TCGReg reg = tcg_regset_first(set);
20841894f69aSRichard Henderson                     qemu_log("%s", tcg_target_reg_names[reg]);
20851894f69aSRichard Henderson #endif
20861894f69aSRichard Henderson                 } else if (TCG_TARGET_NB_REGS <= 32) {
20871894f69aSRichard Henderson                     qemu_log("%#x", (uint32_t)set);
20881894f69aSRichard Henderson                 } else {
20891894f69aSRichard Henderson                     qemu_log("%#" PRIx64, (uint64_t)set);
20901894f69aSRichard Henderson                 }
20911894f69aSRichard Henderson             }
20921894f69aSRichard Henderson         }
20931894f69aSRichard Henderson 
2094eeacee4dSBlue Swirl         qemu_log("\n");
2095c896fe29Sbellard     }
2096c896fe29Sbellard }
2097c896fe29Sbellard 
2098c896fe29Sbellard /* we give more priority to constraints with less registers */
2099c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k)
2100c896fe29Sbellard {
2101c896fe29Sbellard     const TCGArgConstraint *arg_ct;
2102c896fe29Sbellard 
2103c896fe29Sbellard     int i, n;
2104c896fe29Sbellard     arg_ct = &def->args_ct[k];
2105c896fe29Sbellard     if (arg_ct->ct & TCG_CT_ALIAS) {
2106c896fe29Sbellard         /* an alias is equivalent to a single register */
2107c896fe29Sbellard         n = 1;
2108c896fe29Sbellard     } else {
2109c896fe29Sbellard         if (!(arg_ct->ct & TCG_CT_REG))
2110c896fe29Sbellard             return 0;
2111c896fe29Sbellard         n = 0;
2112c896fe29Sbellard         for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
2113c896fe29Sbellard             if (tcg_regset_test_reg(arg_ct->u.regs, i))
2114c896fe29Sbellard                 n++;
2115c896fe29Sbellard         }
2116c896fe29Sbellard     }
2117c896fe29Sbellard     return TCG_TARGET_NB_REGS - n + 1;
2118c896fe29Sbellard }
2119c896fe29Sbellard 
2120c896fe29Sbellard /* sort from highest priority to lowest */
2121c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n)
2122c896fe29Sbellard {
2123c896fe29Sbellard     int i, j, p1, p2, tmp;
2124c896fe29Sbellard 
2125c896fe29Sbellard     for(i = 0; i < n; i++)
2126c896fe29Sbellard         def->sorted_args[start + i] = start + i;
2127c896fe29Sbellard     if (n <= 1)
2128c896fe29Sbellard         return;
2129c896fe29Sbellard     for(i = 0; i < n - 1; i++) {
2130c896fe29Sbellard         for(j = i + 1; j < n; j++) {
2131c896fe29Sbellard             p1 = get_constraint_priority(def, def->sorted_args[start + i]);
2132c896fe29Sbellard             p2 = get_constraint_priority(def, def->sorted_args[start + j]);
2133c896fe29Sbellard             if (p1 < p2) {
2134c896fe29Sbellard                 tmp = def->sorted_args[start + i];
2135c896fe29Sbellard                 def->sorted_args[start + i] = def->sorted_args[start + j];
2136c896fe29Sbellard                 def->sorted_args[start + j] = tmp;
2137c896fe29Sbellard             }
2138c896fe29Sbellard         }
2139c896fe29Sbellard     }
2140c896fe29Sbellard }
2141c896fe29Sbellard 
2142f69d277eSRichard Henderson static void process_op_defs(TCGContext *s)
2143c896fe29Sbellard {
2144a9751609SRichard Henderson     TCGOpcode op;
2145c896fe29Sbellard 
2146f69d277eSRichard Henderson     for (op = 0; op < NB_OPS; op++) {
2147f69d277eSRichard Henderson         TCGOpDef *def = &tcg_op_defs[op];
2148f69d277eSRichard Henderson         const TCGTargetOpDef *tdefs;
2149069ea736SRichard Henderson         TCGType type;
2150069ea736SRichard Henderson         int i, nb_args;
2151f69d277eSRichard Henderson 
2152f69d277eSRichard Henderson         if (def->flags & TCG_OPF_NOT_PRESENT) {
2153f69d277eSRichard Henderson             continue;
2154f69d277eSRichard Henderson         }
2155f69d277eSRichard Henderson 
2156c896fe29Sbellard         nb_args = def->nb_iargs + def->nb_oargs;
2157f69d277eSRichard Henderson         if (nb_args == 0) {
2158f69d277eSRichard Henderson             continue;
2159f69d277eSRichard Henderson         }
2160f69d277eSRichard Henderson 
2161f69d277eSRichard Henderson         tdefs = tcg_target_op_def(op);
2162f69d277eSRichard Henderson         /* Missing TCGTargetOpDef entry. */
2163f69d277eSRichard Henderson         tcg_debug_assert(tdefs != NULL);
2164f69d277eSRichard Henderson 
2165069ea736SRichard Henderson         type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32);
2166c896fe29Sbellard         for (i = 0; i < nb_args; i++) {
2167f69d277eSRichard Henderson             const char *ct_str = tdefs->args_ct_str[i];
2168f69d277eSRichard Henderson             /* Incomplete TCGTargetOpDef entry. */
2169eabb7b91SAurelien Jarno             tcg_debug_assert(ct_str != NULL);
2170f69d277eSRichard Henderson 
2171ccb1bb66SRichard Henderson             def->args_ct[i].u.regs = 0;
2172c896fe29Sbellard             def->args_ct[i].ct = 0;
217317280ff4SRichard Henderson             while (*ct_str != '\0') {
217417280ff4SRichard Henderson                 switch(*ct_str) {
217517280ff4SRichard Henderson                 case '0' ... '9':
217617280ff4SRichard Henderson                     {
217717280ff4SRichard Henderson                         int oarg = *ct_str - '0';
217817280ff4SRichard Henderson                         tcg_debug_assert(ct_str == tdefs->args_ct_str[i]);
2179eabb7b91SAurelien Jarno                         tcg_debug_assert(oarg < def->nb_oargs);
2180eabb7b91SAurelien Jarno                         tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG);
218117280ff4SRichard Henderson                         /* TCG_CT_ALIAS is for the output arguments.
218217280ff4SRichard Henderson                            The input is tagged with TCG_CT_IALIAS. */
2183c896fe29Sbellard                         def->args_ct[i] = def->args_ct[oarg];
218417280ff4SRichard Henderson                         def->args_ct[oarg].ct |= TCG_CT_ALIAS;
21855ff9d6a4Sbellard                         def->args_ct[oarg].alias_index = i;
2186c896fe29Sbellard                         def->args_ct[i].ct |= TCG_CT_IALIAS;
21875ff9d6a4Sbellard                         def->args_ct[i].alias_index = oarg;
218817280ff4SRichard Henderson                     }
218917280ff4SRichard Henderson                     ct_str++;
2190c896fe29Sbellard                     break;
219182790a87SRichard Henderson                 case '&':
219282790a87SRichard Henderson                     def->args_ct[i].ct |= TCG_CT_NEWREG;
219382790a87SRichard Henderson                     ct_str++;
219482790a87SRichard Henderson                     break;
2195c896fe29Sbellard                 case 'i':
2196c896fe29Sbellard                     def->args_ct[i].ct |= TCG_CT_CONST;
2197c896fe29Sbellard                     ct_str++;
2198c896fe29Sbellard                     break;
2199c896fe29Sbellard                 default:
2200069ea736SRichard Henderson                     ct_str = target_parse_constraint(&def->args_ct[i],
2201069ea736SRichard Henderson                                                      ct_str, type);
2202f69d277eSRichard Henderson                     /* Typo in TCGTargetOpDef constraint. */
2203069ea736SRichard Henderson                     tcg_debug_assert(ct_str != NULL);
2204c896fe29Sbellard                 }
2205c896fe29Sbellard             }
2206c896fe29Sbellard         }
2207c896fe29Sbellard 
2208c68aaa18SStefan Weil         /* TCGTargetOpDef entry with too much information? */
2209eabb7b91SAurelien Jarno         tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL);
2210c68aaa18SStefan Weil 
2211c896fe29Sbellard         /* sort the constraints (XXX: this is just an heuristic) */
2212c896fe29Sbellard         sort_constraints(def, 0, def->nb_oargs);
2213c896fe29Sbellard         sort_constraints(def, def->nb_oargs, def->nb_iargs);
2214c896fe29Sbellard     }
2215c896fe29Sbellard }
2216c896fe29Sbellard 
22170c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op)
22180c627cdcSRichard Henderson {
2219d88a117eSRichard Henderson     TCGLabel *label;
2220d88a117eSRichard Henderson 
2221d88a117eSRichard Henderson     switch (op->opc) {
2222d88a117eSRichard Henderson     case INDEX_op_br:
2223d88a117eSRichard Henderson         label = arg_label(op->args[0]);
2224d88a117eSRichard Henderson         label->refs--;
2225d88a117eSRichard Henderson         break;
2226d88a117eSRichard Henderson     case INDEX_op_brcond_i32:
2227d88a117eSRichard Henderson     case INDEX_op_brcond_i64:
2228d88a117eSRichard Henderson         label = arg_label(op->args[3]);
2229d88a117eSRichard Henderson         label->refs--;
2230d88a117eSRichard Henderson         break;
2231d88a117eSRichard Henderson     case INDEX_op_brcond2_i32:
2232d88a117eSRichard Henderson         label = arg_label(op->args[5]);
2233d88a117eSRichard Henderson         label->refs--;
2234d88a117eSRichard Henderson         break;
2235d88a117eSRichard Henderson     default:
2236d88a117eSRichard Henderson         break;
2237d88a117eSRichard Henderson     }
2238d88a117eSRichard Henderson 
223915fa08f8SRichard Henderson     QTAILQ_REMOVE(&s->ops, op, link);
224015fa08f8SRichard Henderson     QTAILQ_INSERT_TAIL(&s->free_ops, op, link);
2241abebf925SRichard Henderson     s->nb_ops--;
22420c627cdcSRichard Henderson 
22430c627cdcSRichard Henderson #ifdef CONFIG_PROFILER
2244c3fac113SEmilio G. Cota     atomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1);
22450c627cdcSRichard Henderson #endif
22460c627cdcSRichard Henderson }
22470c627cdcSRichard Henderson 
224815fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc)
224915fa08f8SRichard Henderson {
225015fa08f8SRichard Henderson     TCGContext *s = tcg_ctx;
225115fa08f8SRichard Henderson     TCGOp *op;
225215fa08f8SRichard Henderson 
225315fa08f8SRichard Henderson     if (likely(QTAILQ_EMPTY(&s->free_ops))) {
225415fa08f8SRichard Henderson         op = tcg_malloc(sizeof(TCGOp));
225515fa08f8SRichard Henderson     } else {
225615fa08f8SRichard Henderson         op = QTAILQ_FIRST(&s->free_ops);
225715fa08f8SRichard Henderson         QTAILQ_REMOVE(&s->free_ops, op, link);
225815fa08f8SRichard Henderson     }
225915fa08f8SRichard Henderson     memset(op, 0, offsetof(TCGOp, link));
226015fa08f8SRichard Henderson     op->opc = opc;
2261abebf925SRichard Henderson     s->nb_ops++;
226215fa08f8SRichard Henderson 
226315fa08f8SRichard Henderson     return op;
226415fa08f8SRichard Henderson }
226515fa08f8SRichard Henderson 
226615fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc)
226715fa08f8SRichard Henderson {
226815fa08f8SRichard Henderson     TCGOp *op = tcg_op_alloc(opc);
226915fa08f8SRichard Henderson     QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link);
227015fa08f8SRichard Henderson     return op;
227115fa08f8SRichard Henderson }
227215fa08f8SRichard Henderson 
2273ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc)
22745a18407fSRichard Henderson {
227515fa08f8SRichard Henderson     TCGOp *new_op = tcg_op_alloc(opc);
227615fa08f8SRichard Henderson     QTAILQ_INSERT_BEFORE(old_op, new_op, link);
22775a18407fSRichard Henderson     return new_op;
22785a18407fSRichard Henderson }
22795a18407fSRichard Henderson 
2280ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc)
22815a18407fSRichard Henderson {
228215fa08f8SRichard Henderson     TCGOp *new_op = tcg_op_alloc(opc);
228315fa08f8SRichard Henderson     QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link);
22845a18407fSRichard Henderson     return new_op;
22855a18407fSRichard Henderson }
22865a18407fSRichard Henderson 
2287b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code.  */
2288b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s)
2289b4fc67c7SRichard Henderson {
2290b4fc67c7SRichard Henderson     TCGOp *op, *op_next;
2291b4fc67c7SRichard Henderson     bool dead = false;
2292b4fc67c7SRichard Henderson 
2293b4fc67c7SRichard Henderson     QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) {
2294b4fc67c7SRichard Henderson         bool remove = dead;
2295b4fc67c7SRichard Henderson         TCGLabel *label;
2296b4fc67c7SRichard Henderson         int call_flags;
2297b4fc67c7SRichard Henderson 
2298b4fc67c7SRichard Henderson         switch (op->opc) {
2299b4fc67c7SRichard Henderson         case INDEX_op_set_label:
2300b4fc67c7SRichard Henderson             label = arg_label(op->args[0]);
2301b4fc67c7SRichard Henderson             if (label->refs == 0) {
2302b4fc67c7SRichard Henderson                 /*
2303b4fc67c7SRichard Henderson                  * While there is an occasional backward branch, virtually
2304b4fc67c7SRichard Henderson                  * all branches generated by the translators are forward.
2305b4fc67c7SRichard Henderson                  * Which means that generally we will have already removed
2306b4fc67c7SRichard Henderson                  * all references to the label that will be, and there is
2307b4fc67c7SRichard Henderson                  * little to be gained by iterating.
2308b4fc67c7SRichard Henderson                  */
2309b4fc67c7SRichard Henderson                 remove = true;
2310b4fc67c7SRichard Henderson             } else {
2311b4fc67c7SRichard Henderson                 /* Once we see a label, insns become live again.  */
2312b4fc67c7SRichard Henderson                 dead = false;
2313b4fc67c7SRichard Henderson                 remove = false;
2314b4fc67c7SRichard Henderson 
2315b4fc67c7SRichard Henderson                 /*
2316b4fc67c7SRichard Henderson                  * Optimization can fold conditional branches to unconditional.
2317b4fc67c7SRichard Henderson                  * If we find a label with one reference which is preceded by
2318b4fc67c7SRichard Henderson                  * an unconditional branch to it, remove both.  This needed to
2319b4fc67c7SRichard Henderson                  * wait until the dead code in between them was removed.
2320b4fc67c7SRichard Henderson                  */
2321b4fc67c7SRichard Henderson                 if (label->refs == 1) {
2322b4fc67c7SRichard Henderson                     TCGOp *op_prev = QTAILQ_PREV(op, TCGOpHead, link);
2323b4fc67c7SRichard Henderson                     if (op_prev->opc == INDEX_op_br &&
2324b4fc67c7SRichard Henderson                         label == arg_label(op_prev->args[0])) {
2325b4fc67c7SRichard Henderson                         tcg_op_remove(s, op_prev);
2326b4fc67c7SRichard Henderson                         remove = true;
2327b4fc67c7SRichard Henderson                     }
2328b4fc67c7SRichard Henderson                 }
2329b4fc67c7SRichard Henderson             }
2330b4fc67c7SRichard Henderson             break;
2331b4fc67c7SRichard Henderson 
2332b4fc67c7SRichard Henderson         case INDEX_op_br:
2333b4fc67c7SRichard Henderson         case INDEX_op_exit_tb:
2334b4fc67c7SRichard Henderson         case INDEX_op_goto_ptr:
2335b4fc67c7SRichard Henderson             /* Unconditional branches; everything following is dead.  */
2336b4fc67c7SRichard Henderson             dead = true;
2337b4fc67c7SRichard Henderson             break;
2338b4fc67c7SRichard Henderson 
2339b4fc67c7SRichard Henderson         case INDEX_op_call:
2340b4fc67c7SRichard Henderson             /* Notice noreturn helper calls, raising exceptions.  */
2341b4fc67c7SRichard Henderson             call_flags = op->args[TCGOP_CALLO(op) + TCGOP_CALLI(op) + 1];
2342b4fc67c7SRichard Henderson             if (call_flags & TCG_CALL_NO_RETURN) {
2343b4fc67c7SRichard Henderson                 dead = true;
2344b4fc67c7SRichard Henderson             }
2345b4fc67c7SRichard Henderson             break;
2346b4fc67c7SRichard Henderson 
2347b4fc67c7SRichard Henderson         case INDEX_op_insn_start:
2348b4fc67c7SRichard Henderson             /* Never remove -- we need to keep these for unwind.  */
2349b4fc67c7SRichard Henderson             remove = false;
2350b4fc67c7SRichard Henderson             break;
2351b4fc67c7SRichard Henderson 
2352b4fc67c7SRichard Henderson         default:
2353b4fc67c7SRichard Henderson             break;
2354b4fc67c7SRichard Henderson         }
2355b4fc67c7SRichard Henderson 
2356b4fc67c7SRichard Henderson         if (remove) {
2357b4fc67c7SRichard Henderson             tcg_op_remove(s, op);
2358b4fc67c7SRichard Henderson         }
2359b4fc67c7SRichard Henderson     }
2360b4fc67c7SRichard Henderson }
2361b4fc67c7SRichard Henderson 
/*
 * Bits stored in a temp's 'state' field by the liveness passes.
 * They may be combined (TS_DEAD | TS_MEM).
 */
#define TS_DEAD  1
#define TS_MEM   2

/*
 * Test bit @n of the per-op life data.  Both macros expect a variable
 * named 'arg_life' to be in scope at the point of use.
 */
#define IS_DEAD_ARG(n)   (arg_life & (DEAD_ARG << (n)))
#define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n)))
23675a18407fSRichard Henderson 
23689c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals
23699c43b68dSAurelien Jarno    should be in memory. */
2370b83eabeaSRichard Henderson static void tcg_la_func_end(TCGContext *s)
2371c896fe29Sbellard {
2372b83eabeaSRichard Henderson     int ng = s->nb_globals;
2373b83eabeaSRichard Henderson     int nt = s->nb_temps;
2374b83eabeaSRichard Henderson     int i;
2375b83eabeaSRichard Henderson 
2376b83eabeaSRichard Henderson     for (i = 0; i < ng; ++i) {
2377b83eabeaSRichard Henderson         s->temps[i].state = TS_DEAD | TS_MEM;
2378b83eabeaSRichard Henderson     }
2379b83eabeaSRichard Henderson     for (i = ng; i < nt; ++i) {
2380b83eabeaSRichard Henderson         s->temps[i].state = TS_DEAD;
2381b83eabeaSRichard Henderson     }
2382c896fe29Sbellard }
2383c896fe29Sbellard 
23849c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals
23859c43b68dSAurelien Jarno    and local temps should be in memory. */
2386b83eabeaSRichard Henderson static void tcg_la_bb_end(TCGContext *s)
2387641d5fbeSbellard {
2388b83eabeaSRichard Henderson     int ng = s->nb_globals;
2389b83eabeaSRichard Henderson     int nt = s->nb_temps;
2390b83eabeaSRichard Henderson     int i;
2391641d5fbeSbellard 
2392b83eabeaSRichard Henderson     for (i = 0; i < ng; ++i) {
2393b83eabeaSRichard Henderson         s->temps[i].state = TS_DEAD | TS_MEM;
2394c70fbf0aSRichard Henderson     }
2395b83eabeaSRichard Henderson     for (i = ng; i < nt; ++i) {
2396b83eabeaSRichard Henderson         s->temps[i].state = (s->temps[i].temp_local
2397b83eabeaSRichard Henderson                              ? TS_DEAD | TS_MEM
2398b83eabeaSRichard Henderson                              : TS_DEAD);
2399641d5fbeSbellard     }
2400641d5fbeSbellard }
2401641d5fbeSbellard 
2402a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a
2403c896fe29Sbellard    given input arguments is dead. Instructions updating dead
2404c896fe29Sbellard    temporaries are removed. */
2405b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s)
2406c896fe29Sbellard {
2407c70fbf0aSRichard Henderson     int nb_globals = s->nb_globals;
240815fa08f8SRichard Henderson     TCGOp *op, *op_prev;
2409c896fe29Sbellard 
2410b83eabeaSRichard Henderson     tcg_la_func_end(s);
2411c896fe29Sbellard 
241215fa08f8SRichard Henderson     QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, TCGOpHead, link, op_prev) {
2413c45cb8bbSRichard Henderson         int i, nb_iargs, nb_oargs;
2414c45cb8bbSRichard Henderson         TCGOpcode opc_new, opc_new2;
2415c45cb8bbSRichard Henderson         bool have_opc_new2;
2416a1b3c48dSRichard Henderson         TCGLifeData arg_life = 0;
2417b83eabeaSRichard Henderson         TCGTemp *arg_ts;
2418c45cb8bbSRichard Henderson         TCGOpcode opc = op->opc;
2419c45cb8bbSRichard Henderson         const TCGOpDef *def = &tcg_op_defs[opc];
2420c45cb8bbSRichard Henderson 
2421c45cb8bbSRichard Henderson         switch (opc) {
2422c896fe29Sbellard         case INDEX_op_call:
2423c6e113f5Sbellard             {
2424c6e113f5Sbellard                 int call_flags;
2425c6e113f5Sbellard 
2426cd9090aaSRichard Henderson                 nb_oargs = TCGOP_CALLO(op);
2427cd9090aaSRichard Henderson                 nb_iargs = TCGOP_CALLI(op);
2428efee3746SRichard Henderson                 call_flags = op->args[nb_oargs + nb_iargs + 1];
2429c6e113f5Sbellard 
2430c45cb8bbSRichard Henderson                 /* pure functions can be removed if their result is unused */
243178505279SAurelien Jarno                 if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) {
2432c6e113f5Sbellard                     for (i = 0; i < nb_oargs; i++) {
2433b83eabeaSRichard Henderson                         arg_ts = arg_temp(op->args[i]);
2434b83eabeaSRichard Henderson                         if (arg_ts->state != TS_DEAD) {
2435c6e113f5Sbellard                             goto do_not_remove_call;
2436c6e113f5Sbellard                         }
24379c43b68dSAurelien Jarno                     }
2438c45cb8bbSRichard Henderson                     goto do_remove;
2439*152c35aaSRichard Henderson                 }
2440c6e113f5Sbellard             do_not_remove_call:
2441c896fe29Sbellard 
2442c896fe29Sbellard                 /* output args are dead */
2443c896fe29Sbellard                 for (i = 0; i < nb_oargs; i++) {
2444b83eabeaSRichard Henderson                     arg_ts = arg_temp(op->args[i]);
2445b83eabeaSRichard Henderson                     if (arg_ts->state & TS_DEAD) {
2446a1b3c48dSRichard Henderson                         arg_life |= DEAD_ARG << i;
24476b64b624SAurelien Jarno                     }
2448b83eabeaSRichard Henderson                     if (arg_ts->state & TS_MEM) {
2449a1b3c48dSRichard Henderson                         arg_life |= SYNC_ARG << i;
24509c43b68dSAurelien Jarno                     }
2451b83eabeaSRichard Henderson                     arg_ts->state = TS_DEAD;
2452c896fe29Sbellard                 }
2453c896fe29Sbellard 
245478505279SAurelien Jarno                 if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS |
245578505279SAurelien Jarno                                     TCG_CALL_NO_READ_GLOBALS))) {
24569c43b68dSAurelien Jarno                     /* globals should go back to memory */
2457b83eabeaSRichard Henderson                     for (i = 0; i < nb_globals; i++) {
2458b83eabeaSRichard Henderson                         s->temps[i].state = TS_DEAD | TS_MEM;
2459b83eabeaSRichard Henderson                     }
2460c70fbf0aSRichard Henderson                 } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) {
2461c70fbf0aSRichard Henderson                     /* globals should be synced to memory */
2462c70fbf0aSRichard Henderson                     for (i = 0; i < nb_globals; i++) {
2463b83eabeaSRichard Henderson                         s->temps[i].state |= TS_MEM;
2464c70fbf0aSRichard Henderson                     }
2465b9c18f56Saurel32                 }
2466c896fe29Sbellard 
2467c19f47bfSAurelien Jarno                 /* record arguments that die in this helper */
2468866cb6cbSAurelien Jarno                 for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2469b83eabeaSRichard Henderson                     arg_ts = arg_temp(op->args[i]);
2470b83eabeaSRichard Henderson                     if (arg_ts && arg_ts->state & TS_DEAD) {
2471a1b3c48dSRichard Henderson                         arg_life |= DEAD_ARG << i;
2472c896fe29Sbellard                     }
2473c896fe29Sbellard                 }
247467cc32ebSVeres Lajos                 /* input arguments are live for preceding opcodes */
2475c70fbf0aSRichard Henderson                 for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2476b83eabeaSRichard Henderson                     arg_ts = arg_temp(op->args[i]);
2477b83eabeaSRichard Henderson                     if (arg_ts) {
2478b83eabeaSRichard Henderson                         arg_ts->state &= ~TS_DEAD;
2479c70fbf0aSRichard Henderson                     }
2480c19f47bfSAurelien Jarno                 }
2481c6e113f5Sbellard             }
2482c896fe29Sbellard             break;
2483765b842aSRichard Henderson         case INDEX_op_insn_start:
2484c896fe29Sbellard             break;
24855ff9d6a4Sbellard         case INDEX_op_discard:
24865ff9d6a4Sbellard             /* mark the temporary as dead */
2487b83eabeaSRichard Henderson             arg_temp(op->args[0])->state = TS_DEAD;
24885ff9d6a4Sbellard             break;
24891305c451SRichard Henderson 
24901305c451SRichard Henderson         case INDEX_op_add2_i32:
2491c45cb8bbSRichard Henderson             opc_new = INDEX_op_add_i32;
2492f1fae40cSRichard Henderson             goto do_addsub2;
24931305c451SRichard Henderson         case INDEX_op_sub2_i32:
2494c45cb8bbSRichard Henderson             opc_new = INDEX_op_sub_i32;
2495f1fae40cSRichard Henderson             goto do_addsub2;
2496f1fae40cSRichard Henderson         case INDEX_op_add2_i64:
2497c45cb8bbSRichard Henderson             opc_new = INDEX_op_add_i64;
2498f1fae40cSRichard Henderson             goto do_addsub2;
2499f1fae40cSRichard Henderson         case INDEX_op_sub2_i64:
2500c45cb8bbSRichard Henderson             opc_new = INDEX_op_sub_i64;
2501f1fae40cSRichard Henderson         do_addsub2:
25021305c451SRichard Henderson             nb_iargs = 4;
25031305c451SRichard Henderson             nb_oargs = 2;
25041305c451SRichard Henderson             /* Test if the high part of the operation is dead, but not
25051305c451SRichard Henderson                the low part.  The result can be optimized to a simple
25061305c451SRichard Henderson                add or sub.  This happens often for x86_64 guest when the
25071305c451SRichard Henderson                cpu mode is set to 32 bit.  */
2508b83eabeaSRichard Henderson             if (arg_temp(op->args[1])->state == TS_DEAD) {
2509b83eabeaSRichard Henderson                 if (arg_temp(op->args[0])->state == TS_DEAD) {
25101305c451SRichard Henderson                     goto do_remove;
25111305c451SRichard Henderson                 }
2512c45cb8bbSRichard Henderson                 /* Replace the opcode and adjust the args in place,
2513c45cb8bbSRichard Henderson                    leaving 3 unused args at the end.  */
2514c45cb8bbSRichard Henderson                 op->opc = opc = opc_new;
2515efee3746SRichard Henderson                 op->args[1] = op->args[2];
2516efee3746SRichard Henderson                 op->args[2] = op->args[4];
25171305c451SRichard Henderson                 /* Fall through and mark the single-word operation live.  */
25181305c451SRichard Henderson                 nb_iargs = 2;
25191305c451SRichard Henderson                 nb_oargs = 1;
25201305c451SRichard Henderson             }
25211305c451SRichard Henderson             goto do_not_remove;
25221305c451SRichard Henderson 
25231414968aSRichard Henderson         case INDEX_op_mulu2_i32:
2524c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i32;
2525c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_muluh_i32;
2526c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_muluh_i32;
252703271524SRichard Henderson             goto do_mul2;
2528f1fae40cSRichard Henderson         case INDEX_op_muls2_i32:
2529c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i32;
2530c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_mulsh_i32;
2531c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_mulsh_i32;
2532f1fae40cSRichard Henderson             goto do_mul2;
2533f1fae40cSRichard Henderson         case INDEX_op_mulu2_i64:
2534c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i64;
2535c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_muluh_i64;
2536c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_muluh_i64;
253703271524SRichard Henderson             goto do_mul2;
2538f1fae40cSRichard Henderson         case INDEX_op_muls2_i64:
2539c45cb8bbSRichard Henderson             opc_new = INDEX_op_mul_i64;
2540c45cb8bbSRichard Henderson             opc_new2 = INDEX_op_mulsh_i64;
2541c45cb8bbSRichard Henderson             have_opc_new2 = TCG_TARGET_HAS_mulsh_i64;
254203271524SRichard Henderson             goto do_mul2;
2543f1fae40cSRichard Henderson         do_mul2:
25441414968aSRichard Henderson             nb_iargs = 2;
25451414968aSRichard Henderson             nb_oargs = 2;
2546b83eabeaSRichard Henderson             if (arg_temp(op->args[1])->state == TS_DEAD) {
2547b83eabeaSRichard Henderson                 if (arg_temp(op->args[0])->state == TS_DEAD) {
254803271524SRichard Henderson                     /* Both parts of the operation are dead.  */
25491414968aSRichard Henderson                     goto do_remove;
25501414968aSRichard Henderson                 }
255103271524SRichard Henderson                 /* The high part of the operation is dead; generate the low. */
2552c45cb8bbSRichard Henderson                 op->opc = opc = opc_new;
2553efee3746SRichard Henderson                 op->args[1] = op->args[2];
2554efee3746SRichard Henderson                 op->args[2] = op->args[3];
2555b83eabeaSRichard Henderson             } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) {
255603271524SRichard Henderson                 /* The low part of the operation is dead; generate the high. */
2557c45cb8bbSRichard Henderson                 op->opc = opc = opc_new2;
2558efee3746SRichard Henderson                 op->args[0] = op->args[1];
2559efee3746SRichard Henderson                 op->args[1] = op->args[2];
2560efee3746SRichard Henderson                 op->args[2] = op->args[3];
256103271524SRichard Henderson             } else {
256203271524SRichard Henderson                 goto do_not_remove;
256303271524SRichard Henderson             }
256403271524SRichard Henderson             /* Mark the single-word operation live.  */
25651414968aSRichard Henderson             nb_oargs = 1;
25661414968aSRichard Henderson             goto do_not_remove;
25671414968aSRichard Henderson 
2568c896fe29Sbellard         default:
25691305c451SRichard Henderson             /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
2570c896fe29Sbellard             nb_iargs = def->nb_iargs;
2571c896fe29Sbellard             nb_oargs = def->nb_oargs;
2572c896fe29Sbellard 
2573c896fe29Sbellard             /* Test if the operation can be removed because all
25745ff9d6a4Sbellard                its outputs are dead. We assume that nb_oargs == 0
25755ff9d6a4Sbellard                implies side effects */
25765ff9d6a4Sbellard             if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) {
2577c896fe29Sbellard                 for (i = 0; i < nb_oargs; i++) {
2578b83eabeaSRichard Henderson                     if (arg_temp(op->args[i])->state != TS_DEAD) {
2579c896fe29Sbellard                         goto do_not_remove;
2580c896fe29Sbellard                     }
25819c43b68dSAurelien Jarno                 }
2582*152c35aaSRichard Henderson                 goto do_remove;
2583*152c35aaSRichard Henderson             }
2584*152c35aaSRichard Henderson             goto do_not_remove;
2585*152c35aaSRichard Henderson 
25861305c451SRichard Henderson         do_remove:
25870c627cdcSRichard Henderson             tcg_op_remove(s, op);
2588*152c35aaSRichard Henderson             break;
2589*152c35aaSRichard Henderson 
2590c896fe29Sbellard         do_not_remove:
2591c896fe29Sbellard             /* output args are dead */
2592c896fe29Sbellard             for (i = 0; i < nb_oargs; i++) {
2593b83eabeaSRichard Henderson                 arg_ts = arg_temp(op->args[i]);
2594b83eabeaSRichard Henderson                 if (arg_ts->state & TS_DEAD) {
2595a1b3c48dSRichard Henderson                     arg_life |= DEAD_ARG << i;
25966b64b624SAurelien Jarno                 }
2597b83eabeaSRichard Henderson                 if (arg_ts->state & TS_MEM) {
2598a1b3c48dSRichard Henderson                     arg_life |= SYNC_ARG << i;
25999c43b68dSAurelien Jarno                 }
2600b83eabeaSRichard Henderson                 arg_ts->state = TS_DEAD;
2601c896fe29Sbellard             }
2602c896fe29Sbellard 
2603c896fe29Sbellard             /* if end of basic block, update */
2604c896fe29Sbellard             if (def->flags & TCG_OPF_BB_END) {
2605b83eabeaSRichard Henderson                 tcg_la_bb_end(s);
26063d5c5f87SAurelien Jarno             } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
26073d5c5f87SAurelien Jarno                 /* globals should be synced to memory */
2608c70fbf0aSRichard Henderson                 for (i = 0; i < nb_globals; i++) {
2609b83eabeaSRichard Henderson                     s->temps[i].state |= TS_MEM;
2610c70fbf0aSRichard Henderson                 }
2611c896fe29Sbellard             }
2612c896fe29Sbellard 
2613c19f47bfSAurelien Jarno             /* record arguments that die in this opcode */
2614866cb6cbSAurelien Jarno             for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
2615b83eabeaSRichard Henderson                 arg_ts = arg_temp(op->args[i]);
2616b83eabeaSRichard Henderson                 if (arg_ts->state & TS_DEAD) {
2617a1b3c48dSRichard Henderson                     arg_life |= DEAD_ARG << i;
2618c896fe29Sbellard                 }
2619c19f47bfSAurelien Jarno             }
262067cc32ebSVeres Lajos             /* input arguments are live for preceding opcodes */
2621c19f47bfSAurelien Jarno             for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
2622b83eabeaSRichard Henderson                 arg_temp(op->args[i])->state &= ~TS_DEAD;
2623c896fe29Sbellard             }
2624c896fe29Sbellard             break;
2625c896fe29Sbellard         }
2626bee158cbSRichard Henderson         op->life = arg_life;
262769e3706dSRichard Henderson         op->output_pref[0] = 0;
262869e3706dSRichard Henderson         op->output_pref[1] = 0;
2629c896fe29Sbellard     }
26301ff0a2c5SEvgeny Voevodin }
2631c896fe29Sbellard 
26325a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries.  */
2633b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s)
26345a18407fSRichard Henderson {
26355a18407fSRichard Henderson     int nb_globals = s->nb_globals;
263615fa08f8SRichard Henderson     int nb_temps, i;
26375a18407fSRichard Henderson     bool changes = false;
263815fa08f8SRichard Henderson     TCGOp *op, *op_next;
26395a18407fSRichard Henderson 
26405a18407fSRichard Henderson     /* Create a temporary for each indirect global.  */
26415a18407fSRichard Henderson     for (i = 0; i < nb_globals; ++i) {
26425a18407fSRichard Henderson         TCGTemp *its = &s->temps[i];
26435a18407fSRichard Henderson         if (its->indirect_reg) {
26445a18407fSRichard Henderson             TCGTemp *dts = tcg_temp_alloc(s);
26455a18407fSRichard Henderson             dts->type = its->type;
26465a18407fSRichard Henderson             dts->base_type = its->base_type;
2647b83eabeaSRichard Henderson             its->state_ptr = dts;
2648b83eabeaSRichard Henderson         } else {
2649b83eabeaSRichard Henderson             its->state_ptr = NULL;
26505a18407fSRichard Henderson         }
2651b83eabeaSRichard Henderson         /* All globals begin dead.  */
2652b83eabeaSRichard Henderson         its->state = TS_DEAD;
26535a18407fSRichard Henderson     }
2654b83eabeaSRichard Henderson     for (nb_temps = s->nb_temps; i < nb_temps; ++i) {
2655b83eabeaSRichard Henderson         TCGTemp *its = &s->temps[i];
2656b83eabeaSRichard Henderson         its->state_ptr = NULL;
2657b83eabeaSRichard Henderson         its->state = TS_DEAD;
2658b83eabeaSRichard Henderson     }
26595a18407fSRichard Henderson 
266015fa08f8SRichard Henderson     QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) {
26615a18407fSRichard Henderson         TCGOpcode opc = op->opc;
26625a18407fSRichard Henderson         const TCGOpDef *def = &tcg_op_defs[opc];
26635a18407fSRichard Henderson         TCGLifeData arg_life = op->life;
26645a18407fSRichard Henderson         int nb_iargs, nb_oargs, call_flags;
2665b83eabeaSRichard Henderson         TCGTemp *arg_ts, *dir_ts;
26665a18407fSRichard Henderson 
26675a18407fSRichard Henderson         if (opc == INDEX_op_call) {
2668cd9090aaSRichard Henderson             nb_oargs = TCGOP_CALLO(op);
2669cd9090aaSRichard Henderson             nb_iargs = TCGOP_CALLI(op);
2670efee3746SRichard Henderson             call_flags = op->args[nb_oargs + nb_iargs + 1];
26715a18407fSRichard Henderson         } else {
26725a18407fSRichard Henderson             nb_iargs = def->nb_iargs;
26735a18407fSRichard Henderson             nb_oargs = def->nb_oargs;
26745a18407fSRichard Henderson 
26755a18407fSRichard Henderson             /* Set flags similar to how calls require.  */
26765a18407fSRichard Henderson             if (def->flags & TCG_OPF_BB_END) {
26775a18407fSRichard Henderson                 /* Like writing globals: save_globals */
26785a18407fSRichard Henderson                 call_flags = 0;
26795a18407fSRichard Henderson             } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
26805a18407fSRichard Henderson                 /* Like reading globals: sync_globals */
26815a18407fSRichard Henderson                 call_flags = TCG_CALL_NO_WRITE_GLOBALS;
26825a18407fSRichard Henderson             } else {
26835a18407fSRichard Henderson                 /* No effect on globals.  */
26845a18407fSRichard Henderson                 call_flags = (TCG_CALL_NO_READ_GLOBALS |
26855a18407fSRichard Henderson                               TCG_CALL_NO_WRITE_GLOBALS);
26865a18407fSRichard Henderson             }
26875a18407fSRichard Henderson         }
26885a18407fSRichard Henderson 
26895a18407fSRichard Henderson         /* Make sure that input arguments are available.  */
26905a18407fSRichard Henderson         for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2691b83eabeaSRichard Henderson             arg_ts = arg_temp(op->args[i]);
2692b83eabeaSRichard Henderson             if (arg_ts) {
2693b83eabeaSRichard Henderson                 dir_ts = arg_ts->state_ptr;
2694b83eabeaSRichard Henderson                 if (dir_ts && arg_ts->state == TS_DEAD) {
2695b83eabeaSRichard Henderson                     TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32
26965a18407fSRichard Henderson                                       ? INDEX_op_ld_i32
26975a18407fSRichard Henderson                                       : INDEX_op_ld_i64);
2698ac1043f6SEmilio G. Cota                     TCGOp *lop = tcg_op_insert_before(s, op, lopc);
26995a18407fSRichard Henderson 
2700b83eabeaSRichard Henderson                     lop->args[0] = temp_arg(dir_ts);
2701b83eabeaSRichard Henderson                     lop->args[1] = temp_arg(arg_ts->mem_base);
2702b83eabeaSRichard Henderson                     lop->args[2] = arg_ts->mem_offset;
27035a18407fSRichard Henderson 
27045a18407fSRichard Henderson                     /* Loaded, but synced with memory.  */
2705b83eabeaSRichard Henderson                     arg_ts->state = TS_MEM;
27065a18407fSRichard Henderson                 }
27075a18407fSRichard Henderson             }
27085a18407fSRichard Henderson         }
27095a18407fSRichard Henderson 
27105a18407fSRichard Henderson         /* Perform input replacement, and mark inputs that became dead.
27115a18407fSRichard Henderson            No action is required except keeping temp_state up to date
27125a18407fSRichard Henderson            so that we reload when needed.  */
27135a18407fSRichard Henderson         for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2714b83eabeaSRichard Henderson             arg_ts = arg_temp(op->args[i]);
2715b83eabeaSRichard Henderson             if (arg_ts) {
2716b83eabeaSRichard Henderson                 dir_ts = arg_ts->state_ptr;
2717b83eabeaSRichard Henderson                 if (dir_ts) {
2718b83eabeaSRichard Henderson                     op->args[i] = temp_arg(dir_ts);
27195a18407fSRichard Henderson                     changes = true;
27205a18407fSRichard Henderson                     if (IS_DEAD_ARG(i)) {
2721b83eabeaSRichard Henderson                         arg_ts->state = TS_DEAD;
27225a18407fSRichard Henderson                     }
27235a18407fSRichard Henderson                 }
27245a18407fSRichard Henderson             }
27255a18407fSRichard Henderson         }
27265a18407fSRichard Henderson 
27275a18407fSRichard Henderson         /* Liveness analysis should ensure that the following are
27285a18407fSRichard Henderson            all correct, for call sites and basic block end points.  */
27295a18407fSRichard Henderson         if (call_flags & TCG_CALL_NO_READ_GLOBALS) {
27305a18407fSRichard Henderson             /* Nothing to do */
27315a18407fSRichard Henderson         } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) {
27325a18407fSRichard Henderson             for (i = 0; i < nb_globals; ++i) {
27335a18407fSRichard Henderson                 /* Liveness should see that globals are synced back,
27345a18407fSRichard Henderson                    that is, either TS_DEAD or TS_MEM.  */
2735b83eabeaSRichard Henderson                 arg_ts = &s->temps[i];
2736b83eabeaSRichard Henderson                 tcg_debug_assert(arg_ts->state_ptr == 0
2737b83eabeaSRichard Henderson                                  || arg_ts->state != 0);
27385a18407fSRichard Henderson             }
27395a18407fSRichard Henderson         } else {
27405a18407fSRichard Henderson             for (i = 0; i < nb_globals; ++i) {
27415a18407fSRichard Henderson                 /* Liveness should see that globals are saved back,
27425a18407fSRichard Henderson                    that is, TS_DEAD, waiting to be reloaded.  */
2743b83eabeaSRichard Henderson                 arg_ts = &s->temps[i];
2744b83eabeaSRichard Henderson                 tcg_debug_assert(arg_ts->state_ptr == 0
2745b83eabeaSRichard Henderson                                  || arg_ts->state == TS_DEAD);
27465a18407fSRichard Henderson             }
27475a18407fSRichard Henderson         }
27485a18407fSRichard Henderson 
27495a18407fSRichard Henderson         /* Outputs become available.  */
27505a18407fSRichard Henderson         for (i = 0; i < nb_oargs; i++) {
2751b83eabeaSRichard Henderson             arg_ts = arg_temp(op->args[i]);
2752b83eabeaSRichard Henderson             dir_ts = arg_ts->state_ptr;
2753b83eabeaSRichard Henderson             if (!dir_ts) {
27545a18407fSRichard Henderson                 continue;
27555a18407fSRichard Henderson             }
2756b83eabeaSRichard Henderson             op->args[i] = temp_arg(dir_ts);
27575a18407fSRichard Henderson             changes = true;
27585a18407fSRichard Henderson 
27595a18407fSRichard Henderson             /* The output is now live and modified.  */
2760b83eabeaSRichard Henderson             arg_ts->state = 0;
27615a18407fSRichard Henderson 
27625a18407fSRichard Henderson             /* Sync outputs upon their last write.  */
27635a18407fSRichard Henderson             if (NEED_SYNC_ARG(i)) {
2764b83eabeaSRichard Henderson                 TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32
27655a18407fSRichard Henderson                                   ? INDEX_op_st_i32
27665a18407fSRichard Henderson                                   : INDEX_op_st_i64);
2767ac1043f6SEmilio G. Cota                 TCGOp *sop = tcg_op_insert_after(s, op, sopc);
27685a18407fSRichard Henderson 
2769b83eabeaSRichard Henderson                 sop->args[0] = temp_arg(dir_ts);
2770b83eabeaSRichard Henderson                 sop->args[1] = temp_arg(arg_ts->mem_base);
2771b83eabeaSRichard Henderson                 sop->args[2] = arg_ts->mem_offset;
27725a18407fSRichard Henderson 
2773b83eabeaSRichard Henderson                 arg_ts->state = TS_MEM;
27745a18407fSRichard Henderson             }
27755a18407fSRichard Henderson             /* Drop outputs that are dead.  */
27765a18407fSRichard Henderson             if (IS_DEAD_ARG(i)) {
2777b83eabeaSRichard Henderson                 arg_ts->state = TS_DEAD;
27785a18407fSRichard Henderson             }
27795a18407fSRichard Henderson         }
27805a18407fSRichard Henderson     }
27815a18407fSRichard Henderson 
27825a18407fSRichard Henderson     return changes;
27835a18407fSRichard Henderson }
27845a18407fSRichard Henderson 
27858d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG
2786c896fe29Sbellard static void dump_regs(TCGContext *s)
2787c896fe29Sbellard {
2788c896fe29Sbellard     TCGTemp *ts;
2789c896fe29Sbellard     int i;
2790c896fe29Sbellard     char buf[64];
2791c896fe29Sbellard 
2792c896fe29Sbellard     for(i = 0; i < s->nb_temps; i++) {
2793c896fe29Sbellard         ts = &s->temps[i];
279443439139SRichard Henderson         printf("  %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts));
2795c896fe29Sbellard         switch(ts->val_type) {
2796c896fe29Sbellard         case TEMP_VAL_REG:
2797c896fe29Sbellard             printf("%s", tcg_target_reg_names[ts->reg]);
2798c896fe29Sbellard             break;
2799c896fe29Sbellard         case TEMP_VAL_MEM:
2800b3a62939SRichard Henderson             printf("%d(%s)", (int)ts->mem_offset,
2801b3a62939SRichard Henderson                    tcg_target_reg_names[ts->mem_base->reg]);
2802c896fe29Sbellard             break;
2803c896fe29Sbellard         case TEMP_VAL_CONST:
2804c896fe29Sbellard             printf("$0x%" TCG_PRIlx, ts->val);
2805c896fe29Sbellard             break;
2806c896fe29Sbellard         case TEMP_VAL_DEAD:
2807c896fe29Sbellard             printf("D");
2808c896fe29Sbellard             break;
2809c896fe29Sbellard         default:
2810c896fe29Sbellard             printf("???");
2811c896fe29Sbellard             break;
2812c896fe29Sbellard         }
2813c896fe29Sbellard         printf("\n");
2814c896fe29Sbellard     }
2815c896fe29Sbellard 
2816c896fe29Sbellard     for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
2817f8b2f202SRichard Henderson         if (s->reg_to_temp[i] != NULL) {
2818c896fe29Sbellard             printf("%s: %s\n",
2819c896fe29Sbellard                    tcg_target_reg_names[i],
2820f8b2f202SRichard Henderson                    tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i]));
2821c896fe29Sbellard         }
2822c896fe29Sbellard     }
2823c896fe29Sbellard }
2824c896fe29Sbellard 
2825c896fe29Sbellard static void check_regs(TCGContext *s)
2826c896fe29Sbellard {
2827869938aeSRichard Henderson     int reg;
2828b6638662SRichard Henderson     int k;
2829c896fe29Sbellard     TCGTemp *ts;
2830c896fe29Sbellard     char buf[64];
2831c896fe29Sbellard 
2832c896fe29Sbellard     for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
2833f8b2f202SRichard Henderson         ts = s->reg_to_temp[reg];
2834f8b2f202SRichard Henderson         if (ts != NULL) {
2835f8b2f202SRichard Henderson             if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) {
2836c896fe29Sbellard                 printf("Inconsistency for register %s:\n",
2837c896fe29Sbellard                        tcg_target_reg_names[reg]);
2838b03cce8eSbellard                 goto fail;
2839c896fe29Sbellard             }
2840c896fe29Sbellard         }
2841c896fe29Sbellard     }
2842c896fe29Sbellard     for (k = 0; k < s->nb_temps; k++) {
2843c896fe29Sbellard         ts = &s->temps[k];
2844f8b2f202SRichard Henderson         if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg
2845f8b2f202SRichard Henderson             && s->reg_to_temp[ts->reg] != ts) {
2846c896fe29Sbellard             printf("Inconsistency for temp %s:\n",
2847f8b2f202SRichard Henderson                    tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts));
2848b03cce8eSbellard         fail:
2849c896fe29Sbellard             printf("reg state:\n");
2850c896fe29Sbellard             dump_regs(s);
2851c896fe29Sbellard             tcg_abort();
2852c896fe29Sbellard         }
2853c896fe29Sbellard     }
2854c896fe29Sbellard }
2855c896fe29Sbellard #endif
2856c896fe29Sbellard 
28572272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts)
2858c896fe29Sbellard {
28599b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64)
28609b9c37c3SRichard Henderson     /* Sparc64 stack is accessed with offset of 2047 */
2861b591dc59SBlue Swirl     s->current_frame_offset = (s->current_frame_offset +
2862b591dc59SBlue Swirl                                (tcg_target_long)sizeof(tcg_target_long) - 1) &
2863b591dc59SBlue Swirl         ~(sizeof(tcg_target_long) - 1);
2864f44c9960SBlue Swirl #endif
2865b591dc59SBlue Swirl     if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) >
2866b591dc59SBlue Swirl         s->frame_end) {
28675ff9d6a4Sbellard         tcg_abort();
2868b591dc59SBlue Swirl     }
2869c896fe29Sbellard     ts->mem_offset = s->current_frame_offset;
2870b3a62939SRichard Henderson     ts->mem_base = s->frame_temp;
2871c896fe29Sbellard     ts->mem_allocated = 1;
2872e2c6d1b4SRichard Henderson     s->current_frame_offset += sizeof(tcg_target_long);
2873c896fe29Sbellard }
2874c896fe29Sbellard 
2875b722452aSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet, TCGRegSet);
2876b3915dbbSRichard Henderson 
287759d7c14eSRichard Henderson /* Mark a temporary as free or dead.  If 'free_or_dead' is negative,
287859d7c14eSRichard Henderson    mark it free; otherwise mark it dead.  */
287959d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead)
2880c896fe29Sbellard {
288159d7c14eSRichard Henderson     if (ts->fixed_reg) {
288259d7c14eSRichard Henderson         return;
288359d7c14eSRichard Henderson     }
288459d7c14eSRichard Henderson     if (ts->val_type == TEMP_VAL_REG) {
288559d7c14eSRichard Henderson         s->reg_to_temp[ts->reg] = NULL;
288659d7c14eSRichard Henderson     }
288759d7c14eSRichard Henderson     ts->val_type = (free_or_dead < 0
288859d7c14eSRichard Henderson                     || ts->temp_local
2889fa477d25SRichard Henderson                     || ts->temp_global
289059d7c14eSRichard Henderson                     ? TEMP_VAL_MEM : TEMP_VAL_DEAD);
289159d7c14eSRichard Henderson }
2892c896fe29Sbellard 
289359d7c14eSRichard Henderson /* Mark a temporary as dead.  */
289459d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts)
289559d7c14eSRichard Henderson {
289659d7c14eSRichard Henderson     temp_free_or_dead(s, ts, 1);
289759d7c14eSRichard Henderson }
289859d7c14eSRichard Henderson 
289959d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary
290059d7c14eSRichard Henderson    registers needs to be allocated to store a constant.  If 'free_or_dead'
290159d7c14eSRichard Henderson    is non-zero, subsequently release the temporary; if it is positive, the
290259d7c14eSRichard Henderson    temp is dead; if it is negative, the temp is free.  */
290398b4e186SRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs,
290498b4e186SRichard Henderson                       TCGRegSet preferred_regs, int free_or_dead)
290559d7c14eSRichard Henderson {
290659d7c14eSRichard Henderson     if (ts->fixed_reg) {
290759d7c14eSRichard Henderson         return;
290859d7c14eSRichard Henderson     }
290959d7c14eSRichard Henderson     if (!ts->mem_coherent) {
29107f6ceedfSAurelien Jarno         if (!ts->mem_allocated) {
29112272e4a7SRichard Henderson             temp_allocate_frame(s, ts);
291259d7c14eSRichard Henderson         }
291359d7c14eSRichard Henderson         switch (ts->val_type) {
291459d7c14eSRichard Henderson         case TEMP_VAL_CONST:
291559d7c14eSRichard Henderson             /* If we're going to free the temp immediately, then we won't
291659d7c14eSRichard Henderson                require it later in a register, so attempt to store the
291759d7c14eSRichard Henderson                constant to memory directly.  */
291859d7c14eSRichard Henderson             if (free_or_dead
291959d7c14eSRichard Henderson                 && tcg_out_sti(s, ts->type, ts->val,
292059d7c14eSRichard Henderson                                ts->mem_base->reg, ts->mem_offset)) {
292159d7c14eSRichard Henderson                 break;
292259d7c14eSRichard Henderson             }
292359d7c14eSRichard Henderson             temp_load(s, ts, tcg_target_available_regs[ts->type],
292498b4e186SRichard Henderson                       allocated_regs, preferred_regs);
292559d7c14eSRichard Henderson             /* fallthrough */
292659d7c14eSRichard Henderson 
292759d7c14eSRichard Henderson         case TEMP_VAL_REG:
292859d7c14eSRichard Henderson             tcg_out_st(s, ts->type, ts->reg,
292959d7c14eSRichard Henderson                        ts->mem_base->reg, ts->mem_offset);
293059d7c14eSRichard Henderson             break;
293159d7c14eSRichard Henderson 
293259d7c14eSRichard Henderson         case TEMP_VAL_MEM:
293359d7c14eSRichard Henderson             break;
293459d7c14eSRichard Henderson 
293559d7c14eSRichard Henderson         case TEMP_VAL_DEAD:
293659d7c14eSRichard Henderson         default:
293759d7c14eSRichard Henderson             tcg_abort();
2938c896fe29Sbellard         }
29397f6ceedfSAurelien Jarno         ts->mem_coherent = 1;
29407f6ceedfSAurelien Jarno     }
294159d7c14eSRichard Henderson     if (free_or_dead) {
294259d7c14eSRichard Henderson         temp_free_or_dead(s, ts, free_or_dead);
294359d7c14eSRichard Henderson     }
294459d7c14eSRichard Henderson }
29457f6ceedfSAurelien Jarno 
29467f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */
2947b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs)
29487f6ceedfSAurelien Jarno {
2949f8b2f202SRichard Henderson     TCGTemp *ts = s->reg_to_temp[reg];
2950f8b2f202SRichard Henderson     if (ts != NULL) {
295198b4e186SRichard Henderson         temp_sync(s, ts, allocated_regs, 0, -1);
2952c896fe29Sbellard     }
2953c896fe29Sbellard }
2954c896fe29Sbellard 
2955b016486eSRichard Henderson /**
2956b016486eSRichard Henderson  * tcg_reg_alloc:
2957b016486eSRichard Henderson  * @required_regs: Set of registers in which we must allocate.
2958b016486eSRichard Henderson  * @allocated_regs: Set of registers which must be avoided.
2959b016486eSRichard Henderson  * @preferred_regs: Set of registers we should prefer.
2960b016486eSRichard Henderson  * @rev: True if we search the registers in "indirect" order.
2961b016486eSRichard Henderson  *
2962b016486eSRichard Henderson  * The allocated register must be in @required_regs & ~@allocated_regs,
2963b016486eSRichard Henderson  * but if we can put it in @preferred_regs we may save a move later.
2964b016486eSRichard Henderson  */
2965b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs,
2966b016486eSRichard Henderson                             TCGRegSet allocated_regs,
2967b016486eSRichard Henderson                             TCGRegSet preferred_regs, bool rev)
2968c896fe29Sbellard {
2969b016486eSRichard Henderson     int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order);
2970b016486eSRichard Henderson     TCGRegSet reg_ct[2];
297191478cefSRichard Henderson     const int *order;
2972c896fe29Sbellard 
2973b016486eSRichard Henderson     reg_ct[1] = required_regs & ~allocated_regs;
2974b016486eSRichard Henderson     tcg_debug_assert(reg_ct[1] != 0);
2975b016486eSRichard Henderson     reg_ct[0] = reg_ct[1] & preferred_regs;
2976b016486eSRichard Henderson 
2977b016486eSRichard Henderson     /* Skip the preferred_regs option if it cannot be satisfied,
2978b016486eSRichard Henderson        or if the preference made no difference.  */
2979b016486eSRichard Henderson     f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1];
2980b016486eSRichard Henderson 
298191478cefSRichard Henderson     order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order;
2982c896fe29Sbellard 
2983b016486eSRichard Henderson     /* Try free registers, preferences first.  */
2984b016486eSRichard Henderson     for (j = f; j < 2; j++) {
2985b016486eSRichard Henderson         TCGRegSet set = reg_ct[j];
2986b016486eSRichard Henderson 
2987b016486eSRichard Henderson         if (tcg_regset_single(set)) {
2988b016486eSRichard Henderson             /* One register in the set.  */
2989b016486eSRichard Henderson             TCGReg reg = tcg_regset_first(set);
2990b016486eSRichard Henderson             if (s->reg_to_temp[reg] == NULL) {
2991c896fe29Sbellard                 return reg;
2992c896fe29Sbellard             }
2993b016486eSRichard Henderson         } else {
299491478cefSRichard Henderson             for (i = 0; i < n; i++) {
2995b016486eSRichard Henderson                 TCGReg reg = order[i];
2996b016486eSRichard Henderson                 if (s->reg_to_temp[reg] == NULL &&
2997b016486eSRichard Henderson                     tcg_regset_test_reg(set, reg)) {
2998b016486eSRichard Henderson                     return reg;
2999b016486eSRichard Henderson                 }
3000b016486eSRichard Henderson             }
3001b016486eSRichard Henderson         }
3002b016486eSRichard Henderson     }
3003b016486eSRichard Henderson 
3004b016486eSRichard Henderson     /* We must spill something.  */
3005b016486eSRichard Henderson     for (j = f; j < 2; j++) {
3006b016486eSRichard Henderson         TCGRegSet set = reg_ct[j];
3007b016486eSRichard Henderson 
3008b016486eSRichard Henderson         if (tcg_regset_single(set)) {
3009b016486eSRichard Henderson             /* One register in the set.  */
3010b016486eSRichard Henderson             TCGReg reg = tcg_regset_first(set);
3011b3915dbbSRichard Henderson             tcg_reg_free(s, reg, allocated_regs);
3012c896fe29Sbellard             return reg;
3013b016486eSRichard Henderson         } else {
3014b016486eSRichard Henderson             for (i = 0; i < n; i++) {
3015b016486eSRichard Henderson                 TCGReg reg = order[i];
3016b016486eSRichard Henderson                 if (tcg_regset_test_reg(set, reg)) {
3017b016486eSRichard Henderson                     tcg_reg_free(s, reg, allocated_regs);
3018b016486eSRichard Henderson                     return reg;
3019b016486eSRichard Henderson                 }
3020b016486eSRichard Henderson             }
3021c896fe29Sbellard         }
3022c896fe29Sbellard     }
3023c896fe29Sbellard 
3024c896fe29Sbellard     tcg_abort();
3025c896fe29Sbellard }
3026c896fe29Sbellard 
302740ae5c62SRichard Henderson /* Make sure the temporary is in a register.  If needed, allocate the register
302840ae5c62SRichard Henderson    from DESIRED while avoiding ALLOCATED.  */
302940ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs,
3030b722452aSRichard Henderson                       TCGRegSet allocated_regs, TCGRegSet preferred_regs)
303140ae5c62SRichard Henderson {
303240ae5c62SRichard Henderson     TCGReg reg;
303340ae5c62SRichard Henderson 
303440ae5c62SRichard Henderson     switch (ts->val_type) {
303540ae5c62SRichard Henderson     case TEMP_VAL_REG:
303640ae5c62SRichard Henderson         return;
303740ae5c62SRichard Henderson     case TEMP_VAL_CONST:
3038b016486eSRichard Henderson         reg = tcg_reg_alloc(s, desired_regs, allocated_regs,
3039b722452aSRichard Henderson                             preferred_regs, ts->indirect_base);
304040ae5c62SRichard Henderson         tcg_out_movi(s, ts->type, reg, ts->val);
304140ae5c62SRichard Henderson         ts->mem_coherent = 0;
304240ae5c62SRichard Henderson         break;
304340ae5c62SRichard Henderson     case TEMP_VAL_MEM:
3044b016486eSRichard Henderson         reg = tcg_reg_alloc(s, desired_regs, allocated_regs,
3045b722452aSRichard Henderson                             preferred_regs, ts->indirect_base);
304640ae5c62SRichard Henderson         tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset);
304740ae5c62SRichard Henderson         ts->mem_coherent = 1;
304840ae5c62SRichard Henderson         break;
304940ae5c62SRichard Henderson     case TEMP_VAL_DEAD:
305040ae5c62SRichard Henderson     default:
305140ae5c62SRichard Henderson         tcg_abort();
305240ae5c62SRichard Henderson     }
305340ae5c62SRichard Henderson     ts->reg = reg;
305440ae5c62SRichard Henderson     ts->val_type = TEMP_VAL_REG;
305540ae5c62SRichard Henderson     s->reg_to_temp[reg] = ts;
305640ae5c62SRichard Henderson }
305740ae5c62SRichard Henderson 
305859d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a
3059e8996ee0Sbellard    temporary registers needs to be allocated to store a constant.  */
306059d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs)
30611ad80729SAurelien Jarno {
30622c0366f0SAurelien Jarno     /* The liveness analysis already ensures that globals are back
3063eabb7b91SAurelien Jarno        in memory. Keep an tcg_debug_assert for safety. */
3064f8bf00f1SRichard Henderson     tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg);
30651ad80729SAurelien Jarno }
30661ad80729SAurelien Jarno 
30679814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be
3068641d5fbeSbellard    modified be the following code. 'allocated_regs' is used in case a
3069641d5fbeSbellard    temporary registers needs to be allocated to store a constant. */
3070641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs)
3071641d5fbeSbellard {
3072ac3b8891SRichard Henderson     int i, n;
3073641d5fbeSbellard 
3074ac3b8891SRichard Henderson     for (i = 0, n = s->nb_globals; i < n; i++) {
3075b13eb728SRichard Henderson         temp_save(s, &s->temps[i], allocated_regs);
3076641d5fbeSbellard     }
3077e5097dc8Sbellard }
3078e5097dc8Sbellard 
30793d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be
30803d5c5f87SAurelien Jarno    read by the following code. 'allocated_regs' is used in case a
30813d5c5f87SAurelien Jarno    temporary registers needs to be allocated to store a constant. */
30823d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs)
30833d5c5f87SAurelien Jarno {
3084ac3b8891SRichard Henderson     int i, n;
30853d5c5f87SAurelien Jarno 
3086ac3b8891SRichard Henderson     for (i = 0, n = s->nb_globals; i < n; i++) {
308712b9b11aSRichard Henderson         TCGTemp *ts = &s->temps[i];
308812b9b11aSRichard Henderson         tcg_debug_assert(ts->val_type != TEMP_VAL_REG
308912b9b11aSRichard Henderson                          || ts->fixed_reg
309012b9b11aSRichard Henderson                          || ts->mem_coherent);
30913d5c5f87SAurelien Jarno     }
30923d5c5f87SAurelien Jarno }
30933d5c5f87SAurelien Jarno 
3094e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and
3095e8996ee0Sbellard    all globals are stored at their canonical location. */
3096e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs)
3097e5097dc8Sbellard {
3098e5097dc8Sbellard     int i;
3099e5097dc8Sbellard 
3100c896fe29Sbellard     for (i = s->nb_globals; i < s->nb_temps; i++) {
3101b13eb728SRichard Henderson         TCGTemp *ts = &s->temps[i];
3102641d5fbeSbellard         if (ts->temp_local) {
3103b13eb728SRichard Henderson             temp_save(s, ts, allocated_regs);
3104641d5fbeSbellard         } else {
31052c0366f0SAurelien Jarno             /* The liveness analysis already ensures that temps are dead.
3106eabb7b91SAurelien Jarno                Keep an tcg_debug_assert for safety. */
3107eabb7b91SAurelien Jarno             tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD);
3108c896fe29Sbellard         }
3109641d5fbeSbellard     }
3110e8996ee0Sbellard 
3111e8996ee0Sbellard     save_globals(s, allocated_regs);
3112c896fe29Sbellard }
3113c896fe29Sbellard 
31140fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots,
3115ba87719cSRichard Henderson                                   tcg_target_ulong val, TCGLifeData arg_life,
3116ba87719cSRichard Henderson                                   TCGRegSet preferred_regs)
3117e8996ee0Sbellard {
3118e8996ee0Sbellard     if (ots->fixed_reg) {
311959d7c14eSRichard Henderson         /* For fixed registers, we do not do any constant propagation.  */
3120e8996ee0Sbellard         tcg_out_movi(s, ots->type, ots->reg, val);
312159d7c14eSRichard Henderson         return;
312259d7c14eSRichard Henderson     }
312359d7c14eSRichard Henderson 
312459d7c14eSRichard Henderson     /* The movi is not explicitly generated here.  */
3125f8b2f202SRichard Henderson     if (ots->val_type == TEMP_VAL_REG) {
3126f8b2f202SRichard Henderson         s->reg_to_temp[ots->reg] = NULL;
3127f8b2f202SRichard Henderson     }
3128e8996ee0Sbellard     ots->val_type = TEMP_VAL_CONST;
3129e8996ee0Sbellard     ots->val = val;
313059d7c14eSRichard Henderson     ots->mem_coherent = 0;
3131ec7a869dSAurelien Jarno     if (NEED_SYNC_ARG(0)) {
3132ba87719cSRichard Henderson         temp_sync(s, ots, s->reserved_regs, preferred_regs, IS_DEAD_ARG(0));
313359d7c14eSRichard Henderson     } else if (IS_DEAD_ARG(0)) {
3134f8bf00f1SRichard Henderson         temp_dead(s, ots);
31354c4e1ab2SAurelien Jarno     }
3136e8996ee0Sbellard }
3137e8996ee0Sbellard 
3138dd186292SRichard Henderson static void tcg_reg_alloc_movi(TCGContext *s, const TCGOp *op)
31390fe4fca4SPaolo Bonzini {
314043439139SRichard Henderson     TCGTemp *ots = arg_temp(op->args[0]);
3141dd186292SRichard Henderson     tcg_target_ulong val = op->args[1];
31420fe4fca4SPaolo Bonzini 
314369e3706dSRichard Henderson     tcg_reg_alloc_do_movi(s, ots, val, op->life, op->output_pref[0]);
31440fe4fca4SPaolo Bonzini }
31450fe4fca4SPaolo Bonzini 
3146dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op)
3147c896fe29Sbellard {
3148dd186292SRichard Henderson     const TCGLifeData arg_life = op->life;
314969e3706dSRichard Henderson     TCGRegSet allocated_regs, preferred_regs;
3150c896fe29Sbellard     TCGTemp *ts, *ots;
3151450445d5SRichard Henderson     TCGType otype, itype;
3152c896fe29Sbellard 
3153d21369f5SRichard Henderson     allocated_regs = s->reserved_regs;
315469e3706dSRichard Henderson     preferred_regs = op->output_pref[0];
315543439139SRichard Henderson     ots = arg_temp(op->args[0]);
315643439139SRichard Henderson     ts = arg_temp(op->args[1]);
3157450445d5SRichard Henderson 
3158450445d5SRichard Henderson     /* Note that otype != itype for no-op truncation.  */
3159450445d5SRichard Henderson     otype = ots->type;
3160450445d5SRichard Henderson     itype = ts->type;
3161c896fe29Sbellard 
31620fe4fca4SPaolo Bonzini     if (ts->val_type == TEMP_VAL_CONST) {
31630fe4fca4SPaolo Bonzini         /* propagate constant or generate sti */
31640fe4fca4SPaolo Bonzini         tcg_target_ulong val = ts->val;
31650fe4fca4SPaolo Bonzini         if (IS_DEAD_ARG(1)) {
31660fe4fca4SPaolo Bonzini             temp_dead(s, ts);
31670fe4fca4SPaolo Bonzini         }
316869e3706dSRichard Henderson         tcg_reg_alloc_do_movi(s, ots, val, arg_life, preferred_regs);
31690fe4fca4SPaolo Bonzini         return;
31700fe4fca4SPaolo Bonzini     }
31710fe4fca4SPaolo Bonzini 
31720fe4fca4SPaolo Bonzini     /* If the source value is in memory we're going to be forced
31730fe4fca4SPaolo Bonzini        to have it in a register in order to perform the copy.  Copy
31740fe4fca4SPaolo Bonzini        the SOURCE value into its own register first, that way we
31750fe4fca4SPaolo Bonzini        don't have to reload SOURCE the next time it is used. */
31760fe4fca4SPaolo Bonzini     if (ts->val_type == TEMP_VAL_MEM) {
317769e3706dSRichard Henderson         temp_load(s, ts, tcg_target_available_regs[itype],
317869e3706dSRichard Henderson                   allocated_regs, preferred_regs);
3179c29c1d7eSAurelien Jarno     }
3180c29c1d7eSAurelien Jarno 
31810fe4fca4SPaolo Bonzini     tcg_debug_assert(ts->val_type == TEMP_VAL_REG);
3182c29c1d7eSAurelien Jarno     if (IS_DEAD_ARG(0) && !ots->fixed_reg) {
3183c29c1d7eSAurelien Jarno         /* mov to a non-saved dead register makes no sense (even with
3184c29c1d7eSAurelien Jarno            liveness analysis disabled). */
3185eabb7b91SAurelien Jarno         tcg_debug_assert(NEED_SYNC_ARG(0));
3186c29c1d7eSAurelien Jarno         if (!ots->mem_allocated) {
31872272e4a7SRichard Henderson             temp_allocate_frame(s, ots);
3188c29c1d7eSAurelien Jarno         }
3189b3a62939SRichard Henderson         tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset);
3190c29c1d7eSAurelien Jarno         if (IS_DEAD_ARG(1)) {
3191f8bf00f1SRichard Henderson             temp_dead(s, ts);
3192c29c1d7eSAurelien Jarno         }
3193f8bf00f1SRichard Henderson         temp_dead(s, ots);
3194e8996ee0Sbellard     } else {
3195c29c1d7eSAurelien Jarno         if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) {
3196c29c1d7eSAurelien Jarno             /* the mov can be suppressed */
3197c29c1d7eSAurelien Jarno             if (ots->val_type == TEMP_VAL_REG) {
3198f8b2f202SRichard Henderson                 s->reg_to_temp[ots->reg] = NULL;
3199c896fe29Sbellard             }
3200c29c1d7eSAurelien Jarno             ots->reg = ts->reg;
3201f8bf00f1SRichard Henderson             temp_dead(s, ts);
3202c29c1d7eSAurelien Jarno         } else {
3203c29c1d7eSAurelien Jarno             if (ots->val_type != TEMP_VAL_REG) {
3204c29c1d7eSAurelien Jarno                 /* When allocating a new register, make sure to not spill the
3205c29c1d7eSAurelien Jarno                    input one. */
3206c29c1d7eSAurelien Jarno                 tcg_regset_set_reg(allocated_regs, ts->reg);
3207450445d5SRichard Henderson                 ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype],
320869e3706dSRichard Henderson                                          allocated_regs, preferred_regs,
3209b016486eSRichard Henderson                                          ots->indirect_base);
3210c29c1d7eSAurelien Jarno             }
3211450445d5SRichard Henderson             tcg_out_mov(s, otype, ots->reg, ts->reg);
3212c29c1d7eSAurelien Jarno         }
3213c896fe29Sbellard         ots->val_type = TEMP_VAL_REG;
3214c896fe29Sbellard         ots->mem_coherent = 0;
3215f8b2f202SRichard Henderson         s->reg_to_temp[ots->reg] = ots;
3216ec7a869dSAurelien Jarno         if (NEED_SYNC_ARG(0)) {
321798b4e186SRichard Henderson             temp_sync(s, ots, allocated_regs, 0, 0);
3218c29c1d7eSAurelien Jarno         }
3219ec7a869dSAurelien Jarno     }
3220c896fe29Sbellard }
3221c896fe29Sbellard 
3222dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op)
3223c896fe29Sbellard {
3224dd186292SRichard Henderson     const TCGLifeData arg_life = op->life;
3225dd186292SRichard Henderson     const TCGOpDef * const def = &tcg_op_defs[op->opc];
322682790a87SRichard Henderson     TCGRegSet i_allocated_regs;
322782790a87SRichard Henderson     TCGRegSet o_allocated_regs;
3228b6638662SRichard Henderson     int i, k, nb_iargs, nb_oargs;
3229b6638662SRichard Henderson     TCGReg reg;
3230c896fe29Sbellard     TCGArg arg;
3231c896fe29Sbellard     const TCGArgConstraint *arg_ct;
3232c896fe29Sbellard     TCGTemp *ts;
3233c896fe29Sbellard     TCGArg new_args[TCG_MAX_OP_ARGS];
3234c896fe29Sbellard     int const_args[TCG_MAX_OP_ARGS];
3235c896fe29Sbellard 
3236c896fe29Sbellard     nb_oargs = def->nb_oargs;
3237c896fe29Sbellard     nb_iargs = def->nb_iargs;
3238c896fe29Sbellard 
3239c896fe29Sbellard     /* copy constants */
3240c896fe29Sbellard     memcpy(new_args + nb_oargs + nb_iargs,
3241dd186292SRichard Henderson            op->args + nb_oargs + nb_iargs,
3242c896fe29Sbellard            sizeof(TCGArg) * def->nb_cargs);
3243c896fe29Sbellard 
3244d21369f5SRichard Henderson     i_allocated_regs = s->reserved_regs;
3245d21369f5SRichard Henderson     o_allocated_regs = s->reserved_regs;
324682790a87SRichard Henderson 
3247c896fe29Sbellard     /* satisfy input constraints */
3248c896fe29Sbellard     for (k = 0; k < nb_iargs; k++) {
3249d62816f2SRichard Henderson         TCGRegSet i_preferred_regs, o_preferred_regs;
3250d62816f2SRichard Henderson 
3251c896fe29Sbellard         i = def->sorted_args[nb_oargs + k];
3252dd186292SRichard Henderson         arg = op->args[i];
3253c896fe29Sbellard         arg_ct = &def->args_ct[i];
325443439139SRichard Henderson         ts = arg_temp(arg);
325540ae5c62SRichard Henderson 
325640ae5c62SRichard Henderson         if (ts->val_type == TEMP_VAL_CONST
325740ae5c62SRichard Henderson             && tcg_target_const_match(ts->val, ts->type, arg_ct)) {
3258c896fe29Sbellard             /* constant is OK for instruction */
3259c896fe29Sbellard             const_args[i] = 1;
3260c896fe29Sbellard             new_args[i] = ts->val;
3261d62816f2SRichard Henderson             continue;
3262c896fe29Sbellard         }
326340ae5c62SRichard Henderson 
3264d62816f2SRichard Henderson         i_preferred_regs = o_preferred_regs = 0;
32655ff9d6a4Sbellard         if (arg_ct->ct & TCG_CT_IALIAS) {
3266d62816f2SRichard Henderson             o_preferred_regs = op->output_pref[arg_ct->alias_index];
32675ff9d6a4Sbellard             if (ts->fixed_reg) {
32685ff9d6a4Sbellard                 /* if fixed register, we must allocate a new register
32695ff9d6a4Sbellard                    if the alias is not the same register */
3270d62816f2SRichard Henderson                 if (arg != op->args[arg_ct->alias_index]) {
32715ff9d6a4Sbellard                     goto allocate_in_reg;
3272d62816f2SRichard Henderson                 }
32735ff9d6a4Sbellard             } else {
3274c896fe29Sbellard                 /* if the input is aliased to an output and if it is
3275c896fe29Sbellard                    not dead after the instruction, we must allocate
3276c896fe29Sbellard                    a new register and move it */
3277866cb6cbSAurelien Jarno                 if (!IS_DEAD_ARG(i)) {
3278c896fe29Sbellard                     goto allocate_in_reg;
3279c896fe29Sbellard                 }
3280d62816f2SRichard Henderson 
32817e1df267SAurelien Jarno                 /* check if the current register has already been allocated
32827e1df267SAurelien Jarno                    for another input aliased to an output */
3283d62816f2SRichard Henderson                 if (ts->val_type == TEMP_VAL_REG) {
32847e1df267SAurelien Jarno                     int k2, i2;
3285d62816f2SRichard Henderson                     reg = ts->reg;
32867e1df267SAurelien Jarno                     for (k2 = 0 ; k2 < k ; k2++) {
32877e1df267SAurelien Jarno                         i2 = def->sorted_args[nb_oargs + k2];
32887e1df267SAurelien Jarno                         if ((def->args_ct[i2].ct & TCG_CT_IALIAS) &&
3289d62816f2SRichard Henderson                             reg == new_args[i2]) {
32907e1df267SAurelien Jarno                             goto allocate_in_reg;
32917e1df267SAurelien Jarno                         }
32927e1df267SAurelien Jarno                     }
32935ff9d6a4Sbellard                 }
3294d62816f2SRichard Henderson                 i_preferred_regs = o_preferred_regs;
3295866cb6cbSAurelien Jarno             }
3296d62816f2SRichard Henderson         }
3297d62816f2SRichard Henderson 
3298d62816f2SRichard Henderson         temp_load(s, ts, arg_ct->u.regs, i_allocated_regs, i_preferred_regs);
3299c896fe29Sbellard         reg = ts->reg;
3300d62816f2SRichard Henderson 
3301c896fe29Sbellard         if (tcg_regset_test_reg(arg_ct->u.regs, reg)) {
3302c896fe29Sbellard             /* nothing to do : the constraint is satisfied */
3303c896fe29Sbellard         } else {
3304c896fe29Sbellard         allocate_in_reg:
3305c896fe29Sbellard             /* allocate a new register matching the constraint
3306c896fe29Sbellard                and move the temporary register into it */
3307d62816f2SRichard Henderson             temp_load(s, ts, tcg_target_available_regs[ts->type],
3308d62816f2SRichard Henderson                       i_allocated_regs, 0);
330982790a87SRichard Henderson             reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs,
3310d62816f2SRichard Henderson                                 o_preferred_regs, ts->indirect_base);
33113b6dac34SRichard Henderson             tcg_out_mov(s, ts->type, reg, ts->reg);
3312c896fe29Sbellard         }
3313c896fe29Sbellard         new_args[i] = reg;
3314c896fe29Sbellard         const_args[i] = 0;
331582790a87SRichard Henderson         tcg_regset_set_reg(i_allocated_regs, reg);
3316c896fe29Sbellard     }
3317c896fe29Sbellard 
3318c896fe29Sbellard     /* mark dead temporaries and free the associated registers */
3319866cb6cbSAurelien Jarno     for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
3320866cb6cbSAurelien Jarno         if (IS_DEAD_ARG(i)) {
332143439139SRichard Henderson             temp_dead(s, arg_temp(op->args[i]));
3322c896fe29Sbellard         }
3323c896fe29Sbellard     }
3324c896fe29Sbellard 
3325a52ad07eSAurelien Jarno     if (def->flags & TCG_OPF_BB_END) {
332682790a87SRichard Henderson         tcg_reg_alloc_bb_end(s, i_allocated_regs);
3327a52ad07eSAurelien Jarno     } else {
3328c896fe29Sbellard         if (def->flags & TCG_OPF_CALL_CLOBBER) {
3329b03cce8eSbellard             /* XXX: permit generic clobber register list ? */
3330c8074023SRichard Henderson             for (i = 0; i < TCG_TARGET_NB_REGS; i++) {
3331c8074023SRichard Henderson                 if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) {
333282790a87SRichard Henderson                     tcg_reg_free(s, i, i_allocated_regs);
3333c896fe29Sbellard                 }
3334c896fe29Sbellard             }
33353d5c5f87SAurelien Jarno         }
33363d5c5f87SAurelien Jarno         if (def->flags & TCG_OPF_SIDE_EFFECTS) {
33373d5c5f87SAurelien Jarno             /* sync globals if the op has side effects and might trigger
33383d5c5f87SAurelien Jarno                an exception. */
333982790a87SRichard Henderson             sync_globals(s, i_allocated_regs);
3340c896fe29Sbellard         }
3341c896fe29Sbellard 
3342c896fe29Sbellard         /* satisfy the output constraints */
3343c896fe29Sbellard         for(k = 0; k < nb_oargs; k++) {
3344c896fe29Sbellard             i = def->sorted_args[k];
3345dd186292SRichard Henderson             arg = op->args[i];
3346c896fe29Sbellard             arg_ct = &def->args_ct[i];
334743439139SRichard Henderson             ts = arg_temp(arg);
334817280ff4SRichard Henderson             if ((arg_ct->ct & TCG_CT_ALIAS)
334917280ff4SRichard Henderson                 && !const_args[arg_ct->alias_index]) {
33505ff9d6a4Sbellard                 reg = new_args[arg_ct->alias_index];
335182790a87SRichard Henderson             } else if (arg_ct->ct & TCG_CT_NEWREG) {
335282790a87SRichard Henderson                 reg = tcg_reg_alloc(s, arg_ct->u.regs,
335382790a87SRichard Henderson                                     i_allocated_regs | o_allocated_regs,
335469e3706dSRichard Henderson                                     op->output_pref[k], ts->indirect_base);
3355c896fe29Sbellard             } else {
3356c896fe29Sbellard                 /* if fixed register, we try to use it */
3357c896fe29Sbellard                 reg = ts->reg;
3358c896fe29Sbellard                 if (ts->fixed_reg &&
3359c896fe29Sbellard                     tcg_regset_test_reg(arg_ct->u.regs, reg)) {
3360c896fe29Sbellard                     goto oarg_end;
3361c896fe29Sbellard                 }
336282790a87SRichard Henderson                 reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs,
336369e3706dSRichard Henderson                                     op->output_pref[k], ts->indirect_base);
3364c896fe29Sbellard             }
336582790a87SRichard Henderson             tcg_regset_set_reg(o_allocated_regs, reg);
3366c896fe29Sbellard             /* if a fixed register is used, then a move will be done afterwards */
3367c896fe29Sbellard             if (!ts->fixed_reg) {
3368639368ddSAurelien Jarno                 if (ts->val_type == TEMP_VAL_REG) {
3369f8b2f202SRichard Henderson                     s->reg_to_temp[ts->reg] = NULL;
3370639368ddSAurelien Jarno                 }
3371c896fe29Sbellard                 ts->val_type = TEMP_VAL_REG;
3372c896fe29Sbellard                 ts->reg = reg;
3373c896fe29Sbellard                 /* temp value is modified, so the value kept in memory is
3374c896fe29Sbellard                    potentially not the same */
3375c896fe29Sbellard                 ts->mem_coherent = 0;
3376f8b2f202SRichard Henderson                 s->reg_to_temp[reg] = ts;
3377c896fe29Sbellard             }
3378c896fe29Sbellard         oarg_end:
3379c896fe29Sbellard             new_args[i] = reg;
3380c896fe29Sbellard         }
3381e8996ee0Sbellard     }
3382c896fe29Sbellard 
3383c896fe29Sbellard     /* emit instruction */
3384d2fd745fSRichard Henderson     if (def->flags & TCG_OPF_VECTOR) {
3385d2fd745fSRichard Henderson         tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op),
3386d2fd745fSRichard Henderson                        new_args, const_args);
3387d2fd745fSRichard Henderson     } else {
3388dd186292SRichard Henderson         tcg_out_op(s, op->opc, new_args, const_args);
3389d2fd745fSRichard Henderson     }
3390c896fe29Sbellard 
3391c896fe29Sbellard     /* move the outputs in the correct register if needed */
3392c896fe29Sbellard     for(i = 0; i < nb_oargs; i++) {
339343439139SRichard Henderson         ts = arg_temp(op->args[i]);
3394c896fe29Sbellard         reg = new_args[i];
3395c896fe29Sbellard         if (ts->fixed_reg && ts->reg != reg) {
33963b6dac34SRichard Henderson             tcg_out_mov(s, ts->type, ts->reg, reg);
3397c896fe29Sbellard         }
3398ec7a869dSAurelien Jarno         if (NEED_SYNC_ARG(i)) {
339998b4e186SRichard Henderson             temp_sync(s, ts, o_allocated_regs, 0, IS_DEAD_ARG(i));
340059d7c14eSRichard Henderson         } else if (IS_DEAD_ARG(i)) {
3401f8bf00f1SRichard Henderson             temp_dead(s, ts);
3402ec7a869dSAurelien Jarno         }
3403c896fe29Sbellard     }
3404c896fe29Sbellard }
3405c896fe29Sbellard 
/*
 * STACK_DIR(x): sign-adjust a stack displacement.  The value is negated
 * when TCG_TARGET_STACK_GROWSUP is defined and passed through unchanged
 * otherwise.  The argument is evaluated exactly once.
 */
#ifdef TCG_TARGET_STACK_GROWSUP
#define STACK_DIR(x) (-(x))
#else
#define STACK_DIR(x) (x)
#endif
3411b03cce8eSbellard 
3412dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op)
3413c896fe29Sbellard {
3414cd9090aaSRichard Henderson     const int nb_oargs = TCGOP_CALLO(op);
3415cd9090aaSRichard Henderson     const int nb_iargs = TCGOP_CALLI(op);
3416dd186292SRichard Henderson     const TCGLifeData arg_life = op->life;
3417b6638662SRichard Henderson     int flags, nb_regs, i;
3418b6638662SRichard Henderson     TCGReg reg;
3419cf066674SRichard Henderson     TCGArg arg;
3420c896fe29Sbellard     TCGTemp *ts;
3421d3452f1fSRichard Henderson     intptr_t stack_offset;
3422d3452f1fSRichard Henderson     size_t call_stack_size;
3423cf066674SRichard Henderson     tcg_insn_unit *func_addr;
3424cf066674SRichard Henderson     int allocate_args;
3425c896fe29Sbellard     TCGRegSet allocated_regs;
3426c896fe29Sbellard 
3427dd186292SRichard Henderson     func_addr = (tcg_insn_unit *)(intptr_t)op->args[nb_oargs + nb_iargs];
3428dd186292SRichard Henderson     flags = op->args[nb_oargs + nb_iargs + 1];
3429c896fe29Sbellard 
34306e17d0c5SStefan Weil     nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs);
3431c45cb8bbSRichard Henderson     if (nb_regs > nb_iargs) {
3432c45cb8bbSRichard Henderson         nb_regs = nb_iargs;
3433cf066674SRichard Henderson     }
3434c896fe29Sbellard 
3435c896fe29Sbellard     /* assign stack slots first */
3436c45cb8bbSRichard Henderson     call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long);
3437c896fe29Sbellard     call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) &
3438c896fe29Sbellard         ~(TCG_TARGET_STACK_ALIGN - 1);
3439b03cce8eSbellard     allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE);
3440b03cce8eSbellard     if (allocate_args) {
3441345649c0SBlue Swirl         /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed,
3442345649c0SBlue Swirl            preallocate call stack */
3443345649c0SBlue Swirl         tcg_abort();
3444b03cce8eSbellard     }
344539cf05d3Sbellard 
344639cf05d3Sbellard     stack_offset = TCG_TARGET_CALL_STACK_OFFSET;
3447c45cb8bbSRichard Henderson     for (i = nb_regs; i < nb_iargs; i++) {
3448dd186292SRichard Henderson         arg = op->args[nb_oargs + i];
344939cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP
345039cf05d3Sbellard         stack_offset -= sizeof(tcg_target_long);
345139cf05d3Sbellard #endif
345239cf05d3Sbellard         if (arg != TCG_CALL_DUMMY_ARG) {
345343439139SRichard Henderson             ts = arg_temp(arg);
345440ae5c62SRichard Henderson             temp_load(s, ts, tcg_target_available_regs[ts->type],
3455b722452aSRichard Henderson                       s->reserved_regs, 0);
3456e4d5434cSblueswir1             tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset);
345739cf05d3Sbellard         }
345839cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP
345939cf05d3Sbellard         stack_offset += sizeof(tcg_target_long);
346039cf05d3Sbellard #endif
3461c896fe29Sbellard     }
3462c896fe29Sbellard 
3463c896fe29Sbellard     /* assign input registers */
3464d21369f5SRichard Henderson     allocated_regs = s->reserved_regs;
3465c896fe29Sbellard     for (i = 0; i < nb_regs; i++) {
3466dd186292SRichard Henderson         arg = op->args[nb_oargs + i];
346739cf05d3Sbellard         if (arg != TCG_CALL_DUMMY_ARG) {
346843439139SRichard Henderson             ts = arg_temp(arg);
3469c896fe29Sbellard             reg = tcg_target_call_iarg_regs[i];
3470b3915dbbSRichard Henderson             tcg_reg_free(s, reg, allocated_regs);
347140ae5c62SRichard Henderson 
3472c896fe29Sbellard             if (ts->val_type == TEMP_VAL_REG) {
3473c896fe29Sbellard                 if (ts->reg != reg) {
34743b6dac34SRichard Henderson                     tcg_out_mov(s, ts->type, reg, ts->reg);
3475c896fe29Sbellard                 }
3476c896fe29Sbellard             } else {
3477ccb1bb66SRichard Henderson                 TCGRegSet arg_set = 0;
347840ae5c62SRichard Henderson 
347940ae5c62SRichard Henderson                 tcg_regset_set_reg(arg_set, reg);
3480b722452aSRichard Henderson                 temp_load(s, ts, arg_set, allocated_regs, 0);
3481c896fe29Sbellard             }
348240ae5c62SRichard Henderson 
3483c896fe29Sbellard             tcg_regset_set_reg(allocated_regs, reg);
3484c896fe29Sbellard         }
348539cf05d3Sbellard     }
3486c896fe29Sbellard 
3487c896fe29Sbellard     /* mark dead temporaries and free the associated registers */
3488866cb6cbSAurelien Jarno     for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
3489866cb6cbSAurelien Jarno         if (IS_DEAD_ARG(i)) {
349043439139SRichard Henderson             temp_dead(s, arg_temp(op->args[i]));
3491c896fe29Sbellard         }
3492c896fe29Sbellard     }
3493c896fe29Sbellard 
3494c896fe29Sbellard     /* clobber call registers */
3495c8074023SRichard Henderson     for (i = 0; i < TCG_TARGET_NB_REGS; i++) {
3496c8074023SRichard Henderson         if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) {
3497b3915dbbSRichard Henderson             tcg_reg_free(s, i, allocated_regs);
3498c896fe29Sbellard         }
3499c896fe29Sbellard     }
3500c896fe29Sbellard 
350178505279SAurelien Jarno     /* Save globals if they might be written by the helper, sync them if
350278505279SAurelien Jarno        they might be read. */
350378505279SAurelien Jarno     if (flags & TCG_CALL_NO_READ_GLOBALS) {
350478505279SAurelien Jarno         /* Nothing to do */
350578505279SAurelien Jarno     } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) {
350678505279SAurelien Jarno         sync_globals(s, allocated_regs);
350778505279SAurelien Jarno     } else {
3508e8996ee0Sbellard         save_globals(s, allocated_regs);
3509b9c18f56Saurel32     }
3510c896fe29Sbellard 
3511cf066674SRichard Henderson     tcg_out_call(s, func_addr);
3512c896fe29Sbellard 
3513c896fe29Sbellard     /* assign output registers and emit moves if needed */
3514c896fe29Sbellard     for(i = 0; i < nb_oargs; i++) {
3515dd186292SRichard Henderson         arg = op->args[i];
351643439139SRichard Henderson         ts = arg_temp(arg);
3517c896fe29Sbellard         reg = tcg_target_call_oarg_regs[i];
3518eabb7b91SAurelien Jarno         tcg_debug_assert(s->reg_to_temp[reg] == NULL);
351934b1a49cSRichard Henderson 
3520c896fe29Sbellard         if (ts->fixed_reg) {
3521c896fe29Sbellard             if (ts->reg != reg) {
35223b6dac34SRichard Henderson                 tcg_out_mov(s, ts->type, ts->reg, reg);
3523c896fe29Sbellard             }
3524c896fe29Sbellard         } else {
3525639368ddSAurelien Jarno             if (ts->val_type == TEMP_VAL_REG) {
3526f8b2f202SRichard Henderson                 s->reg_to_temp[ts->reg] = NULL;
3527639368ddSAurelien Jarno             }
3528c896fe29Sbellard             ts->val_type = TEMP_VAL_REG;
3529c896fe29Sbellard             ts->reg = reg;
3530c896fe29Sbellard             ts->mem_coherent = 0;
3531f8b2f202SRichard Henderson             s->reg_to_temp[reg] = ts;
3532ec7a869dSAurelien Jarno             if (NEED_SYNC_ARG(i)) {
353398b4e186SRichard Henderson                 temp_sync(s, ts, allocated_regs, 0, IS_DEAD_ARG(i));
353459d7c14eSRichard Henderson             } else if (IS_DEAD_ARG(i)) {
3535f8bf00f1SRichard Henderson                 temp_dead(s, ts);
3536c896fe29Sbellard             }
3537c896fe29Sbellard         }
35388c11ad25SAurelien Jarno     }
3539c896fe29Sbellard }
3540c896fe29Sbellard 
3541c896fe29Sbellard #ifdef CONFIG_PROFILER
3542c896fe29Sbellard 
3543c3fac113SEmilio G. Cota /* avoid copy/paste errors */
3544c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field)                       \
3545c3fac113SEmilio G. Cota     do {                                                \
3546c3fac113SEmilio G. Cota         (to)->field += atomic_read(&((from)->field));   \
3547c3fac113SEmilio G. Cota     } while (0)
3548c896fe29Sbellard 
3549c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field)                                       \
3550c3fac113SEmilio G. Cota     do {                                                                \
3551c3fac113SEmilio G. Cota         typeof((from)->field) val__ = atomic_read(&((from)->field));    \
3552c3fac113SEmilio G. Cota         if (val__ > (to)->field) {                                      \
3553c3fac113SEmilio G. Cota             (to)->field = val__;                                        \
3554c3fac113SEmilio G. Cota         }                                                               \
3555c3fac113SEmilio G. Cota     } while (0)
3556c3fac113SEmilio G. Cota 
3557c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */
3558c3fac113SEmilio G. Cota static inline
3559c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table)
3560c896fe29Sbellard {
35613468b59eSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
3562c3fac113SEmilio G. Cota     unsigned int i;
3563c3fac113SEmilio G. Cota 
35643468b59eSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
35653468b59eSEmilio G. Cota         TCGContext *s = atomic_read(&tcg_ctxs[i]);
35663468b59eSEmilio G. Cota         const TCGProfile *orig = &s->prof;
3567c3fac113SEmilio G. Cota 
3568c3fac113SEmilio G. Cota         if (counters) {
356972fd2efbSEmilio G. Cota             PROF_ADD(prof, orig, cpu_exec_time);
3570c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, tb_count1);
3571c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, tb_count);
3572c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, op_count);
3573c3fac113SEmilio G. Cota             PROF_MAX(prof, orig, op_count_max);
3574c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, temp_count);
3575c3fac113SEmilio G. Cota             PROF_MAX(prof, orig, temp_count_max);
3576c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, del_op_count);
3577c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, code_in_len);
3578c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, code_out_len);
3579c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, search_out_len);
3580c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, interm_time);
3581c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, code_time);
3582c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, la_time);
3583c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, opt_time);
3584c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, restore_count);
3585c3fac113SEmilio G. Cota             PROF_ADD(prof, orig, restore_time);
3586c3fac113SEmilio G. Cota         }
3587c3fac113SEmilio G. Cota         if (table) {
3588c896fe29Sbellard             int i;
3589d70724ceSzhanghailiang 
359015fc7daaSRichard Henderson             for (i = 0; i < NB_OPS; i++) {
3591c3fac113SEmilio G. Cota                 PROF_ADD(prof, orig, table_op_count[i]);
3592c3fac113SEmilio G. Cota             }
3593c3fac113SEmilio G. Cota         }
3594c3fac113SEmilio G. Cota     }
3595c3fac113SEmilio G. Cota }
3596c3fac113SEmilio G. Cota 
3597c3fac113SEmilio G. Cota #undef PROF_ADD
3598c3fac113SEmilio G. Cota #undef PROF_MAX
3599c3fac113SEmilio G. Cota 
3600c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof)
3601c3fac113SEmilio G. Cota {
3602c3fac113SEmilio G. Cota     tcg_profile_snapshot(prof, true, false);
3603c3fac113SEmilio G. Cota }
3604c3fac113SEmilio G. Cota 
3605c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof)
3606c3fac113SEmilio G. Cota {
3607c3fac113SEmilio G. Cota     tcg_profile_snapshot(prof, false, true);
3608c3fac113SEmilio G. Cota }
3609c3fac113SEmilio G. Cota 
3610c3fac113SEmilio G. Cota void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf)
3611c3fac113SEmilio G. Cota {
3612c3fac113SEmilio G. Cota     TCGProfile prof = {};
3613c3fac113SEmilio G. Cota     int i;
3614c3fac113SEmilio G. Cota 
3615c3fac113SEmilio G. Cota     tcg_profile_snapshot_table(&prof);
3616c3fac113SEmilio G. Cota     for (i = 0; i < NB_OPS; i++) {
3617246ae24dSMax Filippov         cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name,
3618c3fac113SEmilio G. Cota                     prof.table_op_count[i]);
3619c896fe29Sbellard     }
3620c896fe29Sbellard }
362172fd2efbSEmilio G. Cota 
362272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void)
362372fd2efbSEmilio G. Cota {
362472fd2efbSEmilio G. Cota     unsigned int n_ctxs = atomic_read(&n_tcg_ctxs);
362572fd2efbSEmilio G. Cota     unsigned int i;
362672fd2efbSEmilio G. Cota     int64_t ret = 0;
362772fd2efbSEmilio G. Cota 
362872fd2efbSEmilio G. Cota     for (i = 0; i < n_ctxs; i++) {
362972fd2efbSEmilio G. Cota         const TCGContext *s = atomic_read(&tcg_ctxs[i]);
363072fd2efbSEmilio G. Cota         const TCGProfile *prof = &s->prof;
363172fd2efbSEmilio G. Cota 
363272fd2efbSEmilio G. Cota         ret += atomic_read(&prof->cpu_exec_time);
363372fd2efbSEmilio G. Cota     }
363472fd2efbSEmilio G. Cota     return ret;
363572fd2efbSEmilio G. Cota }
3636246ae24dSMax Filippov #else
3637246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf)
3638246ae24dSMax Filippov {
3639246ae24dSMax Filippov     cpu_fprintf(f, "[TCG profiler not compiled]\n");
3640246ae24dSMax Filippov }
364172fd2efbSEmilio G. Cota 
364272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void)
364372fd2efbSEmilio G. Cota {
364472fd2efbSEmilio G. Cota     error_report("%s: TCG profiler not compiled", __func__);
364572fd2efbSEmilio G. Cota     exit(EXIT_FAILURE);
364672fd2efbSEmilio G. Cota }
3647c896fe29Sbellard #endif
3648c896fe29Sbellard 
3649c896fe29Sbellard 
36505bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb)
3651c896fe29Sbellard {
3652c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER
3653c3fac113SEmilio G. Cota     TCGProfile *prof = &s->prof;
3654c3fac113SEmilio G. Cota #endif
365515fa08f8SRichard Henderson     int i, num_insns;
365615fa08f8SRichard Henderson     TCGOp *op;
3657c896fe29Sbellard 
365804fe6400SRichard Henderson #ifdef CONFIG_PROFILER
365904fe6400SRichard Henderson     {
3660c1f543b7SEmilio G. Cota         int n = 0;
366104fe6400SRichard Henderson 
366215fa08f8SRichard Henderson         QTAILQ_FOREACH(op, &s->ops, link) {
366315fa08f8SRichard Henderson             n++;
366415fa08f8SRichard Henderson         }
3665c3fac113SEmilio G. Cota         atomic_set(&prof->op_count, prof->op_count + n);
3666c3fac113SEmilio G. Cota         if (n > prof->op_count_max) {
3667c3fac113SEmilio G. Cota             atomic_set(&prof->op_count_max, n);
366804fe6400SRichard Henderson         }
366904fe6400SRichard Henderson 
367004fe6400SRichard Henderson         n = s->nb_temps;
3671c3fac113SEmilio G. Cota         atomic_set(&prof->temp_count, prof->temp_count + n);
3672c3fac113SEmilio G. Cota         if (n > prof->temp_count_max) {
3673c3fac113SEmilio G. Cota             atomic_set(&prof->temp_count_max, n);
367404fe6400SRichard Henderson         }
367504fe6400SRichard Henderson     }
367604fe6400SRichard Henderson #endif
367704fe6400SRichard Henderson 
3678c896fe29Sbellard #ifdef DEBUG_DISAS
3679d977e1c2SAlex Bennée     if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP)
3680d977e1c2SAlex Bennée                  && qemu_log_in_addr_range(tb->pc))) {
36811ee73216SRichard Henderson         qemu_log_lock();
368293fcfe39Saliguori         qemu_log("OP:\n");
36831894f69aSRichard Henderson         tcg_dump_ops(s, false);
368493fcfe39Saliguori         qemu_log("\n");
36851ee73216SRichard Henderson         qemu_log_unlock();
3686c896fe29Sbellard     }
3687c896fe29Sbellard #endif
3688c896fe29Sbellard 
3689c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER
3690c3fac113SEmilio G. Cota     atomic_set(&prof->opt_time, prof->opt_time - profile_getclock());
3691c5cc28ffSAurelien Jarno #endif
3692c5cc28ffSAurelien Jarno 
36938f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS
3694c45cb8bbSRichard Henderson     tcg_optimize(s);
36958f2e8c07SKirill Batuzov #endif
36968f2e8c07SKirill Batuzov 
3697a23a9ec6Sbellard #ifdef CONFIG_PROFILER
3698c3fac113SEmilio G. Cota     atomic_set(&prof->opt_time, prof->opt_time + profile_getclock());
3699c3fac113SEmilio G. Cota     atomic_set(&prof->la_time, prof->la_time - profile_getclock());
3700a23a9ec6Sbellard #endif
3701c5cc28ffSAurelien Jarno 
3702b4fc67c7SRichard Henderson     reachable_code_pass(s);
3703b83eabeaSRichard Henderson     liveness_pass_1(s);
37045a18407fSRichard Henderson 
37055a18407fSRichard Henderson     if (s->nb_indirects > 0) {
37065a18407fSRichard Henderson #ifdef DEBUG_DISAS
37075a18407fSRichard Henderson         if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND)
37085a18407fSRichard Henderson                      && qemu_log_in_addr_range(tb->pc))) {
37091ee73216SRichard Henderson             qemu_log_lock();
37105a18407fSRichard Henderson             qemu_log("OP before indirect lowering:\n");
37111894f69aSRichard Henderson             tcg_dump_ops(s, false);
37125a18407fSRichard Henderson             qemu_log("\n");
37131ee73216SRichard Henderson             qemu_log_unlock();
37145a18407fSRichard Henderson         }
37155a18407fSRichard Henderson #endif
37165a18407fSRichard Henderson         /* Replace indirect temps with direct temps.  */
3717b83eabeaSRichard Henderson         if (liveness_pass_2(s)) {
37185a18407fSRichard Henderson             /* If changes were made, re-run liveness.  */
3719b83eabeaSRichard Henderson             liveness_pass_1(s);
37205a18407fSRichard Henderson         }
37215a18407fSRichard Henderson     }
3722c5cc28ffSAurelien Jarno 
3723a23a9ec6Sbellard #ifdef CONFIG_PROFILER
3724c3fac113SEmilio G. Cota     atomic_set(&prof->la_time, prof->la_time + profile_getclock());
3725a23a9ec6Sbellard #endif
3726c896fe29Sbellard 
3727c896fe29Sbellard #ifdef DEBUG_DISAS
3728d977e1c2SAlex Bennée     if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT)
3729d977e1c2SAlex Bennée                  && qemu_log_in_addr_range(tb->pc))) {
37301ee73216SRichard Henderson         qemu_log_lock();
3731c5cc28ffSAurelien Jarno         qemu_log("OP after optimization and liveness analysis:\n");
37321894f69aSRichard Henderson         tcg_dump_ops(s, true);
373393fcfe39Saliguori         qemu_log("\n");
37341ee73216SRichard Henderson         qemu_log_unlock();
3735c896fe29Sbellard     }
3736c896fe29Sbellard #endif
3737c896fe29Sbellard 
3738c896fe29Sbellard     tcg_reg_alloc_start(s);
3739c896fe29Sbellard 
3740e7e168f4SEmilio G. Cota     s->code_buf = tb->tc.ptr;
3741e7e168f4SEmilio G. Cota     s->code_ptr = tb->tc.ptr;
3742c896fe29Sbellard 
3743659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS
37446001f772SLaurent Vivier     QSIMPLEQ_INIT(&s->ldst_labels);
3745659ef5cbSRichard Henderson #endif
374657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
374757a26946SRichard Henderson     s->pool_labels = NULL;
374857a26946SRichard Henderson #endif
37499ecefc84SRichard Henderson 
3750fca8a500SRichard Henderson     num_insns = -1;
375115fa08f8SRichard Henderson     QTAILQ_FOREACH(op, &s->ops, link) {
3752c45cb8bbSRichard Henderson         TCGOpcode opc = op->opc;
3753b3db8758Sblueswir1 
3754c896fe29Sbellard #ifdef CONFIG_PROFILER
3755c3fac113SEmilio G. Cota         atomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1);
3756c896fe29Sbellard #endif
3757c45cb8bbSRichard Henderson 
3758c896fe29Sbellard         switch (opc) {
3759c896fe29Sbellard         case INDEX_op_mov_i32:
3760c896fe29Sbellard         case INDEX_op_mov_i64:
3761d2fd745fSRichard Henderson         case INDEX_op_mov_vec:
3762dd186292SRichard Henderson             tcg_reg_alloc_mov(s, op);
3763c896fe29Sbellard             break;
3764e8996ee0Sbellard         case INDEX_op_movi_i32:
3765e8996ee0Sbellard         case INDEX_op_movi_i64:
3766d2fd745fSRichard Henderson         case INDEX_op_dupi_vec:
3767dd186292SRichard Henderson             tcg_reg_alloc_movi(s, op);
3768e8996ee0Sbellard             break;
3769765b842aSRichard Henderson         case INDEX_op_insn_start:
3770fca8a500SRichard Henderson             if (num_insns >= 0) {
37719f754620SRichard Henderson                 size_t off = tcg_current_code_size(s);
37729f754620SRichard Henderson                 s->gen_insn_end_off[num_insns] = off;
37739f754620SRichard Henderson                 /* Assert that we do not overflow our stored offset.  */
37749f754620SRichard Henderson                 assert(s->gen_insn_end_off[num_insns] == off);
3775fca8a500SRichard Henderson             }
3776fca8a500SRichard Henderson             num_insns++;
3777bad729e2SRichard Henderson             for (i = 0; i < TARGET_INSN_START_WORDS; ++i) {
3778bad729e2SRichard Henderson                 target_ulong a;
3779bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
3780efee3746SRichard Henderson                 a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]);
3781bad729e2SRichard Henderson #else
3782efee3746SRichard Henderson                 a = op->args[i];
3783bad729e2SRichard Henderson #endif
3784fca8a500SRichard Henderson                 s->gen_insn_data[num_insns][i] = a;
3785bad729e2SRichard Henderson             }
3786c896fe29Sbellard             break;
37875ff9d6a4Sbellard         case INDEX_op_discard:
378843439139SRichard Henderson             temp_dead(s, arg_temp(op->args[0]));
37895ff9d6a4Sbellard             break;
3790c896fe29Sbellard         case INDEX_op_set_label:
3791e8996ee0Sbellard             tcg_reg_alloc_bb_end(s, s->reserved_regs);
3792efee3746SRichard Henderson             tcg_out_label(s, arg_label(op->args[0]), s->code_ptr);
3793c896fe29Sbellard             break;
3794c896fe29Sbellard         case INDEX_op_call:
3795dd186292SRichard Henderson             tcg_reg_alloc_call(s, op);
3796c45cb8bbSRichard Henderson             break;
3797c896fe29Sbellard         default:
379825c4d9ccSRichard Henderson             /* Sanity check that we've not introduced any unhandled opcodes. */
3799be0f34b5SRichard Henderson             tcg_debug_assert(tcg_op_supported(opc));
3800c896fe29Sbellard             /* Note: in order to speed up the code, it would be much
3801c896fe29Sbellard                faster to have specialized register allocator functions for
3802c896fe29Sbellard                some common argument patterns */
3803dd186292SRichard Henderson             tcg_reg_alloc_op(s, op);
3804c896fe29Sbellard             break;
3805c896fe29Sbellard         }
38068d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG
3807c896fe29Sbellard         check_regs(s);
3808c896fe29Sbellard #endif
3809b125f9dcSRichard Henderson         /* Test for (pending) buffer overflow.  The assumption is that any
3810b125f9dcSRichard Henderson            one operation beginning below the high water mark cannot overrun
3811b125f9dcSRichard Henderson            the buffer completely.  Thus we can test for overflow after
3812b125f9dcSRichard Henderson            generating code without having to check during generation.  */
3813644da9b3SJohn Clarke         if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) {
3814b125f9dcSRichard Henderson             return -1;
3815b125f9dcSRichard Henderson         }
3816c896fe29Sbellard     }
3817fca8a500SRichard Henderson     tcg_debug_assert(num_insns >= 0);
3818fca8a500SRichard Henderson     s->gen_insn_end_off[num_insns] = tcg_current_code_size(s);
3819c45cb8bbSRichard Henderson 
3820b76f0d8cSYeongkyoon Lee     /* Generate TB finalization at the end of block */
3821659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS
3822659ef5cbSRichard Henderson     if (!tcg_out_ldst_finalize(s)) {
382323dceda6SRichard Henderson         return -1;
382423dceda6SRichard Henderson     }
3825659ef5cbSRichard Henderson #endif
382657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS
382757a26946SRichard Henderson     if (!tcg_out_pool_finalize(s)) {
382857a26946SRichard Henderson         return -1;
382957a26946SRichard Henderson     }
383057a26946SRichard Henderson #endif
3831c896fe29Sbellard 
3832c896fe29Sbellard     /* flush instruction cache */
38331813e175SRichard Henderson     flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr);
38342aeabc08SStefan Weil 
38351813e175SRichard Henderson     return tcg_current_code_size(s);
3836c896fe29Sbellard }
3837c896fe29Sbellard 
3838a23a9ec6Sbellard #ifdef CONFIG_PROFILER
3839405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
3840a23a9ec6Sbellard {
3841c3fac113SEmilio G. Cota     TCGProfile prof = {};
3842c3fac113SEmilio G. Cota     const TCGProfile *s;
3843c3fac113SEmilio G. Cota     int64_t tb_count;
3844c3fac113SEmilio G. Cota     int64_t tb_div_count;
3845c3fac113SEmilio G. Cota     int64_t tot;
3846c3fac113SEmilio G. Cota 
3847c3fac113SEmilio G. Cota     tcg_profile_snapshot_counters(&prof);
3848c3fac113SEmilio G. Cota     s = &prof;
3849c3fac113SEmilio G. Cota     tb_count = s->tb_count;
3850c3fac113SEmilio G. Cota     tb_div_count = tb_count ? tb_count : 1;
3851c3fac113SEmilio G. Cota     tot = s->interm_time + s->code_time;
3852a23a9ec6Sbellard 
3853a23a9ec6Sbellard     cpu_fprintf(f, "JIT cycles          %" PRId64 " (%0.3f s at 2.4 GHz)\n",
3854a23a9ec6Sbellard                 tot, tot / 2.4e9);
3855a23a9ec6Sbellard     cpu_fprintf(f, "translated TBs      %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n",
3856fca8a500SRichard Henderson                 tb_count, s->tb_count1 - tb_count,
3857fca8a500SRichard Henderson                 (double)(s->tb_count1 - s->tb_count)
3858fca8a500SRichard Henderson                 / (s->tb_count1 ? s->tb_count1 : 1) * 100.0);
3859a23a9ec6Sbellard     cpu_fprintf(f, "avg ops/TB          %0.1f max=%d\n",
3860fca8a500SRichard Henderson                 (double)s->op_count / tb_div_count, s->op_count_max);
3861a23a9ec6Sbellard     cpu_fprintf(f, "deleted ops/TB      %0.2f\n",
3862fca8a500SRichard Henderson                 (double)s->del_op_count / tb_div_count);
3863a23a9ec6Sbellard     cpu_fprintf(f, "avg temps/TB        %0.2f max=%d\n",
3864fca8a500SRichard Henderson                 (double)s->temp_count / tb_div_count, s->temp_count_max);
3865fca8a500SRichard Henderson     cpu_fprintf(f, "avg host code/TB    %0.1f\n",
3866fca8a500SRichard Henderson                 (double)s->code_out_len / tb_div_count);
3867fca8a500SRichard Henderson     cpu_fprintf(f, "avg search data/TB  %0.1f\n",
3868fca8a500SRichard Henderson                 (double)s->search_out_len / tb_div_count);
3869a23a9ec6Sbellard 
3870a23a9ec6Sbellard     cpu_fprintf(f, "cycles/op           %0.1f\n",
3871a23a9ec6Sbellard                 s->op_count ? (double)tot / s->op_count : 0);
3872a23a9ec6Sbellard     cpu_fprintf(f, "cycles/in byte      %0.1f\n",
3873a23a9ec6Sbellard                 s->code_in_len ? (double)tot / s->code_in_len : 0);
3874a23a9ec6Sbellard     cpu_fprintf(f, "cycles/out byte     %0.1f\n",
3875a23a9ec6Sbellard                 s->code_out_len ? (double)tot / s->code_out_len : 0);
3876fca8a500SRichard Henderson     cpu_fprintf(f, "cycles/search byte     %0.1f\n",
3877fca8a500SRichard Henderson                 s->search_out_len ? (double)tot / s->search_out_len : 0);
3878fca8a500SRichard Henderson     if (tot == 0) {
3879a23a9ec6Sbellard         tot = 1;
3880fca8a500SRichard Henderson     }
3881a23a9ec6Sbellard     cpu_fprintf(f, "  gen_interm time   %0.1f%%\n",
3882a23a9ec6Sbellard                 (double)s->interm_time / tot * 100.0);
3883a23a9ec6Sbellard     cpu_fprintf(f, "  gen_code time     %0.1f%%\n",
3884a23a9ec6Sbellard                 (double)s->code_time / tot * 100.0);
3885c5cc28ffSAurelien Jarno     cpu_fprintf(f, "optim./code time    %0.1f%%\n",
3886c5cc28ffSAurelien Jarno                 (double)s->opt_time / (s->code_time ? s->code_time : 1)
3887c5cc28ffSAurelien Jarno                 * 100.0);
3888a23a9ec6Sbellard     cpu_fprintf(f, "liveness/code time  %0.1f%%\n",
3889a23a9ec6Sbellard                 (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0);
3890a23a9ec6Sbellard     cpu_fprintf(f, "cpu_restore count   %" PRId64 "\n",
3891a23a9ec6Sbellard                 s->restore_count);
3892a23a9ec6Sbellard     cpu_fprintf(f, "  avg cycles        %0.1f\n",
3893a23a9ec6Sbellard                 s->restore_count ? (double)s->restore_time / s->restore_count : 0);
3894a23a9ec6Sbellard }
3895a23a9ec6Sbellard #else
3896405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
3897a23a9ec6Sbellard {
389824bf7b3aSbellard     cpu_fprintf(f, "[TCG profiler not compiled]\n");
3899a23a9ec6Sbellard }
3900a23a9ec6Sbellard #endif
3901813da627SRichard Henderson 
3902813da627SRichard Henderson #ifdef ELF_HOST_MACHINE
39035872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things:
39045872bbf2SRichard Henderson 
39055872bbf2SRichard Henderson    (1) Define ELF_HOST_MACHINE to indicate both what value to
39065872bbf2SRichard Henderson        put into the ELF image and to indicate support for the feature.
39075872bbf2SRichard Henderson 
39085872bbf2SRichard Henderson    (2) Define tcg_register_jit.  This should create a buffer containing
39095872bbf2SRichard Henderson        the contents of a .debug_frame section that describes the post-
39105872bbf2SRichard Henderson        prologue unwind info for the tcg machine.
39115872bbf2SRichard Henderson 
39125872bbf2SRichard Henderson    (3) Call tcg_register_jit_int, with the constructed .debug_frame.
39135872bbf2SRichard Henderson */
3914813da627SRichard Henderson 
3915813da627SRichard Henderson /* Begin GDB interface.  THE FOLLOWING MUST MATCH GDB DOCS.  */
/* Values stored in jit_descriptor.action_flag. */
typedef enum {
    JIT_NOACTION      = 0,
    JIT_REGISTER_FN   = 1,
    JIT_UNREGISTER_FN = 2
} jit_actions_t;
3921813da627SRichard Henderson 
/* One node of the doubly linked list of registered symbol files. */
struct jit_code_entry {
    struct jit_code_entry *next_entry;  /* following node in the list */
    struct jit_code_entry *prev_entry;  /* preceding node in the list */
    const void *symfile_addr;           /* start of the in-memory symbol file */
    uint64_t symfile_size;              /* size of that symbol file in bytes */
};
3928813da627SRichard Henderson 
/* Root object of the JIT interface; a single instance is defined below. */
struct jit_descriptor {
    uint32_t version;                       /* interface version */
    uint32_t action_flag;                   /* one of jit_actions_t */
    struct jit_code_entry *relevant_entry;  /* entry the action applies to */
    struct jit_code_entry *first_entry;     /* head of the entry list */
};
3935813da627SRichard Henderson 
/*
 * Hook called after __jit_debug_descriptor has been updated.  The function
 * is kept out of line and contains an (empty) asm statement so that the
 * call is not optimized away.
 */
__attribute__((noinline)) void __jit_debug_register_code(void);
void __jit_debug_register_code(void)
{
    __asm__("");
}
3941813da627SRichard Henderson 
3942813da627SRichard Henderson /* Must statically initialize the version, because GDB may check
3943813da627SRichard Henderson    the version before we can set it.  */
3944813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 };
3945813da627SRichard Henderson 
3946813da627SRichard Henderson /* End GDB interface.  */
3947813da627SRichard Henderson 
/*
 * Return the byte offset of the name @str inside the ELF string table
 * @strtab, or 0 (the offset of the empty name) if @str is not present.
 *
 * The search starts at offset 1, skipping the empty name at offset 0.
 * The table must be terminated by an empty string, i.e. the last name
 * must be followed by at least one extra NUL byte; a zero-padded char
 * array satisfies this.  Reaching that empty string ends the search
 * instead of walking past the end of the table.
 */
static int find_string(const char *strtab, const char *str)
{
    const char *p = strtab + 1;

    while (1) {
        if (strcmp(p, str) == 0) {
            return p - strtab;
        }
        if (*p == '\0') {
            /* Hit the terminating empty string: @str is not in the table. */
            return 0;
        }
        /* Advance past this name and its NUL terminator. */
        p += strlen(p) + 1;
    }
}
3959813da627SRichard Henderson 
39605872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size,
39612c90784aSRichard Henderson                                  const void *debug_frame,
39622c90784aSRichard Henderson                                  size_t debug_frame_size)
3963813da627SRichard Henderson {
39645872bbf2SRichard Henderson     struct __attribute__((packed)) DebugInfo {
39655872bbf2SRichard Henderson         uint32_t  len;
39665872bbf2SRichard Henderson         uint16_t  version;
39675872bbf2SRichard Henderson         uint32_t  abbrev;
39685872bbf2SRichard Henderson         uint8_t   ptr_size;
39695872bbf2SRichard Henderson         uint8_t   cu_die;
39705872bbf2SRichard Henderson         uint16_t  cu_lang;
39715872bbf2SRichard Henderson         uintptr_t cu_low_pc;
39725872bbf2SRichard Henderson         uintptr_t cu_high_pc;
39735872bbf2SRichard Henderson         uint8_t   fn_die;
39745872bbf2SRichard Henderson         char      fn_name[16];
39755872bbf2SRichard Henderson         uintptr_t fn_low_pc;
39765872bbf2SRichard Henderson         uintptr_t fn_high_pc;
39775872bbf2SRichard Henderson         uint8_t   cu_eoc;
39785872bbf2SRichard Henderson     };
3979813da627SRichard Henderson 
3980813da627SRichard Henderson     struct ElfImage {
3981813da627SRichard Henderson         ElfW(Ehdr) ehdr;
3982813da627SRichard Henderson         ElfW(Phdr) phdr;
39835872bbf2SRichard Henderson         ElfW(Shdr) shdr[7];
39845872bbf2SRichard Henderson         ElfW(Sym)  sym[2];
39855872bbf2SRichard Henderson         struct DebugInfo di;
39865872bbf2SRichard Henderson         uint8_t    da[24];
39875872bbf2SRichard Henderson         char       str[80];
39885872bbf2SRichard Henderson     };
39895872bbf2SRichard Henderson 
39905872bbf2SRichard Henderson     struct ElfImage *img;
39915872bbf2SRichard Henderson 
39925872bbf2SRichard Henderson     static const struct ElfImage img_template = {
39935872bbf2SRichard Henderson         .ehdr = {
39945872bbf2SRichard Henderson             .e_ident[EI_MAG0] = ELFMAG0,
39955872bbf2SRichard Henderson             .e_ident[EI_MAG1] = ELFMAG1,
39965872bbf2SRichard Henderson             .e_ident[EI_MAG2] = ELFMAG2,
39975872bbf2SRichard Henderson             .e_ident[EI_MAG3] = ELFMAG3,
39985872bbf2SRichard Henderson             .e_ident[EI_CLASS] = ELF_CLASS,
39995872bbf2SRichard Henderson             .e_ident[EI_DATA] = ELF_DATA,
40005872bbf2SRichard Henderson             .e_ident[EI_VERSION] = EV_CURRENT,
40015872bbf2SRichard Henderson             .e_type = ET_EXEC,
40025872bbf2SRichard Henderson             .e_machine = ELF_HOST_MACHINE,
40035872bbf2SRichard Henderson             .e_version = EV_CURRENT,
40045872bbf2SRichard Henderson             .e_phoff = offsetof(struct ElfImage, phdr),
40055872bbf2SRichard Henderson             .e_shoff = offsetof(struct ElfImage, shdr),
40065872bbf2SRichard Henderson             .e_ehsize = sizeof(ElfW(Shdr)),
40075872bbf2SRichard Henderson             .e_phentsize = sizeof(ElfW(Phdr)),
40085872bbf2SRichard Henderson             .e_phnum = 1,
40095872bbf2SRichard Henderson             .e_shentsize = sizeof(ElfW(Shdr)),
40105872bbf2SRichard Henderson             .e_shnum = ARRAY_SIZE(img->shdr),
40115872bbf2SRichard Henderson             .e_shstrndx = ARRAY_SIZE(img->shdr) - 1,
4012abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS
4013abbb3eaeSRichard Henderson             .e_flags = ELF_HOST_FLAGS,
4014abbb3eaeSRichard Henderson #endif
4015abbb3eaeSRichard Henderson #ifdef ELF_OSABI
4016abbb3eaeSRichard Henderson             .e_ident[EI_OSABI] = ELF_OSABI,
4017abbb3eaeSRichard Henderson #endif
40185872bbf2SRichard Henderson         },
40195872bbf2SRichard Henderson         .phdr = {
40205872bbf2SRichard Henderson             .p_type = PT_LOAD,
40215872bbf2SRichard Henderson             .p_flags = PF_X,
40225872bbf2SRichard Henderson         },
40235872bbf2SRichard Henderson         .shdr = {
40245872bbf2SRichard Henderson             [0] = { .sh_type = SHT_NULL },
40255872bbf2SRichard Henderson             /* Trick: The contents of code_gen_buffer are not present in
40265872bbf2SRichard Henderson                this fake ELF file; that got allocated elsewhere.  Therefore
40275872bbf2SRichard Henderson                we mark .text as SHT_NOBITS (similar to .bss) so that readers
40285872bbf2SRichard Henderson                will not look for contents.  We can record any address.  */
40295872bbf2SRichard Henderson             [1] = { /* .text */
40305872bbf2SRichard Henderson                 .sh_type = SHT_NOBITS,
40315872bbf2SRichard Henderson                 .sh_flags = SHF_EXECINSTR | SHF_ALLOC,
40325872bbf2SRichard Henderson             },
40335872bbf2SRichard Henderson             [2] = { /* .debug_info */
40345872bbf2SRichard Henderson                 .sh_type = SHT_PROGBITS,
40355872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, di),
40365872bbf2SRichard Henderson                 .sh_size = sizeof(struct DebugInfo),
40375872bbf2SRichard Henderson             },
40385872bbf2SRichard Henderson             [3] = { /* .debug_abbrev */
40395872bbf2SRichard Henderson                 .sh_type = SHT_PROGBITS,
40405872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, da),
40415872bbf2SRichard Henderson                 .sh_size = sizeof(img->da),
40425872bbf2SRichard Henderson             },
40435872bbf2SRichard Henderson             [4] = { /* .debug_frame */
40445872bbf2SRichard Henderson                 .sh_type = SHT_PROGBITS,
40455872bbf2SRichard Henderson                 .sh_offset = sizeof(struct ElfImage),
40465872bbf2SRichard Henderson             },
40475872bbf2SRichard Henderson             [5] = { /* .symtab */
40485872bbf2SRichard Henderson                 .sh_type = SHT_SYMTAB,
40495872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, sym),
40505872bbf2SRichard Henderson                 .sh_size = sizeof(img->sym),
40515872bbf2SRichard Henderson                 .sh_info = 1,
40525872bbf2SRichard Henderson                 .sh_link = ARRAY_SIZE(img->shdr) - 1,
40535872bbf2SRichard Henderson                 .sh_entsize = sizeof(ElfW(Sym)),
40545872bbf2SRichard Henderson             },
40555872bbf2SRichard Henderson             [6] = { /* .strtab */
40565872bbf2SRichard Henderson                 .sh_type = SHT_STRTAB,
40575872bbf2SRichard Henderson                 .sh_offset = offsetof(struct ElfImage, str),
40585872bbf2SRichard Henderson                 .sh_size = sizeof(img->str),
40595872bbf2SRichard Henderson             }
40605872bbf2SRichard Henderson         },
40615872bbf2SRichard Henderson         .sym = {
40625872bbf2SRichard Henderson             [1] = { /* code_gen_buffer */
40635872bbf2SRichard Henderson                 .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC),
40645872bbf2SRichard Henderson                 .st_shndx = 1,
40655872bbf2SRichard Henderson             }
40665872bbf2SRichard Henderson         },
40675872bbf2SRichard Henderson         .di = {
40685872bbf2SRichard Henderson             .len = sizeof(struct DebugInfo) - 4,
40695872bbf2SRichard Henderson             .version = 2,
40705872bbf2SRichard Henderson             .ptr_size = sizeof(void *),
40715872bbf2SRichard Henderson             .cu_die = 1,
40725872bbf2SRichard Henderson             .cu_lang = 0x8001,  /* DW_LANG_Mips_Assembler */
40735872bbf2SRichard Henderson             .fn_die = 2,
40745872bbf2SRichard Henderson             .fn_name = "code_gen_buffer"
40755872bbf2SRichard Henderson         },
40765872bbf2SRichard Henderson         .da = {
40775872bbf2SRichard Henderson             1,          /* abbrev number (the cu) */
40785872bbf2SRichard Henderson             0x11, 1,    /* DW_TAG_compile_unit, has children */
40795872bbf2SRichard Henderson             0x13, 0x5,  /* DW_AT_language, DW_FORM_data2 */
40805872bbf2SRichard Henderson             0x11, 0x1,  /* DW_AT_low_pc, DW_FORM_addr */
40815872bbf2SRichard Henderson             0x12, 0x1,  /* DW_AT_high_pc, DW_FORM_addr */
40825872bbf2SRichard Henderson             0, 0,       /* end of abbrev */
40835872bbf2SRichard Henderson             2,          /* abbrev number (the fn) */
40845872bbf2SRichard Henderson             0x2e, 0,    /* DW_TAG_subprogram, no children */
40855872bbf2SRichard Henderson             0x3, 0x8,   /* DW_AT_name, DW_FORM_string */
40865872bbf2SRichard Henderson             0x11, 0x1,  /* DW_AT_low_pc, DW_FORM_addr */
40875872bbf2SRichard Henderson             0x12, 0x1,  /* DW_AT_high_pc, DW_FORM_addr */
40885872bbf2SRichard Henderson             0, 0,       /* end of abbrev */
40895872bbf2SRichard Henderson             0           /* no more abbrev */
40905872bbf2SRichard Henderson         },
40915872bbf2SRichard Henderson         .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0"
40925872bbf2SRichard Henderson                ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer",
4093813da627SRichard Henderson     };
4094813da627SRichard Henderson 
4095813da627SRichard Henderson     /* We only need a single jit entry; statically allocate it.  */
4096813da627SRichard Henderson     static struct jit_code_entry one_entry;
4097813da627SRichard Henderson 
40985872bbf2SRichard Henderson     uintptr_t buf = (uintptr_t)buf_ptr;
4099813da627SRichard Henderson     size_t img_size = sizeof(struct ElfImage) + debug_frame_size;
41002c90784aSRichard Henderson     DebugFrameHeader *dfh;
4101813da627SRichard Henderson 
41025872bbf2SRichard Henderson     img = g_malloc(img_size);
41035872bbf2SRichard Henderson     *img = img_template;
4104813da627SRichard Henderson 
41055872bbf2SRichard Henderson     img->phdr.p_vaddr = buf;
41065872bbf2SRichard Henderson     img->phdr.p_paddr = buf;
41075872bbf2SRichard Henderson     img->phdr.p_memsz = buf_size;
4108813da627SRichard Henderson 
41095872bbf2SRichard Henderson     img->shdr[1].sh_name = find_string(img->str, ".text");
41105872bbf2SRichard Henderson     img->shdr[1].sh_addr = buf;
41115872bbf2SRichard Henderson     img->shdr[1].sh_size = buf_size;
4112813da627SRichard Henderson 
41135872bbf2SRichard Henderson     img->shdr[2].sh_name = find_string(img->str, ".debug_info");
41145872bbf2SRichard Henderson     img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev");
41155872bbf2SRichard Henderson 
41165872bbf2SRichard Henderson     img->shdr[4].sh_name = find_string(img->str, ".debug_frame");
41175872bbf2SRichard Henderson     img->shdr[4].sh_size = debug_frame_size;
41185872bbf2SRichard Henderson 
41195872bbf2SRichard Henderson     img->shdr[5].sh_name = find_string(img->str, ".symtab");
41205872bbf2SRichard Henderson     img->shdr[6].sh_name = find_string(img->str, ".strtab");
41215872bbf2SRichard Henderson 
41225872bbf2SRichard Henderson     img->sym[1].st_name = find_string(img->str, "code_gen_buffer");
41235872bbf2SRichard Henderson     img->sym[1].st_value = buf;
41245872bbf2SRichard Henderson     img->sym[1].st_size = buf_size;
41255872bbf2SRichard Henderson 
41265872bbf2SRichard Henderson     img->di.cu_low_pc = buf;
412745aba097SRichard Henderson     img->di.cu_high_pc = buf + buf_size;
41285872bbf2SRichard Henderson     img->di.fn_low_pc = buf;
412945aba097SRichard Henderson     img->di.fn_high_pc = buf + buf_size;
4130813da627SRichard Henderson 
41312c90784aSRichard Henderson     dfh = (DebugFrameHeader *)(img + 1);
41322c90784aSRichard Henderson     memcpy(dfh, debug_frame, debug_frame_size);
41332c90784aSRichard Henderson     dfh->fde.func_start = buf;
41342c90784aSRichard Henderson     dfh->fde.func_len = buf_size;
41352c90784aSRichard Henderson 
4136813da627SRichard Henderson #ifdef DEBUG_JIT
4137813da627SRichard Henderson     /* Enable this block to be able to debug the ELF image file creation.
4138813da627SRichard Henderson        One can use readelf, objdump, or other inspection utilities.  */
4139813da627SRichard Henderson     {
4140813da627SRichard Henderson         FILE *f = fopen("/tmp/qemu.jit", "w+b");
4141813da627SRichard Henderson         if (f) {
41425872bbf2SRichard Henderson             if (fwrite(img, img_size, 1, f) != img_size) {
4143813da627SRichard Henderson                 /* Avoid stupid unused return value warning for fwrite.  */
4144813da627SRichard Henderson             }
4145813da627SRichard Henderson             fclose(f);
4146813da627SRichard Henderson         }
4147813da627SRichard Henderson     }
4148813da627SRichard Henderson #endif
4149813da627SRichard Henderson 
4150813da627SRichard Henderson     one_entry.symfile_addr = img;
4151813da627SRichard Henderson     one_entry.symfile_size = img_size;
4152813da627SRichard Henderson 
4153813da627SRichard Henderson     __jit_debug_descriptor.action_flag = JIT_REGISTER_FN;
4154813da627SRichard Henderson     __jit_debug_descriptor.relevant_entry = &one_entry;
4155813da627SRichard Henderson     __jit_debug_descriptor.first_entry = &one_entry;
4156813da627SRichard Henderson     __jit_debug_register_code();
4157813da627SRichard Henderson }
4158813da627SRichard Henderson #else
41595872bbf2SRichard Henderson /* No support for the feature.  Provide the entry point expected by exec.c,
41605872bbf2SRichard Henderson    and implement the internal function we declared earlier.  */
4161813da627SRichard Henderson 
/* Variant used when ELF_HOST_MACHINE is not defined: does nothing. */
static void tcg_register_jit_int(void *buf, size_t size,
                                 const void *debug_frame,
                                 size_t debug_frame_size)
{
    (void)buf;
    (void)size;
    (void)debug_frame;
    (void)debug_frame_size;
}
4167813da627SRichard Henderson 
/* Variant used when ELF_HOST_MACHINE is not defined: does nothing. */
void tcg_register_jit(void *buf, size_t buf_size)
{
    (void)buf;
    (void)buf_size;
}
4171813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */
4172db432672SRichard Henderson 
4173db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec
4174db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...)
4175db432672SRichard Henderson {
4176db432672SRichard Henderson     g_assert_not_reached();
4177db432672SRichard Henderson }
4178db432672SRichard Henderson #endif
4179