xref: /qemu/include/tcg/tcg.h (revision c5f122fdcc280a82e7c5f31de890f985aa7ba773)
1 /*
2  * Tiny Code Generator for QEMU
3  *
4  * Copyright (c) 2008 Fabrice Bellard
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to deal
8  * in the Software without restriction, including without limitation the rights
9  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10  * copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22  * THE SOFTWARE.
23  */
24 
25 #ifndef TCG_H
26 #define TCG_H
27 
28 #include "exec/memop.h"
29 #include "exec/memopidx.h"
30 #include "qemu/bitops.h"
31 #include "qemu/plugin.h"
32 #include "qemu/queue.h"
33 #include "tcg/tcg-mo.h"
34 #include "tcg-target-reg-bits.h"
35 #include "tcg-target.h"
36 #include "tcg/tcg-cond.h"
37 #include "tcg/insn-start-words.h"
38 #include "tcg/debug-assert.h"
39 
40 /* XXX: make safe guess about sizes */
41 #define MAX_OP_PER_INSTR 266
42 
43 #define CPU_TEMP_BUF_NLONGS 128
44 #define TCG_STATIC_FRAME_SIZE  (CPU_TEMP_BUF_NLONGS * sizeof(long))
45 
46 #if TCG_TARGET_REG_BITS == 32
47 typedef int32_t tcg_target_long;
48 typedef uint32_t tcg_target_ulong;
49 #define TCG_PRIlx PRIx32
50 #define TCG_PRIld PRId32
51 #elif TCG_TARGET_REG_BITS == 64
52 typedef int64_t tcg_target_long;
53 typedef uint64_t tcg_target_ulong;
54 #define TCG_PRIlx PRIx64
55 #define TCG_PRIld PRId64
56 #else
57 #error unsupported
58 #endif
59 
60 #if TCG_TARGET_NB_REGS <= 32
61 typedef uint32_t TCGRegSet;
62 #elif TCG_TARGET_NB_REGS <= 64
63 typedef uint64_t TCGRegSet;
64 #else
65 #error unsupported
66 #endif
67 
68 typedef enum TCGOpcode {
69 #define DEF(name, oargs, iargs, cargs, flags) INDEX_op_ ## name,
70 #include "tcg/tcg-opc.h"
71 #undef DEF
72     NB_OPS,
73 } TCGOpcode;
74 
75 #define tcg_regset_set_reg(d, r)   ((d) |= (TCGRegSet)1 << (r))
76 #define tcg_regset_reset_reg(d, r) ((d) &= ~((TCGRegSet)1 << (r)))
77 #define tcg_regset_test_reg(d, r)  (((d) >> (r)) & 1)
78 
79 #ifndef TCG_TARGET_INSN_UNIT_SIZE
80 # error "Missing TCG_TARGET_INSN_UNIT_SIZE"
81 #elif TCG_TARGET_INSN_UNIT_SIZE == 1
82 typedef uint8_t tcg_insn_unit;
83 #elif TCG_TARGET_INSN_UNIT_SIZE == 2
84 typedef uint16_t tcg_insn_unit;
85 #elif TCG_TARGET_INSN_UNIT_SIZE == 4
86 typedef uint32_t tcg_insn_unit;
87 #elif TCG_TARGET_INSN_UNIT_SIZE == 8
88 typedef uint64_t tcg_insn_unit;
89 #else
90 /* The port better have done this.  */
91 #endif
92 
93 typedef struct TCGRelocation TCGRelocation;
94 struct TCGRelocation {
95     QSIMPLEQ_ENTRY(TCGRelocation) next;
96     tcg_insn_unit *ptr;
97     intptr_t addend;
98     int type;
99 };
100 
101 typedef struct TCGOp TCGOp;
102 typedef struct TCGLabelUse TCGLabelUse;
103 struct TCGLabelUse {
104     QSIMPLEQ_ENTRY(TCGLabelUse) next;
105     TCGOp *op;
106 };
107 
108 typedef struct TCGLabel TCGLabel;
109 struct TCGLabel {
110     bool present;
111     bool has_value;
112     uint16_t id;
113     union {
114         uintptr_t value;
115         const tcg_insn_unit *value_ptr;
116     } u;
117     QSIMPLEQ_HEAD(, TCGLabelUse) branches;
118     QSIMPLEQ_HEAD(, TCGRelocation) relocs;
119     QSIMPLEQ_ENTRY(TCGLabel) next;
120 };
121 
122 typedef struct TCGPool {
123     struct TCGPool *next;
124     int size;
125     uint8_t data[] __attribute__ ((aligned));
126 } TCGPool;
127 
128 #define TCG_POOL_CHUNK_SIZE 32768
129 
130 #define TCG_MAX_TEMPS 512
131 #define TCG_MAX_INSNS 512
132 
133 /* when the size of the arguments of a called function is smaller than
134    this value, they are statically allocated in the TB stack frame */
135 #define TCG_STATIC_CALL_ARGS_SIZE 128
136 
137 typedef enum TCGType {
138     TCG_TYPE_I32,
139     TCG_TYPE_I64,
140     TCG_TYPE_I128,
141 
142     TCG_TYPE_V64,
143     TCG_TYPE_V128,
144     TCG_TYPE_V256,
145 
146     /* Number of different types (integer not enum) */
147 #define TCG_TYPE_COUNT  (TCG_TYPE_V256 + 1)
148 
149     /* An alias for the size of the host register.  */
150 #if TCG_TARGET_REG_BITS == 32
151     TCG_TYPE_REG = TCG_TYPE_I32,
152 #else
153     TCG_TYPE_REG = TCG_TYPE_I64,
154 #endif
155 
156     /* An alias for the size of the native pointer.  */
157 #if UINTPTR_MAX == UINT32_MAX
158     TCG_TYPE_PTR = TCG_TYPE_I32,
159 #else
160     TCG_TYPE_PTR = TCG_TYPE_I64,
161 #endif
162 } TCGType;
163 
164 /**
165  * tcg_type_size
166  * @t: type
167  *
168  * Return the size of the type in bytes.
169  */
170 static inline int tcg_type_size(TCGType t)
171 {
172     unsigned i = t;
173     if (i >= TCG_TYPE_V64) {
174         tcg_debug_assert(i < TCG_TYPE_COUNT);
175         i -= TCG_TYPE_V64 - 1;
176     }
177     return 4 << i;
178 }
179 
180 typedef tcg_target_ulong TCGArg;
181 
182 /* Define type and accessor macros for TCG variables.
183 
184    TCG variables are the inputs and outputs of TCG ops, as described
185    in tcg/README. Target CPU front-end code uses these types to deal
186    with TCG variables as it emits TCG code via the tcg_gen_* functions.
187    They come in several flavours:
188     * TCGv_i32  : 32 bit integer type
189     * TCGv_i64  : 64 bit integer type
190     * TCGv_i128 : 128 bit integer type
191     * TCGv_ptr  : a host pointer type
192     * TCGv_vec  : a host vector type; the exact size is not exposed
193                   to the CPU front-end code.
194     * TCGv      : an integer type the same size as target_ulong
195                   (an alias for either TCGv_i32 or TCGv_i64)
196    The compiler's type checking will complain if you mix them
197    up and pass the wrong sized TCGv to a function.
198 
199    Users of tcg_gen_* don't need to know about any of the internal
200    details of these, and should treat them as opaque types.
201    You won't be able to look inside them in a debugger either.
202 
203    Internal implementation details follow:
204 
205    Note that there is no definition of the structs TCGv_i32_d etc anywhere.
206    This is deliberate, because the values we store in variables of type
207    TCGv_i32 are not really pointers-to-structures. They're just small
208    integers, but keeping them in pointer types like this means that the
209    compiler will complain if you accidentally pass a TCGv_i32 to a
210    function which takes a TCGv_i64, and so on. Only the internals of
211    TCG need to care about the actual contents of the types.  */
212 
213 typedef struct TCGv_i32_d *TCGv_i32;
214 typedef struct TCGv_i64_d *TCGv_i64;
215 typedef struct TCGv_i128_d *TCGv_i128;
216 typedef struct TCGv_ptr_d *TCGv_ptr;
217 typedef struct TCGv_vec_d *TCGv_vec;
218 typedef TCGv_ptr TCGv_env;
219 
220 /* call flags */
221 /* Helper does not read globals (either directly or through an exception). It
222    implies TCG_CALL_NO_WRITE_GLOBALS. */
223 #define TCG_CALL_NO_READ_GLOBALS    0x0001
224 /* Helper does not write globals */
225 #define TCG_CALL_NO_WRITE_GLOBALS   0x0002
226 /* Helper can be safely suppressed if the return value is not used. */
227 #define TCG_CALL_NO_SIDE_EFFECTS    0x0004
228 /* Helper is G_NORETURN.  */
229 #define TCG_CALL_NO_RETURN          0x0008
230 
231 /* convenience version of most used call flags */
232 #define TCG_CALL_NO_RWG         TCG_CALL_NO_READ_GLOBALS
233 #define TCG_CALL_NO_WG          TCG_CALL_NO_WRITE_GLOBALS
234 #define TCG_CALL_NO_SE          TCG_CALL_NO_SIDE_EFFECTS
235 #define TCG_CALL_NO_RWG_SE      (TCG_CALL_NO_RWG | TCG_CALL_NO_SE)
236 #define TCG_CALL_NO_WG_SE       (TCG_CALL_NO_WG | TCG_CALL_NO_SE)
237 
238 /*
239  * Flags for the bswap opcodes.
240  * If IZ, the input is zero-extended, otherwise unknown.
241  * If OZ or OS, the output is zero- or sign-extended respectively,
242  * otherwise the high bits are undefined.
243  */
244 enum {
245     TCG_BSWAP_IZ = 1,
246     TCG_BSWAP_OZ = 2,
247     TCG_BSWAP_OS = 4,
248 };
249 
250 typedef enum TCGTempVal {
251     TEMP_VAL_DEAD,
252     TEMP_VAL_REG,
253     TEMP_VAL_MEM,
254     TEMP_VAL_CONST,
255 } TCGTempVal;
256 
257 typedef enum TCGTempKind {
258     /*
259      * Temp is dead at the end of the extended basic block (EBB),
260      * the single-entry multiple-exit region that falls through
261      * conditional branches.
262      */
263     TEMP_EBB,
264     /* Temp is live across the entire translation block, but dead at end. */
265     TEMP_TB,
266     /* Temp is live across the entire translation block, and between them. */
267     TEMP_GLOBAL,
268     /* Temp is in a fixed register. */
269     TEMP_FIXED,
270     /* Temp is a fixed constant. */
271     TEMP_CONST,
272 } TCGTempKind;
273 
274 typedef struct TCGTemp {
275     TCGReg reg:8;
276     TCGTempVal val_type:8;
277     TCGType base_type:8;
278     TCGType type:8;
279     TCGTempKind kind:3;
280     unsigned int indirect_reg:1;
281     unsigned int indirect_base:1;
282     unsigned int mem_coherent:1;
283     unsigned int mem_allocated:1;
284     unsigned int temp_allocated:1;
285     unsigned int temp_subindex:2;
286 
287     int64_t val;
288     struct TCGTemp *mem_base;
289     intptr_t mem_offset;
290     const char *name;
291 
292     /* Pass-specific information that can be stored for a temporary.
293        One word worth of integer data, and one pointer to data
294        allocated separately.  */
295     uintptr_t state;
296     void *state_ptr;
297 } TCGTemp;
298 
299 typedef struct TCGContext TCGContext;
300 
301 typedef struct TCGTempSet {
302     unsigned long l[BITS_TO_LONGS(TCG_MAX_TEMPS)];
303 } TCGTempSet;
304 
305 /*
306  * With 1 128-bit output, a 32-bit host requires 4 output parameters,
307  * which leaves a maximum of 28 other slots.  Which is enough for 7
308  * 128-bit operands.
309  */
310 #define DEAD_ARG  (1 << 4)
311 #define SYNC_ARG  (1 << 0)
312 typedef uint32_t TCGLifeData;
313 
314 struct TCGOp {
315     TCGOpcode opc   : 8;
316     unsigned nargs  : 8;
317 
318     /* Parameters for this opcode.  See below.  */
319     unsigned param1 : 8;
320     unsigned param2 : 8;
321 
322     /* Lifetime data of the operands.  */
323     TCGLifeData life;
324 
325     /* Next and previous opcodes.  */
326     QTAILQ_ENTRY(TCGOp) link;
327 
328     /* Register preferences for the output(s).  */
329     TCGRegSet output_pref[2];
330 
331     /* Arguments for the opcode.  */
332     TCGArg args[];
333 };
334 
335 #define TCGOP_CALLI(X)    (X)->param1
336 #define TCGOP_CALLO(X)    (X)->param2
337 
338 #define TCGOP_TYPE(X)     (X)->param1
339 #define TCGOP_FLAGS(X)    (X)->param2
340 #define TCGOP_VECE(X)     (X)->param2
341 
342 /* Make sure operands fit in the bitfields above.  */
343 QEMU_BUILD_BUG_ON(NB_OPS > (1 << 8));
344 
345 static inline TCGRegSet output_pref(const TCGOp *op, unsigned i)
346 {
347     return i < ARRAY_SIZE(op->output_pref) ? op->output_pref[i] : 0;
348 }
349 
350 struct TCGContext {
351     uint8_t *pool_cur, *pool_end;
352     TCGPool *pool_first, *pool_current, *pool_first_large;
353     int nb_labels;
354     int nb_globals;
355     int nb_temps;
356     int nb_indirects;
357     int nb_ops;
358     TCGType addr_type;            /* TCG_TYPE_I32 or TCG_TYPE_I64 */
359 
360     int page_mask;
361     uint8_t page_bits;
362     uint8_t tlb_dyn_max_bits;
363     TCGBar guest_mo;
364 
365     TCGRegSet reserved_regs;
366     intptr_t current_frame_offset;
367     intptr_t frame_start;
368     intptr_t frame_end;
369     TCGTemp *frame_temp;
370 
371     TranslationBlock *gen_tb;     /* tb for which code is being generated */
372     tcg_insn_unit *code_buf;      /* pointer for start of tb */
373     tcg_insn_unit *code_ptr;      /* pointer for running end of tb */
374 
375 #ifdef CONFIG_DEBUG_TCG
376     int goto_tb_issue_mask;
377     const TCGOpcode *vecop_list;
378 #endif
379 
380     /* Code generation.  Note that we specifically do not use tcg_insn_unit
381        here, because there's too much arithmetic throughout that relies
382        on addition and subtraction working on bytes.  Rely on the GCC
383        extension that allows arithmetic on void*.  */
384     void *code_gen_buffer;
385     size_t code_gen_buffer_size;
386     void *code_gen_ptr;
387     void *data_gen_ptr;
388 
389     /* Threshold to flush the translated code buffer.  */
390     void *code_gen_highwater;
391 
392     /* Track which vCPU triggers events */
393     CPUState *cpu;                      /* *_trans */
394 
395     /* These structures are private to tcg-target.c.inc.  */
396     QSIMPLEQ_HEAD(, TCGLabelQemuLdst) ldst_labels;
397     struct TCGLabelPoolData *pool_labels;
398 
399     TCGLabel *exitreq_label;
400 
401 #ifdef CONFIG_PLUGIN
402     /*
403      * We keep one plugin_tb struct per TCGContext. Note that on every TB
404      * translation we clear but do not free its contents; this way we
405      * avoid a lot of malloc/free churn, since after a few TB's it's
406      * unlikely that we'll need to allocate either more instructions or more
407      * space for instructions (for variable-instruction-length ISAs).
408      */
409     struct qemu_plugin_tb *plugin_tb;
410     const struct DisasContextBase *plugin_db;
411 
412     /* descriptor of the instruction being translated */
413     struct qemu_plugin_insn *plugin_insn;
414 #endif
415 
416     /* For host-specific values. */
417 #ifdef __riscv
418     MemOp riscv_cur_vsew;
419     TCGType riscv_cur_type;
420 #endif
421     /*
422      * During the tcg_reg_alloc_op loop, we are within a sequence of
423      * carry-using opcodes like addco+addci.
424      */
425     bool carry_live;
426 
427     GHashTable *const_table[TCG_TYPE_COUNT];
428     TCGTempSet free_temps[TCG_TYPE_COUNT];
429     TCGTemp temps[TCG_MAX_TEMPS]; /* globals first, temps after */
430 
431     QTAILQ_HEAD(, TCGOp) ops, free_ops;
432     QSIMPLEQ_HEAD(, TCGLabel) labels;
433 
434     /*
435      * When clear, new ops are added to the tail of @ops.
436      * When set, new ops are added in front of @emit_before_op.
437      */
438     TCGOp *emit_before_op;
439 
440     /* Tells which temporary holds a given register.
441        It does not take into account fixed registers */
442     TCGTemp *reg_to_temp[TCG_TARGET_NB_REGS];
443 
444     uint16_t gen_insn_end_off[TCG_MAX_INSNS];
445     uint64_t *gen_insn_data;
446 
447     /* Exit to translator on overflow. */
448     sigjmp_buf jmp_trans;
449 };
450 
451 static inline bool temp_readonly(TCGTemp *ts)
452 {
453     return ts->kind >= TEMP_FIXED;
454 }
455 
456 #ifdef CONFIG_USER_ONLY
457 extern bool tcg_use_softmmu;
458 #else
459 #define tcg_use_softmmu  true
460 #endif
461 
462 extern __thread TCGContext *tcg_ctx;
463 extern const void *tcg_code_gen_epilogue;
464 extern uintptr_t tcg_splitwx_diff;
465 extern TCGv_env tcg_env;
466 
467 bool in_code_gen_buffer(const void *p);
468 
469 #ifdef CONFIG_DEBUG_TCG
470 const void *tcg_splitwx_to_rx(void *rw);
471 void *tcg_splitwx_to_rw(const void *rx);
472 #else
473 static inline const void *tcg_splitwx_to_rx(void *rw)
474 {
475     return rw ? rw + tcg_splitwx_diff : NULL;
476 }
477 
478 static inline void *tcg_splitwx_to_rw(const void *rx)
479 {
480     return rx ? (void *)rx - tcg_splitwx_diff : NULL;
481 }
482 #endif
483 
484 static inline TCGArg temp_arg(TCGTemp *ts)
485 {
486     return (uintptr_t)ts;
487 }
488 
489 static inline TCGTemp *arg_temp(TCGArg a)
490 {
491     return (TCGTemp *)(uintptr_t)a;
492 }
493 
494 #ifdef CONFIG_DEBUG_TCG
495 size_t temp_idx(TCGTemp *ts);
496 TCGTemp *tcgv_i32_temp(TCGv_i32 v);
497 #else
498 static inline size_t temp_idx(TCGTemp *ts)
499 {
500     return ts - tcg_ctx->temps;
501 }
502 
503 /*
504  * Using the offset of a temporary, relative to TCGContext, rather than
505  * its index means that we don't use 0.  That leaves offset 0 free for
506  * a NULL representation without having to leave index 0 unused.
507  */
508 static inline TCGTemp *tcgv_i32_temp(TCGv_i32 v)
509 {
510     return (void *)tcg_ctx + (uintptr_t)v;
511 }
512 #endif
513 
514 static inline TCGTemp *tcgv_i64_temp(TCGv_i64 v)
515 {
516     return tcgv_i32_temp((TCGv_i32)v);
517 }
518 
519 static inline TCGTemp *tcgv_i128_temp(TCGv_i128 v)
520 {
521     return tcgv_i32_temp((TCGv_i32)v);
522 }
523 
524 static inline TCGTemp *tcgv_ptr_temp(TCGv_ptr v)
525 {
526     return tcgv_i32_temp((TCGv_i32)v);
527 }
528 
529 static inline TCGTemp *tcgv_vec_temp(TCGv_vec v)
530 {
531     return tcgv_i32_temp((TCGv_i32)v);
532 }
533 
534 static inline TCGArg tcgv_i32_arg(TCGv_i32 v)
535 {
536     return temp_arg(tcgv_i32_temp(v));
537 }
538 
539 static inline TCGArg tcgv_i64_arg(TCGv_i64 v)
540 {
541     return temp_arg(tcgv_i64_temp(v));
542 }
543 
544 static inline TCGArg tcgv_i128_arg(TCGv_i128 v)
545 {
546     return temp_arg(tcgv_i128_temp(v));
547 }
548 
549 static inline TCGArg tcgv_ptr_arg(TCGv_ptr v)
550 {
551     return temp_arg(tcgv_ptr_temp(v));
552 }
553 
554 static inline TCGArg tcgv_vec_arg(TCGv_vec v)
555 {
556     return temp_arg(tcgv_vec_temp(v));
557 }
558 
559 static inline TCGv_i32 temp_tcgv_i32(TCGTemp *t)
560 {
561     (void)temp_idx(t); /* trigger embedded assert */
562     return (TCGv_i32)((void *)t - (void *)tcg_ctx);
563 }
564 
565 static inline TCGv_i64 temp_tcgv_i64(TCGTemp *t)
566 {
567     return (TCGv_i64)temp_tcgv_i32(t);
568 }
569 
570 static inline TCGv_i128 temp_tcgv_i128(TCGTemp *t)
571 {
572     return (TCGv_i128)temp_tcgv_i32(t);
573 }
574 
575 static inline TCGv_ptr temp_tcgv_ptr(TCGTemp *t)
576 {
577     return (TCGv_ptr)temp_tcgv_i32(t);
578 }
579 
580 static inline TCGv_vec temp_tcgv_vec(TCGTemp *t)
581 {
582     return (TCGv_vec)temp_tcgv_i32(t);
583 }
584 
585 static inline TCGArg tcg_get_insn_param(TCGOp *op, unsigned arg)
586 {
587     return op->args[arg];
588 }
589 
590 static inline void tcg_set_insn_param(TCGOp *op, unsigned arg, TCGArg v)
591 {
592     op->args[arg] = v;
593 }
594 
595 static inline uint64_t tcg_get_insn_start_param(TCGOp *op, unsigned arg)
596 {
597     tcg_debug_assert(arg < INSN_START_WORDS);
598     if (TCG_TARGET_REG_BITS == 64) {
599         return tcg_get_insn_param(op, arg);
600     } else {
601         return deposit64(tcg_get_insn_param(op, arg * 2), 32, 32,
602                          tcg_get_insn_param(op, arg * 2 + 1));
603     }
604 }
605 
606 static inline void tcg_set_insn_start_param(TCGOp *op, unsigned arg, uint64_t v)
607 {
608     tcg_debug_assert(arg < INSN_START_WORDS);
609     if (TCG_TARGET_REG_BITS == 64) {
610         tcg_set_insn_param(op, arg, v);
611     } else {
612         tcg_set_insn_param(op, arg * 2, v);
613         tcg_set_insn_param(op, arg * 2 + 1, v >> 32);
614     }
615 }
616 
617 /* The last op that was emitted.  */
618 static inline TCGOp *tcg_last_op(void)
619 {
620     return QTAILQ_LAST(&tcg_ctx->ops);
621 }
622 
623 /* Test for whether to terminate the TB for using too many opcodes.  */
624 static inline bool tcg_op_buf_full(void)
625 {
626     /* This is not a hard limit, it merely stops translation when
627      * we have produced "enough" opcodes.  We want to limit TB size
628      * such that a RISC host can reasonably use a 16-bit signed
629      * branch within the TB.  We also need to be mindful of the
630      * 16-bit unsigned offsets, TranslationBlock.jmp_reset_offset[]
631      * and TCGContext.gen_insn_end_off[].
632      */
633     return tcg_ctx->nb_ops >= 4000;
634 }
635 
636 /* pool based memory allocation */
637 
638 /* user-mode: mmap_lock must be held for tcg_malloc_internal. */
639 void *tcg_malloc_internal(TCGContext *s, int size);
640 void tcg_pool_reset(TCGContext *s);
641 TranslationBlock *tcg_tb_alloc(TCGContext *s);
642 
643 void tcg_region_reset_all(void);
644 
645 size_t tcg_code_size(void);
646 size_t tcg_code_capacity(void);
647 
648 /**
649  * tcg_tb_insert:
650  * @tb: translation block to insert
651  *
652  * Insert @tb into the region trees.
653  */
654 void tcg_tb_insert(TranslationBlock *tb);
655 
656 /**
657  * tcg_tb_remove:
658  * @tb: translation block to remove
659  *
660  * Remove @tb from the region trees.
661  */
662 void tcg_tb_remove(TranslationBlock *tb);
663 
664 /**
665  * tcg_tb_lookup:
666  * @tc_ptr: host PC to look up
667  *
668  * Look up a translation block inside the region trees by @tc_ptr. This is
669  * useful for exception handling, but must not be used for the purposes of
670  * executing the returned translation block. See struct tb_tc for more
671  * information.
672  *
673  * Returns: a translation block previously inserted into the region trees,
674  * such that @tc_ptr points anywhere inside the code generated for it, or
675  * NULL.
676  */
677 TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr);
678 
679 /**
680  * tcg_tb_foreach:
681  * @func: callback
682  * @user_data: opaque value to pass to @callback
683  *
684  * Call @func for each translation block inserted into the region trees.
685  */
686 void tcg_tb_foreach(GTraverseFunc func, gpointer user_data);
687 
688 /**
689  * tcg_nb_tbs:
690  *
691  * Returns: the number of translation blocks inserted into the region trees.
692  */
693 size_t tcg_nb_tbs(void);
694 
695 /* user-mode: Called with mmap_lock held.  */
696 static inline void *tcg_malloc(int size)
697 {
698     TCGContext *s = tcg_ctx;
699     uint8_t *ptr, *ptr_end;
700 
701     /* ??? This is a weak placeholder for minimum malloc alignment.  */
702     size = QEMU_ALIGN_UP(size, 8);
703 
704     ptr = s->pool_cur;
705     ptr_end = ptr + size;
706     if (unlikely(ptr_end > s->pool_end)) {
707         return tcg_malloc_internal(tcg_ctx, size);
708     } else {
709         s->pool_cur = ptr_end;
710         return ptr;
711     }
712 }
713 
714 void tcg_func_start(TCGContext *s);
715 
716 int tcg_gen_code(TCGContext *s, TranslationBlock *tb, uint64_t pc_start);
717 
718 void tb_target_set_jmp_target(const TranslationBlock *, int,
719                               uintptr_t, uintptr_t);
720 
721 void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size);
722 
723 #define TCG_CT_CONST      1  /* any constant of register size */
724 #define TCG_CT_REG_ZERO   2  /* zero, in TCG_REG_ZERO */
725 
726 typedef struct TCGArgConstraint {
727     unsigned ct : 16;
728     unsigned alias_index : 4;
729     unsigned sort_index : 4;
730     unsigned pair_index : 4;
731     unsigned pair : 2;  /* 0: none, 1: first, 2: second, 3: second alias */
732     bool oalias : 1;
733     bool ialias : 1;
734     bool newreg : 1;
735     TCGRegSet regs;
736 } TCGArgConstraint;
737 
738 #define TCG_MAX_OP_ARGS 16
739 
740 /* Bits for TCGOpDef->flags, 8 bits available, all used.  */
741 enum {
742     /* Instruction exits the translation block.  */
743     TCG_OPF_BB_EXIT      = 0x01,
744     /* Instruction defines the end of a basic block.  */
745     TCG_OPF_BB_END       = 0x02,
746     /* Instruction clobbers call registers and potentially update globals.  */
747     TCG_OPF_CALL_CLOBBER = 0x04,
748     /* Instruction has side effects: it cannot be removed if its outputs
749        are not used, and might trigger exceptions.  */
750     TCG_OPF_SIDE_EFFECTS = 0x08,
751     /* Instruction operands may be I32 or I64 */
752     TCG_OPF_INT          = 0x10,
753     /* Instruction is optional and not implemented by the host, or insn
754        is generic and should not be implemented by the host.  */
755     TCG_OPF_NOT_PRESENT  = 0x20,
756     /* Instruction operands are vectors.  */
757     TCG_OPF_VECTOR       = 0x40,
758     /* Instruction is a conditional branch. */
759     TCG_OPF_COND_BRANCH  = 0x80,
760     /* Instruction produces carry out. */
761     TCG_OPF_CARRY_OUT    = 0x100,
762     /* Instruction consumes carry in. */
763     TCG_OPF_CARRY_IN     = 0x200,
764 };
765 
766 typedef struct TCGOpDef {
767     const char *name;
768     uint8_t nb_oargs, nb_iargs, nb_cargs, nb_args;
769     uint16_t flags;
770 } TCGOpDef;
771 
772 extern const TCGOpDef tcg_op_defs[];
773 extern const size_t tcg_op_defs_max;
774 
775 /*
776  * tcg_op_supported:
777  * Query if @op, for @type and @flags, is supported by the host
778  * on which we are currently executing.
779  */
780 bool tcg_op_supported(TCGOpcode op, TCGType type, unsigned flags);
781 /*
782  * tcg_op_deposit_valid:
783  * Query if a deposit into (ofs, len) is supported for @type by
784  * the host on which we are currently executing.
785  */
786 bool tcg_op_deposit_valid(TCGType type, unsigned ofs, unsigned len);
787 
788 void tcg_gen_call0(void *func, TCGHelperInfo *, TCGTemp *ret);
789 void tcg_gen_call1(void *func, TCGHelperInfo *, TCGTemp *ret, TCGTemp *);
790 void tcg_gen_call2(void *func, TCGHelperInfo *, TCGTemp *ret,
791                    TCGTemp *, TCGTemp *);
792 void tcg_gen_call3(void *func, TCGHelperInfo *, TCGTemp *ret,
793                    TCGTemp *, TCGTemp *, TCGTemp *);
794 void tcg_gen_call4(void *func, TCGHelperInfo *, TCGTemp *ret,
795                    TCGTemp *, TCGTemp *, TCGTemp *, TCGTemp *);
796 void tcg_gen_call5(void *func, TCGHelperInfo *, TCGTemp *ret,
797                    TCGTemp *, TCGTemp *, TCGTemp *, TCGTemp *, TCGTemp *);
798 void tcg_gen_call6(void *func, TCGHelperInfo *, TCGTemp *ret,
799                    TCGTemp *, TCGTemp *, TCGTemp *, TCGTemp *,
800                    TCGTemp *, TCGTemp *);
801 void tcg_gen_call7(void *func, TCGHelperInfo *, TCGTemp *ret,
802                    TCGTemp *, TCGTemp *, TCGTemp *, TCGTemp *,
803                    TCGTemp *, TCGTemp *, TCGTemp *);
804 
805 TCGOp *tcg_emit_op(TCGOpcode opc, unsigned nargs);
806 void tcg_op_remove(TCGContext *s, TCGOp *op);
807 
808 /**
809  * tcg_remove_ops_after:
810  * @op: target operation
811  *
812  * Discard any opcodes emitted since @op.  Expected usage is to save
813  * a starting point with tcg_last_op(), speculatively emit opcodes,
814  * then decide whether or not to keep those opcodes after the fact.
815  */
816 void tcg_remove_ops_after(TCGOp *op);
817 
818 void tcg_optimize(TCGContext *s);
819 
820 TCGLabel *gen_new_label(void);
821 
822 /**
823  * label_arg
824  * @l: label
825  *
826  * Encode a label for storage in the TCG opcode stream.
827  */
828 
829 static inline TCGArg label_arg(TCGLabel *l)
830 {
831     return (uintptr_t)l;
832 }
833 
834 /**
835  * arg_label
836  * @i: value
837  *
838  * The opposite of label_arg.  Retrieve a label from the
839  * encoding of the TCG opcode stream.
840  */
841 
842 static inline TCGLabel *arg_label(TCGArg i)
843 {
844     return (TCGLabel *)(uintptr_t)i;
845 }
846 
847 /**
848  * tcg_ptr_byte_diff
849  * @a, @b: addresses to be differenced
850  *
851  * There are many places within the TCG backends where we need a byte
852  * difference between two pointers.  While this can be accomplished
853  * with local casting, it's easy to get wrong -- especially if one is
854  * concerned with the signedness of the result.
855  *
856  * This version relies on GCC's void pointer arithmetic to get the
857  * correct result.
858  */
859 
860 static inline ptrdiff_t tcg_ptr_byte_diff(const void *a, const void *b)
861 {
862     return a - b;
863 }
864 
865 /**
866  * tcg_pcrel_diff
867  * @s: the tcg context
868  * @target: address of the target
869  *
870  * Produce a pc-relative difference, from the current code_ptr
871  * to the destination address.
872  */
873 
874 static inline ptrdiff_t tcg_pcrel_diff(TCGContext *s, const void *target)
875 {
876     return tcg_ptr_byte_diff(target, tcg_splitwx_to_rx(s->code_ptr));
877 }
878 
879 /**
880  * tcg_tbrel_diff
881  * @s: the tcg context
882  * @target: address of the target
883  *
884  * Produce a difference, from the beginning of the current TB code
885  * to the destination address.
886  */
887 static inline ptrdiff_t tcg_tbrel_diff(TCGContext *s, const void *target)
888 {
889     return tcg_ptr_byte_diff(target, tcg_splitwx_to_rx(s->code_buf));
890 }
891 
892 /**
893  * tcg_current_code_size
894  * @s: the tcg context
895  *
896  * Compute the current code size within the translation block.
897  * This is used to fill in qemu's data structures for goto_tb.
898  */
899 
900 static inline size_t tcg_current_code_size(TCGContext *s)
901 {
902     return tcg_ptr_byte_diff(s->code_ptr, s->code_buf);
903 }
904 
905 /**
906  * tcg_qemu_tb_exec:
907  * @env: pointer to CPUArchState for the CPU
908  * @tb_ptr: address of generated code for the TB to execute
909  *
910  * Start executing code from a given translation block.
911  * Where translation blocks have been linked, execution
912  * may proceed from the given TB into successive ones.
913  * Control eventually returns only when some action is needed
914  * from the top-level loop: either control must pass to a TB
915  * which has not yet been directly linked, or an asynchronous
916  * event such as an interrupt needs handling.
917  *
918  * Return: The return value is the value passed to the corresponding
919  * tcg_gen_exit_tb() at translation time of the last TB attempted to execute.
920  * The value is either zero or a 4-byte aligned pointer to that TB combined
921  * with additional information in its two least significant bits. The
922  * additional information is encoded as follows:
923  *  0, 1: the link between this TB and the next is via the specified
924  *        TB index (0 or 1). That is, we left the TB via (the equivalent
925  *        of) "goto_tb <index>". The main loop uses this to determine
926  *        how to link the TB just executed to the next.
927  *  2:    we are using instruction counting code generation, and we
928  *        did not start executing this TB because the instruction counter
929  *        would hit zero midway through it. In this case the pointer
930  *        returned is the TB we were about to execute, and the caller must
931  *        arrange to execute the remaining count of instructions.
932  *  3:    we stopped because the CPU's exit_request flag was set
933  *        (usually meaning that there is an interrupt that needs to be
934  *        handled). The pointer returned is the TB we were about to execute
935  *        when we noticed the pending exit request.
936  *
937  * If the bottom two bits indicate an exit-via-index then the CPU
938  * state is correctly synchronised and ready for execution of the next
939  * TB (and in particular the guest PC is the address to execute next).
940  * Otherwise, we gave up on execution of this TB before it started, and
941  * the caller must fix up the CPU state by calling the CPU's
942  * synchronize_from_tb() method with the TB pointer we return (falling
943  * back to calling the CPU's set_pc method with tb->pb if no
944  * synchronize_from_tb() method exists).
945  *
946  * Note that TCG targets may use a different definition of tcg_qemu_tb_exec
947  * to this default (which just calls the prologue.code emitted by
948  * tcg_target_qemu_prologue()).
949  */
950 #define TB_EXIT_MASK      3
951 #define TB_EXIT_IDX0      0
952 #define TB_EXIT_IDX1      1
953 #define TB_EXIT_IDXMAX    1
954 #define TB_EXIT_REQUESTED 3
955 
956 #ifdef CONFIG_TCG_INTERPRETER
957 uintptr_t tcg_qemu_tb_exec(CPUArchState *env, const void *tb_ptr);
958 #else
959 typedef uintptr_t tcg_prologue_fn(CPUArchState *env, const void *tb_ptr);
960 extern tcg_prologue_fn *tcg_qemu_tb_exec;
961 #endif
962 
963 void tcg_register_jit(const void *buf, size_t buf_size);
964 
965 /* Return zero if the tuple (opc, type, vece) is unsupportable;
966    return > 0 if it is directly supportable;
967    return < 0 if we must call tcg_expand_vec_op.  */
968 int tcg_can_emit_vec_op(TCGOpcode, TCGType, unsigned);
969 
970 /* Expand the tuple (opc, type, vece) on the given arguments.  */
971 void tcg_expand_vec_op(TCGOpcode, TCGType, unsigned, TCGArg, ...);
972 
973 /* Replicate a constant C according to the log2 of the element size.  */
974 uint64_t dup_const(unsigned vece, uint64_t c);
975 
976 #define dup_const(VECE, C)                                         \
977     (__builtin_constant_p(VECE)                                    \
978      ? (  (VECE) == MO_8  ? 0x0101010101010101ull * (uint8_t)(C)   \
979         : (VECE) == MO_16 ? 0x0001000100010001ull * (uint16_t)(C)  \
980         : (VECE) == MO_32 ? 0x0000000100000001ull * (uint32_t)(C)  \
981         : (VECE) == MO_64 ? (uint64_t)(C)                          \
982         : (qemu_build_not_reached_always(), 0))                    \
983      : dup_const(VECE, C))
984 
985 static inline const TCGOpcode *tcg_swap_vecop_list(const TCGOpcode *n)
986 {
987 #ifdef CONFIG_DEBUG_TCG
988     const TCGOpcode *o = tcg_ctx->vecop_list;
989     tcg_ctx->vecop_list = n;
990     return o;
991 #else
992     return NULL;
993 #endif
994 }
995 
996 bool tcg_can_emit_vecop_list(const TCGOpcode *, TCGType, unsigned);
997 void tcg_dump_ops(TCGContext *s, FILE *f, bool have_prefs);
998 
999 #endif /* TCG_H */
1000