18c033f24SRichard Henderson /* SPDX-License-Identifier: MIT */ 28c033f24SRichard Henderson /* 38c033f24SRichard Henderson * Define target-specific opcode support 48c033f24SRichard Henderson * Copyright (c) 2008 Fabrice Bellard 58c033f24SRichard Henderson */ 68c033f24SRichard Henderson 78c033f24SRichard Henderson #ifndef TCG_TARGET_HAS_H 88c033f24SRichard Henderson #define TCG_TARGET_HAS_H 98c033f24SRichard Henderson 108c033f24SRichard Henderson #include "host/cpuinfo.h" 118c033f24SRichard Henderson 128c033f24SRichard Henderson #define have_bmi1 (cpuinfo & CPUINFO_BMI1) 138c033f24SRichard Henderson #define have_popcnt (cpuinfo & CPUINFO_POPCNT) 148c033f24SRichard Henderson #define have_avx1 (cpuinfo & CPUINFO_AVX1) 158c033f24SRichard Henderson #define have_avx2 (cpuinfo & CPUINFO_AVX2) 168c033f24SRichard Henderson #define have_movbe (cpuinfo & CPUINFO_MOVBE) 178c033f24SRichard Henderson 188c033f24SRichard Henderson /* 198c033f24SRichard Henderson * There are interesting instructions in AVX512, so long as we have AVX512VL, 208c033f24SRichard Henderson * which indicates support for EVEX on sizes smaller than 512 bits. 218c033f24SRichard Henderson */ 228c033f24SRichard Henderson #define have_avx512vl ((cpuinfo & CPUINFO_AVX512VL) && \ 238c033f24SRichard Henderson (cpuinfo & CPUINFO_AVX512F)) 248c033f24SRichard Henderson #define have_avx512bw ((cpuinfo & CPUINFO_AVX512BW) && have_avx512vl) 258c033f24SRichard Henderson #define have_avx512dq ((cpuinfo & CPUINFO_AVX512DQ) && have_avx512vl) 268c033f24SRichard Henderson #define have_avx512vbmi2 ((cpuinfo & CPUINFO_AVX512VBMI2) && have_avx512vl) 278c033f24SRichard Henderson 288c033f24SRichard Henderson /* optional instructions */ 298c033f24SRichard Henderson #define TCG_TARGET_HAS_div2_i32 1 308c033f24SRichard Henderson #define TCG_TARGET_HAS_rot_i32 1 318c033f24SRichard Henderson #define TCG_TARGET_HAS_ext8s_i32 1 328c033f24SRichard Henderson #define TCG_TARGET_HAS_ext16s_i32 1 338c033f24SRichard Henderson #define TCG_TARGET_HAS_ext8u_i32 1 348c033f24SRichard Henderson #define TCG_TARGET_HAS_ext16u_i32 1 358c033f24SRichard Henderson #define TCG_TARGET_HAS_bswap16_i32 1 368c033f24SRichard Henderson #define TCG_TARGET_HAS_bswap32_i32 1 378c033f24SRichard Henderson #define TCG_TARGET_HAS_not_i32 1 388c033f24SRichard Henderson #define TCG_TARGET_HAS_andc_i32 have_bmi1 398c033f24SRichard Henderson #define TCG_TARGET_HAS_orc_i32 0 408c033f24SRichard Henderson #define TCG_TARGET_HAS_eqv_i32 0 418c033f24SRichard Henderson #define TCG_TARGET_HAS_nand_i32 0 428c033f24SRichard Henderson #define TCG_TARGET_HAS_nor_i32 0 438c033f24SRichard Henderson #define TCG_TARGET_HAS_clz_i32 1 448c033f24SRichard Henderson #define TCG_TARGET_HAS_ctz_i32 1 458c033f24SRichard Henderson #define TCG_TARGET_HAS_ctpop_i32 have_popcnt 468c033f24SRichard Henderson #define TCG_TARGET_HAS_deposit_i32 1 478c033f24SRichard Henderson #define TCG_TARGET_HAS_extract_i32 1 488c033f24SRichard Henderson #define TCG_TARGET_HAS_sextract_i32 1 498c033f24SRichard Henderson #define TCG_TARGET_HAS_extract2_i32 1 508c033f24SRichard Henderson #define TCG_TARGET_HAS_negsetcond_i32 1 518c033f24SRichard Henderson #define TCG_TARGET_HAS_add2_i32 1 528c033f24SRichard Henderson #define TCG_TARGET_HAS_sub2_i32 1 538c033f24SRichard Henderson #define TCG_TARGET_HAS_mulu2_i32 1 548c033f24SRichard Henderson #define TCG_TARGET_HAS_muls2_i32 1 558c033f24SRichard Henderson #define TCG_TARGET_HAS_muluh_i32 0 568c033f24SRichard Henderson #define TCG_TARGET_HAS_mulsh_i32 0 578c033f24SRichard Henderson 588c033f24SRichard Henderson #if TCG_TARGET_REG_BITS == 64 598c033f24SRichard Henderson /* Keep 32-bit values zero-extended in a register. */ 608c033f24SRichard Henderson #define TCG_TARGET_HAS_extr_i64_i32 1 618c033f24SRichard Henderson #define TCG_TARGET_HAS_div2_i64 1 628c033f24SRichard Henderson #define TCG_TARGET_HAS_rot_i64 1 638c033f24SRichard Henderson #define TCG_TARGET_HAS_ext8s_i64 1 648c033f24SRichard Henderson #define TCG_TARGET_HAS_ext16s_i64 1 658c033f24SRichard Henderson #define TCG_TARGET_HAS_ext32s_i64 1 668c033f24SRichard Henderson #define TCG_TARGET_HAS_ext8u_i64 1 678c033f24SRichard Henderson #define TCG_TARGET_HAS_ext16u_i64 1 688c033f24SRichard Henderson #define TCG_TARGET_HAS_ext32u_i64 1 698c033f24SRichard Henderson #define TCG_TARGET_HAS_bswap16_i64 1 708c033f24SRichard Henderson #define TCG_TARGET_HAS_bswap32_i64 1 718c033f24SRichard Henderson #define TCG_TARGET_HAS_bswap64_i64 1 728c033f24SRichard Henderson #define TCG_TARGET_HAS_not_i64 1 738c033f24SRichard Henderson #define TCG_TARGET_HAS_andc_i64 have_bmi1 748c033f24SRichard Henderson #define TCG_TARGET_HAS_orc_i64 0 758c033f24SRichard Henderson #define TCG_TARGET_HAS_eqv_i64 0 768c033f24SRichard Henderson #define TCG_TARGET_HAS_nand_i64 0 778c033f24SRichard Henderson #define TCG_TARGET_HAS_nor_i64 0 788c033f24SRichard Henderson #define TCG_TARGET_HAS_clz_i64 1 798c033f24SRichard Henderson #define TCG_TARGET_HAS_ctz_i64 1 808c033f24SRichard Henderson #define TCG_TARGET_HAS_ctpop_i64 have_popcnt 818c033f24SRichard Henderson #define TCG_TARGET_HAS_deposit_i64 1 828c033f24SRichard Henderson #define TCG_TARGET_HAS_extract_i64 1 83*4bce752cSRichard Henderson #define TCG_TARGET_HAS_sextract_i64 1 848c033f24SRichard Henderson #define TCG_TARGET_HAS_extract2_i64 1 858c033f24SRichard Henderson #define TCG_TARGET_HAS_negsetcond_i64 1 868c033f24SRichard Henderson #define TCG_TARGET_HAS_add2_i64 1 878c033f24SRichard Henderson #define TCG_TARGET_HAS_sub2_i64 1 888c033f24SRichard Henderson #define TCG_TARGET_HAS_mulu2_i64 1 898c033f24SRichard Henderson #define TCG_TARGET_HAS_muls2_i64 1 908c033f24SRichard Henderson #define TCG_TARGET_HAS_muluh_i64 0 918c033f24SRichard Henderson #define TCG_TARGET_HAS_mulsh_i64 0 928c033f24SRichard Henderson #define TCG_TARGET_HAS_qemu_st8_i32 0 938c033f24SRichard Henderson #else 948c033f24SRichard Henderson #define TCG_TARGET_HAS_qemu_st8_i32 1 958c033f24SRichard Henderson #endif 968c033f24SRichard Henderson 978c033f24SRichard Henderson #define TCG_TARGET_HAS_qemu_ldst_i128 \ 988c033f24SRichard Henderson (TCG_TARGET_REG_BITS == 64 && (cpuinfo & CPUINFO_ATOMIC_VMOVDQA)) 998c033f24SRichard Henderson 1008c033f24SRichard Henderson #define TCG_TARGET_HAS_tst 1 1018c033f24SRichard Henderson 1028c033f24SRichard Henderson /* We do not support older SSE systems, only beginning with AVX1. */ 1038c033f24SRichard Henderson #define TCG_TARGET_HAS_v64 have_avx1 1048c033f24SRichard Henderson #define TCG_TARGET_HAS_v128 have_avx1 1058c033f24SRichard Henderson #define TCG_TARGET_HAS_v256 have_avx2 1068c033f24SRichard Henderson 1078c033f24SRichard Henderson #define TCG_TARGET_HAS_andc_vec 1 1088c033f24SRichard Henderson #define TCG_TARGET_HAS_orc_vec have_avx512vl 1098c033f24SRichard Henderson #define TCG_TARGET_HAS_nand_vec have_avx512vl 1108c033f24SRichard Henderson #define TCG_TARGET_HAS_nor_vec have_avx512vl 1118c033f24SRichard Henderson #define TCG_TARGET_HAS_eqv_vec have_avx512vl 1128c033f24SRichard Henderson #define TCG_TARGET_HAS_not_vec have_avx512vl 1138c033f24SRichard Henderson #define TCG_TARGET_HAS_neg_vec 0 1148c033f24SRichard Henderson #define TCG_TARGET_HAS_abs_vec 1 1158c033f24SRichard Henderson #define TCG_TARGET_HAS_roti_vec have_avx512vl 1168c033f24SRichard Henderson #define TCG_TARGET_HAS_rots_vec 0 1178c033f24SRichard Henderson #define TCG_TARGET_HAS_rotv_vec have_avx512vl 1188c033f24SRichard Henderson #define TCG_TARGET_HAS_shi_vec 1 1198c033f24SRichard Henderson #define TCG_TARGET_HAS_shs_vec 1 1208c033f24SRichard Henderson #define TCG_TARGET_HAS_shv_vec have_avx2 1218c033f24SRichard Henderson #define TCG_TARGET_HAS_mul_vec 1 1228c033f24SRichard Henderson #define TCG_TARGET_HAS_sat_vec 1 1238c033f24SRichard Henderson #define TCG_TARGET_HAS_minmax_vec 1 1248c033f24SRichard Henderson #define TCG_TARGET_HAS_bitsel_vec have_avx512vl 1258c033f24SRichard Henderson #define TCG_TARGET_HAS_cmpsel_vec 1 1268c033f24SRichard Henderson #define TCG_TARGET_HAS_tst_vec have_avx512bw 1278c033f24SRichard Henderson 1288c033f24SRichard Henderson #define TCG_TARGET_deposit_i32_valid(ofs, len) \ 1298c033f24SRichard Henderson (((ofs) == 0 && ((len) == 8 || (len) == 16)) || \ 1308c033f24SRichard Henderson (TCG_TARGET_REG_BITS == 32 && (ofs) == 8 && (len) == 8)) 1318c033f24SRichard Henderson #define TCG_TARGET_deposit_i64_valid TCG_TARGET_deposit_i32_valid 1328c033f24SRichard Henderson 133*4bce752cSRichard Henderson /* 134*4bce752cSRichard Henderson * Check for the possibility of low byte/word extraction, high-byte extraction 135*4bce752cSRichard Henderson * and zero-extending 32-bit right-shift. 136*4bce752cSRichard Henderson * 137*4bce752cSRichard Henderson * We cannot sign-extend from high byte to 64-bits without using the 138*4bce752cSRichard Henderson * REX prefix that explicitly excludes access to the high-byte registers. 139*4bce752cSRichard Henderson */ 140*4bce752cSRichard Henderson static inline bool 141*4bce752cSRichard Henderson tcg_target_sextract_valid(TCGType type, unsigned ofs, unsigned len) 142*4bce752cSRichard Henderson { 143*4bce752cSRichard Henderson switch (ofs) { 144*4bce752cSRichard Henderson case 0: 145*4bce752cSRichard Henderson switch (len) { 146*4bce752cSRichard Henderson case 8: 147*4bce752cSRichard Henderson case 16: 148*4bce752cSRichard Henderson return true; 149*4bce752cSRichard Henderson case 32: 150*4bce752cSRichard Henderson return type == TCG_TYPE_I64; 151*4bce752cSRichard Henderson } 152*4bce752cSRichard Henderson return false; 153*4bce752cSRichard Henderson case 8: 154*4bce752cSRichard Henderson return len == 8 && type == TCG_TYPE_I32; 155*4bce752cSRichard Henderson } 156*4bce752cSRichard Henderson return false; 157*4bce752cSRichard Henderson } 158*4bce752cSRichard Henderson #define TCG_TARGET_sextract_valid tcg_target_sextract_valid 159*4bce752cSRichard Henderson 160*4bce752cSRichard Henderson static inline bool 161*4bce752cSRichard Henderson tcg_target_extract_valid(TCGType type, unsigned ofs, unsigned len) 162*4bce752cSRichard Henderson { 163*4bce752cSRichard Henderson if (type == TCG_TYPE_I64 && ofs + len == 32) { 164*4bce752cSRichard Henderson return true; 165*4bce752cSRichard Henderson } 166*4bce752cSRichard Henderson switch (ofs) { 167*4bce752cSRichard Henderson case 0: 168*4bce752cSRichard Henderson return len == 8 || len == 16; 169*4bce752cSRichard Henderson case 8: 170*4bce752cSRichard Henderson return len == 8; 171*4bce752cSRichard Henderson } 172*4bce752cSRichard Henderson return false; 173*4bce752cSRichard Henderson } 174*4bce752cSRichard Henderson #define TCG_TARGET_extract_valid tcg_target_extract_valid 1758c033f24SRichard Henderson 1768c033f24SRichard Henderson #endif 177