/* See if various MMX/SSE, SSSE3 and SSE4 instructions give expected results */
259e0fbf8Sbalrog #include <stdio.h>
359e0fbf8Sbalrog #include <string.h>
4*222a3336Sbalrog #include <stdint.h>
559e0fbf8Sbalrog
/*
 * Run a handful of MMX/SSSE3/SSE4 instructions and print their results.
 *
 * Expected output when every instruction behaves correctly:
 *   HELLO
 *   HELLO
 *   9 - 7 = 2
 *   HELLO
 *   13 = 13
 *   9 = 9 = 9
 *
 * Each test is a single asm statement: the register state (mm0, mm1, xmm0,
 * rax, ...) must not live across statement boundaries, because the compiler
 * is free to reuse those registers in between.  Memory is passed through "m"
 * operands so the compiler knows which objects the asm reads and writes.
 *
 * argc and argv are unused.  Always returns 0; results are checked by
 * comparing the printed output.
 */
int main(int argc, char *argv[]) {
    /* movdqa and palignr with a memory operand require 16-byte alignment. */
    char hello[16] __attribute__((aligned(16)));
    const char ehlo[8] = "EHLO ";
    /* pshufb selector: picks source bytes 1,0,2,2,3 and zeroes the top three */
    uint64_t mask = 0x8080800302020001;

    uint64_t a = 0x0000000000090007;
    uint64_t b = 0x0000000000000000;
    uint32_t c;
    uint16_t d;

    const char e[16] __attribute__((aligned(16))) = "LLOaaaaaaaaaaaaa";
    const char f[16] __attribute__((aligned(16))) = "aaaaaaaaaaaaaaHE";

    /* pshufb mm1/xmm1, mm2/xmm2 */
    __asm__ volatile ("movq %1, %%mm0\n\t"
                      "movq %2, %%mm1\n\t"
                      "pshufb %%mm1, %%mm0\n\t"
                      "movq %%mm0, %0"
                      : "=m" (hello)
                      : "m" (ehlo), "m" (mask)
                      : "mm0", "mm1");
    printf("%s\n", hello);

    /* pshufb mm1/xmm1, m64/m128 */
    __asm__ volatile ("movq %1, %%mm0\n\t"
                      "pshufb %2, %%mm0\n\t"
                      "movq %%mm0, %0"
                      : "=m" (hello)
                      : "m" (ehlo), "m" (mask)
                      : "mm0");
    printf("%s\n", hello);

    /* phsubsw mm1/xmm1, m64/m128 */
    /* Low result word is a[word0] - a[word1] = 7 - 9; the printf negates it. */
    __asm__ volatile ("movq %1, %%mm0\n\t"
                      "phsubsw %2, %%mm0\n\t"
                      "movq %%mm0, %0"
                      : "=m" (a)
                      : "r" (a), "m" (b)
                      : "mm0");
    printf("%i - %i = %i\n", 9, 7, -(int16_t) a);

    /* palignr mm1/xmm1, m64/m128, imm8 */
    /* Shifting e:f right by 14 bytes leaves f[14..15] followed by e[0..13]. */
    __asm__ volatile ("movdqa %1, %%xmm0\n\t"
                      "palignr $14, %2, %%xmm0\n\t"
                      "movdqa %%xmm0, %0"
                      : "=m" (hello)
                      : "m" (e), "m" (f)
                      : "xmm0");
    printf("%5.5s\n", hello);

#if 1 /* SSE4 */
    /* popcnt r64, r/m64 */
    /* Exercises the 16-, 32- and 64-bit forms on the same source value. */
    __asm__ volatile ("movq $0x8421000010009c63, %%rax\n\t"
                      "popcnt %%ax, %%dx\n\t"
                      "popcnt %%eax, %%ecx\n\t"
                      "popcnt %%rax, %%rax\n\t"
                      "movq %%rax, %0\n\t"
                      "movl %%ecx, %1\n\t"
                      "movw %%dx, %2"
                      : "=m" (a), "=m" (c), "=m" (d)
                      :
                      : "rax", "rcx", "rdx", "cc");
    printf("%i = %i\n%i = %i = %i\n", 13, (int) a, 9, (int) c, d + 1);
#endif

    return 0;
}
58