18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * This file contains instructions for testing by the test titled: 48c2ecf20Sopenharmony_ci * 58c2ecf20Sopenharmony_ci * "Test x86 instruction decoder - new instructions" 68c2ecf20Sopenharmony_ci * 78c2ecf20Sopenharmony_ci * Note that the 'Expecting' comment lines are consumed by the 88c2ecf20Sopenharmony_ci * gen-insn-x86-dat.awk script and have the format: 98c2ecf20Sopenharmony_ci * 108c2ecf20Sopenharmony_ci * Expecting: <op> <branch> <rel> 118c2ecf20Sopenharmony_ci * 128c2ecf20Sopenharmony_ci * If this file is changed, remember to run the gen-insn-x86-dat.sh 138c2ecf20Sopenharmony_ci * script and commit the result. 148c2ecf20Sopenharmony_ci * 158c2ecf20Sopenharmony_ci * Refer to insn-x86.c for more details. 168c2ecf20Sopenharmony_ci */ 178c2ecf20Sopenharmony_ci 188c2ecf20Sopenharmony_ciint main(void) 198c2ecf20Sopenharmony_ci{ 208c2ecf20Sopenharmony_ci /* Following line is a marker for the awk script - do not change */ 218c2ecf20Sopenharmony_ci asm volatile("rdtsc"); /* Start here */ 228c2ecf20Sopenharmony_ci 238c2ecf20Sopenharmony_ci /* Test fix for vcvtph2ps in x86-opcode-map.txt */ 248c2ecf20Sopenharmony_ci 258c2ecf20Sopenharmony_ci asm volatile("vcvtph2ps %xmm3,%ymm5"); 268c2ecf20Sopenharmony_ci 278c2ecf20Sopenharmony_ci#ifdef __x86_64__ 288c2ecf20Sopenharmony_ci 298c2ecf20Sopenharmony_ci /* AVX-512: Instructions with the same op codes as Mask Instructions */ 308c2ecf20Sopenharmony_ci 318c2ecf20Sopenharmony_ci asm volatile("cmovno %rax,%rbx"); 328c2ecf20Sopenharmony_ci asm volatile("cmovno 0x12345678(%rax),%rcx"); 338c2ecf20Sopenharmony_ci asm volatile("cmovno 0x12345678(%rax),%cx"); 348c2ecf20Sopenharmony_ci 358c2ecf20Sopenharmony_ci asm volatile("cmove %rax,%rbx"); 368c2ecf20Sopenharmony_ci asm volatile("cmove 0x12345678(%rax),%rcx"); 378c2ecf20Sopenharmony_ci asm volatile("cmove 0x12345678(%rax),%cx"); 388c2ecf20Sopenharmony_ci 
398c2ecf20Sopenharmony_ci asm volatile("seto 0x12345678(%rax)"); 408c2ecf20Sopenharmony_ci asm volatile("setno 0x12345678(%rax)"); 418c2ecf20Sopenharmony_ci asm volatile("setb 0x12345678(%rax)"); 428c2ecf20Sopenharmony_ci asm volatile("setc 0x12345678(%rax)"); 438c2ecf20Sopenharmony_ci asm volatile("setnae 0x12345678(%rax)"); 448c2ecf20Sopenharmony_ci asm volatile("setae 0x12345678(%rax)"); 458c2ecf20Sopenharmony_ci asm volatile("setnb 0x12345678(%rax)"); 468c2ecf20Sopenharmony_ci asm volatile("setnc 0x12345678(%rax)"); 478c2ecf20Sopenharmony_ci asm volatile("sets 0x12345678(%rax)"); 488c2ecf20Sopenharmony_ci asm volatile("setns 0x12345678(%rax)"); 498c2ecf20Sopenharmony_ci 508c2ecf20Sopenharmony_ci /* AVX-512: Mask Instructions */ 518c2ecf20Sopenharmony_ci 528c2ecf20Sopenharmony_ci asm volatile("kandw %k7,%k6,%k5"); 538c2ecf20Sopenharmony_ci asm volatile("kandq %k7,%k6,%k5"); 548c2ecf20Sopenharmony_ci asm volatile("kandb %k7,%k6,%k5"); 558c2ecf20Sopenharmony_ci asm volatile("kandd %k7,%k6,%k5"); 568c2ecf20Sopenharmony_ci 578c2ecf20Sopenharmony_ci asm volatile("kandnw %k7,%k6,%k5"); 588c2ecf20Sopenharmony_ci asm volatile("kandnq %k7,%k6,%k5"); 598c2ecf20Sopenharmony_ci asm volatile("kandnb %k7,%k6,%k5"); 608c2ecf20Sopenharmony_ci asm volatile("kandnd %k7,%k6,%k5"); 618c2ecf20Sopenharmony_ci 628c2ecf20Sopenharmony_ci asm volatile("knotw %k7,%k6"); 638c2ecf20Sopenharmony_ci asm volatile("knotq %k7,%k6"); 648c2ecf20Sopenharmony_ci asm volatile("knotb %k7,%k6"); 658c2ecf20Sopenharmony_ci asm volatile("knotd %k7,%k6"); 668c2ecf20Sopenharmony_ci 678c2ecf20Sopenharmony_ci asm volatile("korw %k7,%k6,%k5"); 688c2ecf20Sopenharmony_ci asm volatile("korq %k7,%k6,%k5"); 698c2ecf20Sopenharmony_ci asm volatile("korb %k7,%k6,%k5"); 708c2ecf20Sopenharmony_ci asm volatile("kord %k7,%k6,%k5"); 718c2ecf20Sopenharmony_ci 728c2ecf20Sopenharmony_ci asm volatile("kxnorw %k7,%k6,%k5"); 738c2ecf20Sopenharmony_ci asm volatile("kxnorq %k7,%k6,%k5"); 748c2ecf20Sopenharmony_ci asm 
volatile("kxnorb %k7,%k6,%k5"); 758c2ecf20Sopenharmony_ci asm volatile("kxnord %k7,%k6,%k5"); 768c2ecf20Sopenharmony_ci 778c2ecf20Sopenharmony_ci asm volatile("kxorw %k7,%k6,%k5"); 788c2ecf20Sopenharmony_ci asm volatile("kxorq %k7,%k6,%k5"); 798c2ecf20Sopenharmony_ci asm volatile("kxorb %k7,%k6,%k5"); 808c2ecf20Sopenharmony_ci asm volatile("kxord %k7,%k6,%k5"); 818c2ecf20Sopenharmony_ci 828c2ecf20Sopenharmony_ci asm volatile("kaddw %k7,%k6,%k5"); 838c2ecf20Sopenharmony_ci asm volatile("kaddq %k7,%k6,%k5"); 848c2ecf20Sopenharmony_ci asm volatile("kaddb %k7,%k6,%k5"); 858c2ecf20Sopenharmony_ci asm volatile("kaddd %k7,%k6,%k5"); 868c2ecf20Sopenharmony_ci 878c2ecf20Sopenharmony_ci asm volatile("kunpckbw %k7,%k6,%k5"); 888c2ecf20Sopenharmony_ci asm volatile("kunpckwd %k7,%k6,%k5"); 898c2ecf20Sopenharmony_ci asm volatile("kunpckdq %k7,%k6,%k5"); 908c2ecf20Sopenharmony_ci 918c2ecf20Sopenharmony_ci asm volatile("kmovw %k6,%k5"); 928c2ecf20Sopenharmony_ci asm volatile("kmovw (%rcx),%k5"); 938c2ecf20Sopenharmony_ci asm volatile("kmovw 0x123(%rax,%r14,8),%k5"); 948c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,(%rcx)"); 958c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,0x123(%rax,%r14,8)"); 968c2ecf20Sopenharmony_ci asm volatile("kmovw %eax,%k5"); 978c2ecf20Sopenharmony_ci asm volatile("kmovw %ebp,%k5"); 988c2ecf20Sopenharmony_ci asm volatile("kmovw %r13d,%k5"); 998c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,%eax"); 1008c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,%ebp"); 1018c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,%r13d"); 1028c2ecf20Sopenharmony_ci 1038c2ecf20Sopenharmony_ci asm volatile("kmovq %k6,%k5"); 1048c2ecf20Sopenharmony_ci asm volatile("kmovq (%rcx),%k5"); 1058c2ecf20Sopenharmony_ci asm volatile("kmovq 0x123(%rax,%r14,8),%k5"); 1068c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,(%rcx)"); 1078c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,0x123(%rax,%r14,8)"); 1088c2ecf20Sopenharmony_ci asm volatile("kmovq %rax,%k5"); 1098c2ecf20Sopenharmony_ci asm 
volatile("kmovq %rbp,%k5"); 1108c2ecf20Sopenharmony_ci asm volatile("kmovq %r13,%k5"); 1118c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,%rax"); 1128c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,%rbp"); 1138c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,%r13"); 1148c2ecf20Sopenharmony_ci 1158c2ecf20Sopenharmony_ci asm volatile("kmovb %k6,%k5"); 1168c2ecf20Sopenharmony_ci asm volatile("kmovb (%rcx),%k5"); 1178c2ecf20Sopenharmony_ci asm volatile("kmovb 0x123(%rax,%r14,8),%k5"); 1188c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,(%rcx)"); 1198c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,0x123(%rax,%r14,8)"); 1208c2ecf20Sopenharmony_ci asm volatile("kmovb %eax,%k5"); 1218c2ecf20Sopenharmony_ci asm volatile("kmovb %ebp,%k5"); 1228c2ecf20Sopenharmony_ci asm volatile("kmovb %r13d,%k5"); 1238c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,%eax"); 1248c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,%ebp"); 1258c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,%r13d"); 1268c2ecf20Sopenharmony_ci 1278c2ecf20Sopenharmony_ci asm volatile("kmovd %k6,%k5"); 1288c2ecf20Sopenharmony_ci asm volatile("kmovd (%rcx),%k5"); 1298c2ecf20Sopenharmony_ci asm volatile("kmovd 0x123(%rax,%r14,8),%k5"); 1308c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,(%rcx)"); 1318c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,0x123(%rax,%r14,8)"); 1328c2ecf20Sopenharmony_ci asm volatile("kmovd %eax,%k5"); 1338c2ecf20Sopenharmony_ci asm volatile("kmovd %ebp,%k5"); 1348c2ecf20Sopenharmony_ci asm volatile("kmovd %r13d,%k5"); 1358c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,%eax"); 1368c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,%ebp"); 1378c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,%r13d"); 1388c2ecf20Sopenharmony_ci 1398c2ecf20Sopenharmony_ci asm volatile("kortestw %k6,%k5"); 1408c2ecf20Sopenharmony_ci asm volatile("kortestq %k6,%k5"); 1418c2ecf20Sopenharmony_ci asm volatile("kortestb %k6,%k5"); 1428c2ecf20Sopenharmony_ci asm volatile("kortestd %k6,%k5"); 1438c2ecf20Sopenharmony_ci 
1448c2ecf20Sopenharmony_ci asm volatile("ktestw %k6,%k5"); 1458c2ecf20Sopenharmony_ci asm volatile("ktestq %k6,%k5"); 1468c2ecf20Sopenharmony_ci asm volatile("ktestb %k6,%k5"); 1478c2ecf20Sopenharmony_ci asm volatile("ktestd %k6,%k5"); 1488c2ecf20Sopenharmony_ci 1498c2ecf20Sopenharmony_ci asm volatile("kshiftrw $0x12,%k6,%k5"); 1508c2ecf20Sopenharmony_ci asm volatile("kshiftrq $0x5b,%k6,%k5"); 1518c2ecf20Sopenharmony_ci asm volatile("kshiftlw $0x12,%k6,%k5"); 1528c2ecf20Sopenharmony_ci asm volatile("kshiftlq $0x5b,%k6,%k5"); 1538c2ecf20Sopenharmony_ci 1548c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 5b */ 1558c2ecf20Sopenharmony_ci asm volatile("vcvtdq2ps %xmm5,%xmm6"); 1568c2ecf20Sopenharmony_ci asm volatile("vcvtqq2ps %zmm29,%ymm6{%k7}"); 1578c2ecf20Sopenharmony_ci asm volatile("vcvtps2dq %xmm5,%xmm6"); 1588c2ecf20Sopenharmony_ci asm volatile("vcvttps2dq %xmm5,%xmm6"); 1598c2ecf20Sopenharmony_ci 1608c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 6f */ 1618c2ecf20Sopenharmony_ci 1628c2ecf20Sopenharmony_ci asm volatile("movq %mm0,%mm4"); 1638c2ecf20Sopenharmony_ci asm volatile("vmovdqa %ymm4,%ymm6"); 1648c2ecf20Sopenharmony_ci asm volatile("vmovdqa32 %zmm25,%zmm26"); 1658c2ecf20Sopenharmony_ci asm volatile("vmovdqa64 %zmm25,%zmm26"); 1668c2ecf20Sopenharmony_ci asm volatile("vmovdqu %ymm4,%ymm6"); 1678c2ecf20Sopenharmony_ci asm volatile("vmovdqu32 %zmm29,%zmm30"); 1688c2ecf20Sopenharmony_ci asm volatile("vmovdqu64 %zmm25,%zmm26"); 1698c2ecf20Sopenharmony_ci asm volatile("vmovdqu8 %zmm29,%zmm30"); 1708c2ecf20Sopenharmony_ci asm volatile("vmovdqu16 %zmm25,%zmm26"); 1718c2ecf20Sopenharmony_ci 1728c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 78 */ 1738c2ecf20Sopenharmony_ci 1748c2ecf20Sopenharmony_ci asm volatile("vmread %rax,%rbx"); 1758c2ecf20Sopenharmony_ci asm volatile("vcvttps2udq %zmm25,%zmm26"); 1768c2ecf20Sopenharmony_ci asm volatile("vcvttpd2udq %zmm29,%ymm6{%k7}"); 1778c2ecf20Sopenharmony_ci asm volatile("vcvttsd2usi %xmm6,%rax"); 1788c2ecf20Sopenharmony_ci 
asm volatile("vcvttss2usi %xmm6,%rax"); 1798c2ecf20Sopenharmony_ci asm volatile("vcvttps2uqq %ymm5,%zmm26{%k7}"); 1808c2ecf20Sopenharmony_ci asm volatile("vcvttpd2uqq %zmm29,%zmm30"); 1818c2ecf20Sopenharmony_ci 1828c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 79 */ 1838c2ecf20Sopenharmony_ci 1848c2ecf20Sopenharmony_ci asm volatile("vmwrite %rax,%rbx"); 1858c2ecf20Sopenharmony_ci asm volatile("vcvtps2udq %zmm25,%zmm26"); 1868c2ecf20Sopenharmony_ci asm volatile("vcvtpd2udq %zmm29,%ymm6{%k7}"); 1878c2ecf20Sopenharmony_ci asm volatile("vcvtsd2usi %xmm6,%rax"); 1888c2ecf20Sopenharmony_ci asm volatile("vcvtss2usi %xmm6,%rax"); 1898c2ecf20Sopenharmony_ci asm volatile("vcvtps2uqq %ymm5,%zmm26{%k7}"); 1908c2ecf20Sopenharmony_ci asm volatile("vcvtpd2uqq %zmm29,%zmm30"); 1918c2ecf20Sopenharmony_ci 1928c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 7a */ 1938c2ecf20Sopenharmony_ci 1948c2ecf20Sopenharmony_ci asm volatile("vcvtudq2pd %ymm5,%zmm29{%k7}"); 1958c2ecf20Sopenharmony_ci asm volatile("vcvtuqq2pd %zmm25,%zmm26"); 1968c2ecf20Sopenharmony_ci asm volatile("vcvtudq2ps %zmm29,%zmm30"); 1978c2ecf20Sopenharmony_ci asm volatile("vcvtuqq2ps %zmm25,%ymm26{%k7}"); 1988c2ecf20Sopenharmony_ci asm volatile("vcvttps2qq %ymm25,%zmm26{%k7}"); 1998c2ecf20Sopenharmony_ci asm volatile("vcvttpd2qq %zmm29,%zmm30"); 2008c2ecf20Sopenharmony_ci 2018c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 7b */ 2028c2ecf20Sopenharmony_ci 2038c2ecf20Sopenharmony_ci asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 2048c2ecf20Sopenharmony_ci asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 2058c2ecf20Sopenharmony_ci asm volatile("vcvtps2qq %ymm5,%zmm26{%k7}"); 2068c2ecf20Sopenharmony_ci asm volatile("vcvtpd2qq %zmm29,%zmm30"); 2078c2ecf20Sopenharmony_ci 2088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 7f */ 2098c2ecf20Sopenharmony_ci 2108c2ecf20Sopenharmony_ci asm volatile("movq.s %mm0,%mm4"); 2118c2ecf20Sopenharmony_ci asm volatile("vmovdqa %ymm8,%ymm6"); 2128c2ecf20Sopenharmony_ci asm volatile("vmovdqa32.s 
%zmm25,%zmm26"); 2138c2ecf20Sopenharmony_ci asm volatile("vmovdqa64.s %zmm25,%zmm26"); 2148c2ecf20Sopenharmony_ci asm volatile("vmovdqu %ymm8,%ymm6"); 2158c2ecf20Sopenharmony_ci asm volatile("vmovdqu32.s %zmm25,%zmm26"); 2168c2ecf20Sopenharmony_ci asm volatile("vmovdqu64.s %zmm25,%zmm26"); 2178c2ecf20Sopenharmony_ci asm volatile("vmovdqu8.s %zmm30,(%rcx)"); 2188c2ecf20Sopenharmony_ci asm volatile("vmovdqu16.s %zmm25,%zmm26"); 2198c2ecf20Sopenharmony_ci 2208c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f db */ 2218c2ecf20Sopenharmony_ci 2228c2ecf20Sopenharmony_ci asm volatile("pand %mm1,%mm2"); 2238c2ecf20Sopenharmony_ci asm volatile("pand %xmm1,%xmm2"); 2248c2ecf20Sopenharmony_ci asm volatile("vpand %ymm4,%ymm6,%ymm2"); 2258c2ecf20Sopenharmony_ci asm volatile("vpandd %zmm24,%zmm25,%zmm26"); 2268c2ecf20Sopenharmony_ci asm volatile("vpandq %zmm24,%zmm25,%zmm26"); 2278c2ecf20Sopenharmony_ci 2288c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f df */ 2298c2ecf20Sopenharmony_ci 2308c2ecf20Sopenharmony_ci asm volatile("pandn %mm1,%mm2"); 2318c2ecf20Sopenharmony_ci asm volatile("pandn %xmm1,%xmm2"); 2328c2ecf20Sopenharmony_ci asm volatile("vpandn %ymm4,%ymm6,%ymm2"); 2338c2ecf20Sopenharmony_ci asm volatile("vpandnd %zmm24,%zmm25,%zmm26"); 2348c2ecf20Sopenharmony_ci asm volatile("vpandnq %zmm24,%zmm25,%zmm26"); 2358c2ecf20Sopenharmony_ci 2368c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f e6 */ 2378c2ecf20Sopenharmony_ci 2388c2ecf20Sopenharmony_ci asm volatile("vcvttpd2dq %xmm1,%xmm2"); 2398c2ecf20Sopenharmony_ci asm volatile("vcvtdq2pd %xmm5,%xmm6"); 2408c2ecf20Sopenharmony_ci asm volatile("vcvtdq2pd %ymm5,%zmm26{%k7}"); 2418c2ecf20Sopenharmony_ci asm volatile("vcvtqq2pd %zmm25,%zmm26"); 2428c2ecf20Sopenharmony_ci asm volatile("vcvtpd2dq %xmm1,%xmm2"); 2438c2ecf20Sopenharmony_ci 2448c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f eb */ 2458c2ecf20Sopenharmony_ci 2468c2ecf20Sopenharmony_ci asm volatile("por %mm4,%mm6"); 2478c2ecf20Sopenharmony_ci asm volatile("vpor 
%ymm4,%ymm6,%ymm2"); 2488c2ecf20Sopenharmony_ci asm volatile("vpord %zmm24,%zmm25,%zmm26"); 2498c2ecf20Sopenharmony_ci asm volatile("vporq %zmm24,%zmm25,%zmm26"); 2508c2ecf20Sopenharmony_ci 2518c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f ef */ 2528c2ecf20Sopenharmony_ci 2538c2ecf20Sopenharmony_ci asm volatile("pxor %mm4,%mm6"); 2548c2ecf20Sopenharmony_ci asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 2558c2ecf20Sopenharmony_ci asm volatile("vpxord %zmm24,%zmm25,%zmm26"); 2568c2ecf20Sopenharmony_ci asm volatile("vpxorq %zmm24,%zmm25,%zmm26"); 2578c2ecf20Sopenharmony_ci 2588c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 10 */ 2598c2ecf20Sopenharmony_ci 2608c2ecf20Sopenharmony_ci asm volatile("pblendvb %xmm1,%xmm0"); 2618c2ecf20Sopenharmony_ci asm volatile("vpsrlvw %zmm27,%zmm28,%zmm29"); 2628c2ecf20Sopenharmony_ci asm volatile("vpmovuswb %zmm28,%ymm6{%k7}"); 2638c2ecf20Sopenharmony_ci 2648c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 11 */ 2658c2ecf20Sopenharmony_ci 2668c2ecf20Sopenharmony_ci asm volatile("vpmovusdb %zmm28,%xmm6{%k7}"); 2678c2ecf20Sopenharmony_ci asm volatile("vpsravw %zmm27,%zmm28,%zmm29"); 2688c2ecf20Sopenharmony_ci 2698c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 12 */ 2708c2ecf20Sopenharmony_ci 2718c2ecf20Sopenharmony_ci asm volatile("vpmovusqb %zmm27,%xmm6{%k7}"); 2728c2ecf20Sopenharmony_ci asm volatile("vpsllvw %zmm27,%zmm28,%zmm29"); 2738c2ecf20Sopenharmony_ci 2748c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 13 */ 2758c2ecf20Sopenharmony_ci 2768c2ecf20Sopenharmony_ci asm volatile("vcvtph2ps %xmm3,%ymm5"); 2778c2ecf20Sopenharmony_ci asm volatile("vcvtph2ps %ymm5,%zmm27{%k7}"); 2788c2ecf20Sopenharmony_ci asm volatile("vpmovusdw %zmm27,%ymm6{%k7}"); 2798c2ecf20Sopenharmony_ci 2808c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 14 */ 2818c2ecf20Sopenharmony_ci 2828c2ecf20Sopenharmony_ci asm volatile("blendvps %xmm1,%xmm0"); 2838c2ecf20Sopenharmony_ci asm volatile("vpmovusqw %zmm27,%xmm6{%k7}"); 2848c2ecf20Sopenharmony_ci asm 
volatile("vprorvd %zmm27,%zmm28,%zmm29"); 2858c2ecf20Sopenharmony_ci asm volatile("vprorvq %zmm27,%zmm28,%zmm29"); 2868c2ecf20Sopenharmony_ci 2878c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 15 */ 2888c2ecf20Sopenharmony_ci 2898c2ecf20Sopenharmony_ci asm volatile("blendvpd %xmm1,%xmm0"); 2908c2ecf20Sopenharmony_ci asm volatile("vpmovusqd %zmm27,%ymm6{%k7}"); 2918c2ecf20Sopenharmony_ci asm volatile("vprolvd %zmm27,%zmm28,%zmm29"); 2928c2ecf20Sopenharmony_ci asm volatile("vprolvq %zmm27,%zmm28,%zmm29"); 2938c2ecf20Sopenharmony_ci 2948c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 16 */ 2958c2ecf20Sopenharmony_ci 2968c2ecf20Sopenharmony_ci asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 2978c2ecf20Sopenharmony_ci asm volatile("vpermps %ymm24,%ymm26,%ymm22{%k7}"); 2988c2ecf20Sopenharmony_ci asm volatile("vpermpd %ymm24,%ymm26,%ymm22{%k7}"); 2998c2ecf20Sopenharmony_ci 3008c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 19 */ 3018c2ecf20Sopenharmony_ci 3028c2ecf20Sopenharmony_ci asm volatile("vbroadcastsd %xmm4,%ymm6"); 3038c2ecf20Sopenharmony_ci asm volatile("vbroadcastf32x2 %xmm27,%zmm26"); 3048c2ecf20Sopenharmony_ci 3058c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 1a */ 3068c2ecf20Sopenharmony_ci 3078c2ecf20Sopenharmony_ci asm volatile("vbroadcastf128 (%rcx),%ymm4"); 3088c2ecf20Sopenharmony_ci asm volatile("vbroadcastf32x4 (%rcx),%zmm26"); 3098c2ecf20Sopenharmony_ci asm volatile("vbroadcastf64x2 (%rcx),%zmm26"); 3108c2ecf20Sopenharmony_ci 3118c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 1b */ 3128c2ecf20Sopenharmony_ci 3138c2ecf20Sopenharmony_ci asm volatile("vbroadcastf32x8 (%rcx),%zmm27"); 3148c2ecf20Sopenharmony_ci asm volatile("vbroadcastf64x4 (%rcx),%zmm26"); 3158c2ecf20Sopenharmony_ci 3168c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 1f */ 3178c2ecf20Sopenharmony_ci 3188c2ecf20Sopenharmony_ci asm volatile("vpabsq %zmm27,%zmm28"); 3198c2ecf20Sopenharmony_ci 3208c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 20 */ 3218c2ecf20Sopenharmony_ci 
3228c2ecf20Sopenharmony_ci asm volatile("vpmovsxbw %xmm4,%xmm5"); 3238c2ecf20Sopenharmony_ci asm volatile("vpmovswb %zmm27,%ymm6{%k7}"); 3248c2ecf20Sopenharmony_ci 3258c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 21 */ 3268c2ecf20Sopenharmony_ci 3278c2ecf20Sopenharmony_ci asm volatile("vpmovsxbd %xmm4,%ymm6"); 3288c2ecf20Sopenharmony_ci asm volatile("vpmovsdb %zmm27,%xmm6{%k7}"); 3298c2ecf20Sopenharmony_ci 3308c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 22 */ 3318c2ecf20Sopenharmony_ci 3328c2ecf20Sopenharmony_ci asm volatile("vpmovsxbq %xmm4,%ymm4"); 3338c2ecf20Sopenharmony_ci asm volatile("vpmovsqb %zmm27,%xmm6{%k7}"); 3348c2ecf20Sopenharmony_ci 3358c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 23 */ 3368c2ecf20Sopenharmony_ci 3378c2ecf20Sopenharmony_ci asm volatile("vpmovsxwd %xmm4,%ymm4"); 3388c2ecf20Sopenharmony_ci asm volatile("vpmovsdw %zmm27,%ymm6{%k7}"); 3398c2ecf20Sopenharmony_ci 3408c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 24 */ 3418c2ecf20Sopenharmony_ci 3428c2ecf20Sopenharmony_ci asm volatile("vpmovsxwq %xmm4,%ymm6"); 3438c2ecf20Sopenharmony_ci asm volatile("vpmovsqw %zmm27,%xmm6{%k7}"); 3448c2ecf20Sopenharmony_ci 3458c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 25 */ 3468c2ecf20Sopenharmony_ci 3478c2ecf20Sopenharmony_ci asm volatile("vpmovsxdq %xmm4,%ymm4"); 3488c2ecf20Sopenharmony_ci asm volatile("vpmovsqd %zmm27,%ymm6{%k7}"); 3498c2ecf20Sopenharmony_ci 3508c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 26 */ 3518c2ecf20Sopenharmony_ci 3528c2ecf20Sopenharmony_ci asm volatile("vptestmb %zmm27,%zmm28,%k5"); 3538c2ecf20Sopenharmony_ci asm volatile("vptestmw %zmm27,%zmm28,%k5"); 3548c2ecf20Sopenharmony_ci asm volatile("vptestnmb %zmm26,%zmm27,%k5"); 3558c2ecf20Sopenharmony_ci asm volatile("vptestnmw %zmm26,%zmm27,%k5"); 3568c2ecf20Sopenharmony_ci 3578c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 27 */ 3588c2ecf20Sopenharmony_ci 3598c2ecf20Sopenharmony_ci asm volatile("vptestmd %zmm27,%zmm28,%k5"); 3608c2ecf20Sopenharmony_ci 
asm volatile("vptestmq %zmm27,%zmm28,%k5"); 3618c2ecf20Sopenharmony_ci asm volatile("vptestnmd %zmm26,%zmm27,%k5"); 3628c2ecf20Sopenharmony_ci asm volatile("vptestnmq %zmm26,%zmm27,%k5"); 3638c2ecf20Sopenharmony_ci 3648c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 28 */ 3658c2ecf20Sopenharmony_ci 3668c2ecf20Sopenharmony_ci asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 3678c2ecf20Sopenharmony_ci asm volatile("vpmovm2b %k5,%zmm28"); 3688c2ecf20Sopenharmony_ci asm volatile("vpmovm2w %k5,%zmm28"); 3698c2ecf20Sopenharmony_ci 3708c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 29 */ 3718c2ecf20Sopenharmony_ci 3728c2ecf20Sopenharmony_ci asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 3738c2ecf20Sopenharmony_ci asm volatile("vpmovb2m %zmm28,%k5"); 3748c2ecf20Sopenharmony_ci asm volatile("vpmovw2m %zmm28,%k5"); 3758c2ecf20Sopenharmony_ci 3768c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 2a */ 3778c2ecf20Sopenharmony_ci 3788c2ecf20Sopenharmony_ci asm volatile("vmovntdqa (%rcx),%ymm4"); 3798c2ecf20Sopenharmony_ci asm volatile("vpbroadcastmb2q %k6,%zmm30"); 3808c2ecf20Sopenharmony_ci 3818c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 2c */ 3828c2ecf20Sopenharmony_ci 3838c2ecf20Sopenharmony_ci asm volatile("vmaskmovps (%rcx),%ymm4,%ymm6"); 3848c2ecf20Sopenharmony_ci asm volatile("vscalefps %zmm24,%zmm25,%zmm26"); 3858c2ecf20Sopenharmony_ci asm volatile("vscalefpd %zmm24,%zmm25,%zmm26"); 3868c2ecf20Sopenharmony_ci 3878c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 2d */ 3888c2ecf20Sopenharmony_ci 3898c2ecf20Sopenharmony_ci asm volatile("vmaskmovpd (%rcx),%ymm4,%ymm6"); 3908c2ecf20Sopenharmony_ci asm volatile("vscalefss %xmm24,%xmm25,%xmm26{%k7}"); 3918c2ecf20Sopenharmony_ci asm volatile("vscalefsd %xmm24,%xmm25,%xmm26{%k7}"); 3928c2ecf20Sopenharmony_ci 3938c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 30 */ 3948c2ecf20Sopenharmony_ci 3958c2ecf20Sopenharmony_ci asm volatile("vpmovzxbw %xmm4,%ymm4"); 3968c2ecf20Sopenharmony_ci asm volatile("vpmovwb %zmm27,%ymm6{%k7}"); 
3978c2ecf20Sopenharmony_ci 3988c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 31 */ 3998c2ecf20Sopenharmony_ci 4008c2ecf20Sopenharmony_ci asm volatile("vpmovzxbd %xmm4,%ymm6"); 4018c2ecf20Sopenharmony_ci asm volatile("vpmovdb %zmm27,%xmm6{%k7}"); 4028c2ecf20Sopenharmony_ci 4038c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 32 */ 4048c2ecf20Sopenharmony_ci 4058c2ecf20Sopenharmony_ci asm volatile("vpmovzxbq %xmm4,%ymm4"); 4068c2ecf20Sopenharmony_ci asm volatile("vpmovqb %zmm27,%xmm6{%k7}"); 4078c2ecf20Sopenharmony_ci 4088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 33 */ 4098c2ecf20Sopenharmony_ci 4108c2ecf20Sopenharmony_ci asm volatile("vpmovzxwd %xmm4,%ymm4"); 4118c2ecf20Sopenharmony_ci asm volatile("vpmovdw %zmm27,%ymm6{%k7}"); 4128c2ecf20Sopenharmony_ci 4138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 34 */ 4148c2ecf20Sopenharmony_ci 4158c2ecf20Sopenharmony_ci asm volatile("vpmovzxwq %xmm4,%ymm6"); 4168c2ecf20Sopenharmony_ci asm volatile("vpmovqw %zmm27,%xmm6{%k7}"); 4178c2ecf20Sopenharmony_ci 4188c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 35 */ 4198c2ecf20Sopenharmony_ci 4208c2ecf20Sopenharmony_ci asm volatile("vpmovzxdq %xmm4,%ymm4"); 4218c2ecf20Sopenharmony_ci asm volatile("vpmovqd %zmm27,%ymm6{%k7}"); 4228c2ecf20Sopenharmony_ci 4238c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 36 */ 4248c2ecf20Sopenharmony_ci 4258c2ecf20Sopenharmony_ci asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 4268c2ecf20Sopenharmony_ci asm volatile("vpermd %ymm24,%ymm26,%ymm22{%k7}"); 4278c2ecf20Sopenharmony_ci asm volatile("vpermq %ymm24,%ymm26,%ymm22{%k7}"); 4288c2ecf20Sopenharmony_ci 4298c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 38 */ 4308c2ecf20Sopenharmony_ci 4318c2ecf20Sopenharmony_ci asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 4328c2ecf20Sopenharmony_ci asm volatile("vpmovm2d %k5,%zmm28"); 4338c2ecf20Sopenharmony_ci asm volatile("vpmovm2q %k5,%zmm28"); 4348c2ecf20Sopenharmony_ci 4358c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 39 */ 
4368c2ecf20Sopenharmony_ci 4378c2ecf20Sopenharmony_ci asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 4388c2ecf20Sopenharmony_ci asm volatile("vpminsd %zmm24,%zmm25,%zmm26"); 4398c2ecf20Sopenharmony_ci asm volatile("vpminsq %zmm24,%zmm25,%zmm26"); 4408c2ecf20Sopenharmony_ci asm volatile("vpmovd2m %zmm28,%k5"); 4418c2ecf20Sopenharmony_ci asm volatile("vpmovq2m %zmm28,%k5"); 4428c2ecf20Sopenharmony_ci 4438c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3a */ 4448c2ecf20Sopenharmony_ci 4458c2ecf20Sopenharmony_ci asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 4468c2ecf20Sopenharmony_ci asm volatile("vpbroadcastmw2d %k6,%zmm28"); 4478c2ecf20Sopenharmony_ci 4488c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3b */ 4498c2ecf20Sopenharmony_ci 4508c2ecf20Sopenharmony_ci asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 4518c2ecf20Sopenharmony_ci asm volatile("vpminud %zmm24,%zmm25,%zmm26"); 4528c2ecf20Sopenharmony_ci asm volatile("vpminuq %zmm24,%zmm25,%zmm26"); 4538c2ecf20Sopenharmony_ci 4548c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3d */ 4558c2ecf20Sopenharmony_ci 4568c2ecf20Sopenharmony_ci asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 4578c2ecf20Sopenharmony_ci asm volatile("vpmaxsd %zmm24,%zmm25,%zmm26"); 4588c2ecf20Sopenharmony_ci asm volatile("vpmaxsq %zmm24,%zmm25,%zmm26"); 4598c2ecf20Sopenharmony_ci 4608c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3f */ 4618c2ecf20Sopenharmony_ci 4628c2ecf20Sopenharmony_ci asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 4638c2ecf20Sopenharmony_ci asm volatile("vpmaxud %zmm24,%zmm25,%zmm26"); 4648c2ecf20Sopenharmony_ci asm volatile("vpmaxuq %zmm24,%zmm25,%zmm26"); 4658c2ecf20Sopenharmony_ci 4668c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 40 */ 4678c2ecf20Sopenharmony_ci 4688c2ecf20Sopenharmony_ci asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 4698c2ecf20Sopenharmony_ci asm volatile("vpmulld %zmm24,%zmm25,%zmm26"); 4708c2ecf20Sopenharmony_ci asm volatile("vpmullq %zmm24,%zmm25,%zmm26"); 4718c2ecf20Sopenharmony_ci 4728c2ecf20Sopenharmony_ci /* 
AVX-512: Op code 0f 38 42 */ 4738c2ecf20Sopenharmony_ci 4748c2ecf20Sopenharmony_ci asm volatile("vgetexpps %zmm25,%zmm26"); 4758c2ecf20Sopenharmony_ci asm volatile("vgetexppd %zmm27,%zmm28"); 4768c2ecf20Sopenharmony_ci 4778c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 43 */ 4788c2ecf20Sopenharmony_ci 4798c2ecf20Sopenharmony_ci asm volatile("vgetexpss %xmm24,%xmm25,%xmm26{%k7}"); 4808c2ecf20Sopenharmony_ci asm volatile("vgetexpsd %xmm28,%xmm29,%xmm30{%k7}"); 4818c2ecf20Sopenharmony_ci 4828c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 44 */ 4838c2ecf20Sopenharmony_ci 4848c2ecf20Sopenharmony_ci asm volatile("vplzcntd %zmm27,%zmm28"); 4858c2ecf20Sopenharmony_ci asm volatile("vplzcntq %zmm27,%zmm28"); 4868c2ecf20Sopenharmony_ci 4878c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 46 */ 4888c2ecf20Sopenharmony_ci 4898c2ecf20Sopenharmony_ci asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 4908c2ecf20Sopenharmony_ci asm volatile("vpsravd %zmm24,%zmm25,%zmm26"); 4918c2ecf20Sopenharmony_ci asm volatile("vpsravq %zmm24,%zmm25,%zmm26"); 4928c2ecf20Sopenharmony_ci 4938c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4c */ 4948c2ecf20Sopenharmony_ci 4958c2ecf20Sopenharmony_ci asm volatile("vrcp14ps %zmm25,%zmm26"); 4968c2ecf20Sopenharmony_ci asm volatile("vrcp14pd %zmm27,%zmm28"); 4978c2ecf20Sopenharmony_ci 4988c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4d */ 4998c2ecf20Sopenharmony_ci 5008c2ecf20Sopenharmony_ci asm volatile("vrcp14ss %xmm24,%xmm25,%xmm26{%k7}"); 5018c2ecf20Sopenharmony_ci asm volatile("vrcp14sd %xmm24,%xmm25,%xmm26{%k7}"); 5028c2ecf20Sopenharmony_ci 5038c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4e */ 5048c2ecf20Sopenharmony_ci 5058c2ecf20Sopenharmony_ci asm volatile("vrsqrt14ps %zmm25,%zmm26"); 5068c2ecf20Sopenharmony_ci asm volatile("vrsqrt14pd %zmm27,%zmm28"); 5078c2ecf20Sopenharmony_ci 5088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4f */ 5098c2ecf20Sopenharmony_ci 5108c2ecf20Sopenharmony_ci asm volatile("vrsqrt14ss 
%xmm24,%xmm25,%xmm26{%k7}"); 5118c2ecf20Sopenharmony_ci asm volatile("vrsqrt14sd %xmm24,%xmm25,%xmm26{%k7}"); 5128c2ecf20Sopenharmony_ci 5138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 50 */ 5148c2ecf20Sopenharmony_ci 5158c2ecf20Sopenharmony_ci asm volatile("vpdpbusd %xmm1, %xmm2, %xmm3"); 5168c2ecf20Sopenharmony_ci asm volatile("vpdpbusd %ymm1, %ymm2, %ymm3"); 5178c2ecf20Sopenharmony_ci asm volatile("vpdpbusd %zmm1, %zmm2, %zmm3"); 5188c2ecf20Sopenharmony_ci asm volatile("vpdpbusd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 5198c2ecf20Sopenharmony_ci asm volatile("vpdpbusd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 5208c2ecf20Sopenharmony_ci 5218c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 51 */ 5228c2ecf20Sopenharmony_ci 5238c2ecf20Sopenharmony_ci asm volatile("vpdpbusds %xmm1, %xmm2, %xmm3"); 5248c2ecf20Sopenharmony_ci asm volatile("vpdpbusds %ymm1, %ymm2, %ymm3"); 5258c2ecf20Sopenharmony_ci asm volatile("vpdpbusds %zmm1, %zmm2, %zmm3"); 5268c2ecf20Sopenharmony_ci asm volatile("vpdpbusds 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 5278c2ecf20Sopenharmony_ci asm volatile("vpdpbusds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 5288c2ecf20Sopenharmony_ci 5298c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 52 */ 5308c2ecf20Sopenharmony_ci 5318c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps %xmm1, %xmm2, %xmm3"); 5328c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps %ymm1, %ymm2, %ymm3"); 5338c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps %zmm1, %zmm2, %zmm3"); 5348c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 5358c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 5368c2ecf20Sopenharmony_ci 5378c2ecf20Sopenharmony_ci asm volatile("vpdpwssd %xmm1, %xmm2, %xmm3"); 5388c2ecf20Sopenharmony_ci asm volatile("vpdpwssd %ymm1, %ymm2, %ymm3"); 5398c2ecf20Sopenharmony_ci asm volatile("vpdpwssd %zmm1, %zmm2, %zmm3"); 5408c2ecf20Sopenharmony_ci asm volatile("vpdpwssd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 
5418c2ecf20Sopenharmony_ci asm volatile("vpdpwssd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 5428c2ecf20Sopenharmony_ci 5438c2ecf20Sopenharmony_ci asm volatile("vp4dpwssd (%rax), %zmm0, %zmm4"); 5448c2ecf20Sopenharmony_ci asm volatile("vp4dpwssd (%eax), %zmm0, %zmm4"); 5458c2ecf20Sopenharmony_ci asm volatile("vp4dpwssd 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 5468c2ecf20Sopenharmony_ci asm volatile("vp4dpwssd 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 5478c2ecf20Sopenharmony_ci 5488c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 53 */ 5498c2ecf20Sopenharmony_ci 5508c2ecf20Sopenharmony_ci asm volatile("vpdpwssds %xmm1, %xmm2, %xmm3"); 5518c2ecf20Sopenharmony_ci asm volatile("vpdpwssds %ymm1, %ymm2, %ymm3"); 5528c2ecf20Sopenharmony_ci asm volatile("vpdpwssds %zmm1, %zmm2, %zmm3"); 5538c2ecf20Sopenharmony_ci asm volatile("vpdpwssds 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 5548c2ecf20Sopenharmony_ci asm volatile("vpdpwssds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 5558c2ecf20Sopenharmony_ci 5568c2ecf20Sopenharmony_ci asm volatile("vp4dpwssds (%rax), %zmm0, %zmm4"); 5578c2ecf20Sopenharmony_ci asm volatile("vp4dpwssds (%eax), %zmm0, %zmm4"); 5588c2ecf20Sopenharmony_ci asm volatile("vp4dpwssds 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 5598c2ecf20Sopenharmony_ci asm volatile("vp4dpwssds 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 5608c2ecf20Sopenharmony_ci 5618c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 54 */ 5628c2ecf20Sopenharmony_ci 5638c2ecf20Sopenharmony_ci asm volatile("vpopcntb %xmm1, %xmm2"); 5648c2ecf20Sopenharmony_ci asm volatile("vpopcntb %ymm1, %ymm2"); 5658c2ecf20Sopenharmony_ci asm volatile("vpopcntb %zmm1, %zmm2"); 5668c2ecf20Sopenharmony_ci asm volatile("vpopcntb 0x12345678(%rax,%rcx,8),%zmm2"); 5678c2ecf20Sopenharmony_ci asm volatile("vpopcntb 0x12345678(%eax,%ecx,8),%zmm2"); 5688c2ecf20Sopenharmony_ci 5698c2ecf20Sopenharmony_ci asm volatile("vpopcntw %xmm1, %xmm2"); 5708c2ecf20Sopenharmony_ci asm volatile("vpopcntw %ymm1, %ymm2"); 5718c2ecf20Sopenharmony_ci asm 
volatile("vpopcntw %zmm1, %zmm2"); 5728c2ecf20Sopenharmony_ci asm volatile("vpopcntw 0x12345678(%rax,%rcx,8),%zmm2"); 5738c2ecf20Sopenharmony_ci asm volatile("vpopcntw 0x12345678(%eax,%ecx,8),%zmm2"); 5748c2ecf20Sopenharmony_ci 5758c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 55 */ 5768c2ecf20Sopenharmony_ci 5778c2ecf20Sopenharmony_ci asm volatile("vpopcntd %xmm1, %xmm2"); 5788c2ecf20Sopenharmony_ci asm volatile("vpopcntd %ymm1, %ymm2"); 5798c2ecf20Sopenharmony_ci asm volatile("vpopcntd %zmm1, %zmm2"); 5808c2ecf20Sopenharmony_ci asm volatile("vpopcntd 0x12345678(%rax,%rcx,8),%zmm2"); 5818c2ecf20Sopenharmony_ci asm volatile("vpopcntd 0x12345678(%eax,%ecx,8),%zmm2"); 5828c2ecf20Sopenharmony_ci 5838c2ecf20Sopenharmony_ci asm volatile("vpopcntq %xmm1, %xmm2"); 5848c2ecf20Sopenharmony_ci asm volatile("vpopcntq %ymm1, %ymm2"); 5858c2ecf20Sopenharmony_ci asm volatile("vpopcntq %zmm1, %zmm2"); 5868c2ecf20Sopenharmony_ci asm volatile("vpopcntq 0x12345678(%rax,%rcx,8),%zmm2"); 5878c2ecf20Sopenharmony_ci asm volatile("vpopcntq 0x12345678(%eax,%ecx,8),%zmm2"); 5888c2ecf20Sopenharmony_ci 5898c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 59 */ 5908c2ecf20Sopenharmony_ci 5918c2ecf20Sopenharmony_ci asm volatile("vpbroadcastq %xmm4,%xmm6"); 5928c2ecf20Sopenharmony_ci asm volatile("vbroadcasti32x2 %xmm27,%zmm26"); 5938c2ecf20Sopenharmony_ci 5948c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 5a */ 5958c2ecf20Sopenharmony_ci 5968c2ecf20Sopenharmony_ci asm volatile("vbroadcasti128 (%rcx),%ymm4"); 5978c2ecf20Sopenharmony_ci asm volatile("vbroadcasti32x4 (%rcx),%zmm26"); 5988c2ecf20Sopenharmony_ci asm volatile("vbroadcasti64x2 (%rcx),%zmm26"); 5998c2ecf20Sopenharmony_ci 6008c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 5b */ 6018c2ecf20Sopenharmony_ci 6028c2ecf20Sopenharmony_ci asm volatile("vbroadcasti32x8 (%rcx),%zmm28"); 6038c2ecf20Sopenharmony_ci asm volatile("vbroadcasti64x4 (%rcx),%zmm26"); 6048c2ecf20Sopenharmony_ci 6058c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 
62 */ 6068c2ecf20Sopenharmony_ci 6078c2ecf20Sopenharmony_ci asm volatile("vpexpandb %xmm1, %xmm2"); 6088c2ecf20Sopenharmony_ci asm volatile("vpexpandb %ymm1, %ymm2"); 6098c2ecf20Sopenharmony_ci asm volatile("vpexpandb %zmm1, %zmm2"); 6108c2ecf20Sopenharmony_ci asm volatile("vpexpandb 0x12345678(%rax,%rcx,8),%zmm2"); 6118c2ecf20Sopenharmony_ci asm volatile("vpexpandb 0x12345678(%eax,%ecx,8),%zmm2"); 6128c2ecf20Sopenharmony_ci 6138c2ecf20Sopenharmony_ci asm volatile("vpexpandw %xmm1, %xmm2"); 6148c2ecf20Sopenharmony_ci asm volatile("vpexpandw %ymm1, %ymm2"); 6158c2ecf20Sopenharmony_ci asm volatile("vpexpandw %zmm1, %zmm2"); 6168c2ecf20Sopenharmony_ci asm volatile("vpexpandw 0x12345678(%rax,%rcx,8),%zmm2"); 6178c2ecf20Sopenharmony_ci asm volatile("vpexpandw 0x12345678(%eax,%ecx,8),%zmm2"); 6188c2ecf20Sopenharmony_ci 6198c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 63 */ 6208c2ecf20Sopenharmony_ci 6218c2ecf20Sopenharmony_ci asm volatile("vpcompressb %xmm1, %xmm2"); 6228c2ecf20Sopenharmony_ci asm volatile("vpcompressb %ymm1, %ymm2"); 6238c2ecf20Sopenharmony_ci asm volatile("vpcompressb %zmm1, %zmm2"); 6248c2ecf20Sopenharmony_ci asm volatile("vpcompressb %zmm2,0x12345678(%rax,%rcx,8)"); 6258c2ecf20Sopenharmony_ci asm volatile("vpcompressb %zmm2,0x12345678(%eax,%ecx,8)"); 6268c2ecf20Sopenharmony_ci 6278c2ecf20Sopenharmony_ci asm volatile("vpcompressw %xmm1, %xmm2"); 6288c2ecf20Sopenharmony_ci asm volatile("vpcompressw %ymm1, %ymm2"); 6298c2ecf20Sopenharmony_ci asm volatile("vpcompressw %zmm1, %zmm2"); 6308c2ecf20Sopenharmony_ci asm volatile("vpcompressw %zmm2,0x12345678(%rax,%rcx,8)"); 6318c2ecf20Sopenharmony_ci asm volatile("vpcompressw %zmm2,0x12345678(%eax,%ecx,8)"); 6328c2ecf20Sopenharmony_ci 6338c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 64 */ 6348c2ecf20Sopenharmony_ci 6358c2ecf20Sopenharmony_ci asm volatile("vpblendmd %zmm26,%zmm27,%zmm28"); 6368c2ecf20Sopenharmony_ci asm volatile("vpblendmq %zmm26,%zmm27,%zmm28"); 6378c2ecf20Sopenharmony_ci 
6388c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 65 */ 6398c2ecf20Sopenharmony_ci 6408c2ecf20Sopenharmony_ci asm volatile("vblendmps %zmm24,%zmm25,%zmm26"); 6418c2ecf20Sopenharmony_ci asm volatile("vblendmpd %zmm26,%zmm27,%zmm28"); 6428c2ecf20Sopenharmony_ci 6438c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 66 */ 6448c2ecf20Sopenharmony_ci 6458c2ecf20Sopenharmony_ci asm volatile("vpblendmb %zmm26,%zmm27,%zmm28"); 6468c2ecf20Sopenharmony_ci asm volatile("vpblendmw %zmm26,%zmm27,%zmm28"); 6478c2ecf20Sopenharmony_ci 6488c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 68 */ 6498c2ecf20Sopenharmony_ci 6508c2ecf20Sopenharmony_ci asm volatile("vp2intersectd %xmm1, %xmm2, %k3"); 6518c2ecf20Sopenharmony_ci asm volatile("vp2intersectd %ymm1, %ymm2, %k3"); 6528c2ecf20Sopenharmony_ci asm volatile("vp2intersectd %zmm1, %zmm2, %k3"); 6538c2ecf20Sopenharmony_ci asm volatile("vp2intersectd 0x12345678(%rax,%rcx,8),%zmm2,%k3"); 6548c2ecf20Sopenharmony_ci asm volatile("vp2intersectd 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 6558c2ecf20Sopenharmony_ci 6568c2ecf20Sopenharmony_ci asm volatile("vp2intersectq %xmm1, %xmm2, %k3"); 6578c2ecf20Sopenharmony_ci asm volatile("vp2intersectq %ymm1, %ymm2, %k3"); 6588c2ecf20Sopenharmony_ci asm volatile("vp2intersectq %zmm1, %zmm2, %k3"); 6598c2ecf20Sopenharmony_ci asm volatile("vp2intersectq 0x12345678(%rax,%rcx,8),%zmm2,%k3"); 6608c2ecf20Sopenharmony_ci asm volatile("vp2intersectq 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 6618c2ecf20Sopenharmony_ci 6628c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 70 */ 6638c2ecf20Sopenharmony_ci 6648c2ecf20Sopenharmony_ci asm volatile("vpshldvw %xmm1, %xmm2, %xmm3"); 6658c2ecf20Sopenharmony_ci asm volatile("vpshldvw %ymm1, %ymm2, %ymm3"); 6668c2ecf20Sopenharmony_ci asm volatile("vpshldvw %zmm1, %zmm2, %zmm3"); 6678c2ecf20Sopenharmony_ci asm volatile("vpshldvw 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 6688c2ecf20Sopenharmony_ci asm volatile("vpshldvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 6698c2ecf20Sopenharmony_ci 
6708c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 71 */ 6718c2ecf20Sopenharmony_ci 6728c2ecf20Sopenharmony_ci asm volatile("vpshldvd %xmm1, %xmm2, %xmm3"); 6738c2ecf20Sopenharmony_ci asm volatile("vpshldvd %ymm1, %ymm2, %ymm3"); 6748c2ecf20Sopenharmony_ci asm volatile("vpshldvd %zmm1, %zmm2, %zmm3"); 6758c2ecf20Sopenharmony_ci asm volatile("vpshldvd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 6768c2ecf20Sopenharmony_ci asm volatile("vpshldvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 6778c2ecf20Sopenharmony_ci 6788c2ecf20Sopenharmony_ci asm volatile("vpshldvq %xmm1, %xmm2, %xmm3"); 6798c2ecf20Sopenharmony_ci asm volatile("vpshldvq %ymm1, %ymm2, %ymm3"); 6808c2ecf20Sopenharmony_ci asm volatile("vpshldvq %zmm1, %zmm2, %zmm3"); 6818c2ecf20Sopenharmony_ci asm volatile("vpshldvq 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 6828c2ecf20Sopenharmony_ci asm volatile("vpshldvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 6838c2ecf20Sopenharmony_ci 6848c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 72 */ 6858c2ecf20Sopenharmony_ci 6868c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 %xmm1, %xmm2, %xmm3"); 6878c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 %ymm1, %ymm2, %ymm3"); 6888c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 %zmm1, %zmm2, %zmm3"); 6898c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 6908c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 6918c2ecf20Sopenharmony_ci 6928c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 %xmm1, %xmm2"); 6938c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 %ymm1, %xmm2"); 6948c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 %zmm1, %ymm2"); 6958c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 0x12345678(%rax,%rcx,8),%ymm2"); 6968c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 0x12345678(%eax,%ecx,8),%ymm2"); 6978c2ecf20Sopenharmony_ci 6988c2ecf20Sopenharmony_ci asm volatile("vpshrdvw %xmm1, %xmm2, %xmm3"); 6998c2ecf20Sopenharmony_ci asm 
volatile("vpshrdvw %ymm1, %ymm2, %ymm3"); 7008c2ecf20Sopenharmony_ci asm volatile("vpshrdvw %zmm1, %zmm2, %zmm3"); 7018c2ecf20Sopenharmony_ci asm volatile("vpshrdvw 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 7028c2ecf20Sopenharmony_ci asm volatile("vpshrdvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 7038c2ecf20Sopenharmony_ci 7048c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 73 */ 7058c2ecf20Sopenharmony_ci 7068c2ecf20Sopenharmony_ci asm volatile("vpshrdvd %xmm1, %xmm2, %xmm3"); 7078c2ecf20Sopenharmony_ci asm volatile("vpshrdvd %ymm1, %ymm2, %ymm3"); 7088c2ecf20Sopenharmony_ci asm volatile("vpshrdvd %zmm1, %zmm2, %zmm3"); 7098c2ecf20Sopenharmony_ci asm volatile("vpshrdvd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 7108c2ecf20Sopenharmony_ci asm volatile("vpshrdvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 7118c2ecf20Sopenharmony_ci 7128c2ecf20Sopenharmony_ci asm volatile("vpshrdvq %xmm1, %xmm2, %xmm3"); 7138c2ecf20Sopenharmony_ci asm volatile("vpshrdvq %ymm1, %ymm2, %ymm3"); 7148c2ecf20Sopenharmony_ci asm volatile("vpshrdvq %zmm1, %zmm2, %zmm3"); 7158c2ecf20Sopenharmony_ci asm volatile("vpshrdvq 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 7168c2ecf20Sopenharmony_ci asm volatile("vpshrdvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 7178c2ecf20Sopenharmony_ci 7188c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 75 */ 7198c2ecf20Sopenharmony_ci 7208c2ecf20Sopenharmony_ci asm volatile("vpermi2b %zmm24,%zmm25,%zmm26"); 7218c2ecf20Sopenharmony_ci asm volatile("vpermi2w %zmm26,%zmm27,%zmm28"); 7228c2ecf20Sopenharmony_ci 7238c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 76 */ 7248c2ecf20Sopenharmony_ci 7258c2ecf20Sopenharmony_ci asm volatile("vpermi2d %zmm26,%zmm27,%zmm28"); 7268c2ecf20Sopenharmony_ci asm volatile("vpermi2q %zmm26,%zmm27,%zmm28"); 7278c2ecf20Sopenharmony_ci 7288c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 77 */ 7298c2ecf20Sopenharmony_ci 7308c2ecf20Sopenharmony_ci asm volatile("vpermi2ps %zmm26,%zmm27,%zmm28"); 7318c2ecf20Sopenharmony_ci asm volatile("vpermi2pd 
%zmm26,%zmm27,%zmm28"); 7328c2ecf20Sopenharmony_ci 7338c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7a */ 7348c2ecf20Sopenharmony_ci 7358c2ecf20Sopenharmony_ci asm volatile("vpbroadcastb %eax,%xmm30"); 7368c2ecf20Sopenharmony_ci 7378c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7b */ 7388c2ecf20Sopenharmony_ci 7398c2ecf20Sopenharmony_ci asm volatile("vpbroadcastw %eax,%xmm30"); 7408c2ecf20Sopenharmony_ci 7418c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7c */ 7428c2ecf20Sopenharmony_ci 7438c2ecf20Sopenharmony_ci asm volatile("vpbroadcastd %eax,%xmm30"); 7448c2ecf20Sopenharmony_ci asm volatile("vpbroadcastq %rax,%zmm30"); 7458c2ecf20Sopenharmony_ci 7468c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7d */ 7478c2ecf20Sopenharmony_ci 7488c2ecf20Sopenharmony_ci asm volatile("vpermt2b %zmm26,%zmm27,%zmm28"); 7498c2ecf20Sopenharmony_ci asm volatile("vpermt2w %zmm26,%zmm27,%zmm28"); 7508c2ecf20Sopenharmony_ci 7518c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7e */ 7528c2ecf20Sopenharmony_ci 7538c2ecf20Sopenharmony_ci asm volatile("vpermt2d %zmm26,%zmm27,%zmm28"); 7548c2ecf20Sopenharmony_ci asm volatile("vpermt2q %zmm26,%zmm27,%zmm28"); 7558c2ecf20Sopenharmony_ci 7568c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7f */ 7578c2ecf20Sopenharmony_ci 7588c2ecf20Sopenharmony_ci asm volatile("vpermt2ps %zmm26,%zmm27,%zmm28"); 7598c2ecf20Sopenharmony_ci asm volatile("vpermt2pd %zmm26,%zmm27,%zmm28"); 7608c2ecf20Sopenharmony_ci 7618c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 83 */ 7628c2ecf20Sopenharmony_ci 7638c2ecf20Sopenharmony_ci asm volatile("vpmultishiftqb %zmm26,%zmm27,%zmm28"); 7648c2ecf20Sopenharmony_ci 7658c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 88 */ 7668c2ecf20Sopenharmony_ci 7678c2ecf20Sopenharmony_ci asm volatile("vexpandps (%rcx),%zmm26"); 7688c2ecf20Sopenharmony_ci asm volatile("vexpandpd (%rcx),%zmm28"); 7698c2ecf20Sopenharmony_ci 7708c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 89 */ 7718c2ecf20Sopenharmony_ci 
7728c2ecf20Sopenharmony_ci asm volatile("vpexpandd (%rcx),%zmm28"); 7738c2ecf20Sopenharmony_ci asm volatile("vpexpandq (%rcx),%zmm26"); 7748c2ecf20Sopenharmony_ci 7758c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8a */ 7768c2ecf20Sopenharmony_ci 7778c2ecf20Sopenharmony_ci asm volatile("vcompressps %zmm28,(%rcx)"); 7788c2ecf20Sopenharmony_ci asm volatile("vcompresspd %zmm28,(%rcx)"); 7798c2ecf20Sopenharmony_ci 7808c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8b */ 7818c2ecf20Sopenharmony_ci 7828c2ecf20Sopenharmony_ci asm volatile("vpcompressd %zmm28,(%rcx)"); 7838c2ecf20Sopenharmony_ci asm volatile("vpcompressq %zmm26,(%rcx)"); 7848c2ecf20Sopenharmony_ci 7858c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8d */ 7868c2ecf20Sopenharmony_ci 7878c2ecf20Sopenharmony_ci asm volatile("vpermb %zmm26,%zmm27,%zmm28"); 7888c2ecf20Sopenharmony_ci asm volatile("vpermw %zmm26,%zmm27,%zmm28"); 7898c2ecf20Sopenharmony_ci 7908c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8f */ 7918c2ecf20Sopenharmony_ci 7928c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb %xmm1, %xmm2, %k3"); 7938c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb %ymm1, %ymm2, %k3"); 7948c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb %zmm1, %zmm2, %k3"); 7958c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb 0x12345678(%rax,%rcx,8),%zmm2,%k3"); 7968c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 7978c2ecf20Sopenharmony_ci 7988c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 90 */ 7998c2ecf20Sopenharmony_ci 8008c2ecf20Sopenharmony_ci asm volatile("vpgatherdd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 8018c2ecf20Sopenharmony_ci asm volatile("vpgatherdq %xmm2,0x04(%rbp,%xmm7,2),%xmm1"); 8028c2ecf20Sopenharmony_ci asm volatile("vpgatherdd 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 8038c2ecf20Sopenharmony_ci asm volatile("vpgatherdq 0x7b(%rbp,%ymm27,8),%zmm26{%k1}"); 8048c2ecf20Sopenharmony_ci 8058c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 91 */ 8068c2ecf20Sopenharmony_ci 
8078c2ecf20Sopenharmony_ci asm volatile("vpgatherqd %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 8088c2ecf20Sopenharmony_ci asm volatile("vpgatherqq %xmm2,0x02(%rbp,%xmm7,2),%xmm1"); 8098c2ecf20Sopenharmony_ci asm volatile("vpgatherqd 0x7b(%rbp,%zmm27,8),%ymm26{%k1}"); 8108c2ecf20Sopenharmony_ci asm volatile("vpgatherqq 0x7b(%rbp,%zmm27,8),%zmm26{%k1}"); 8118c2ecf20Sopenharmony_ci 8128c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 9a */ 8138c2ecf20Sopenharmony_ci 8148c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps %xmm1, %xmm2, %xmm3"); 8158c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps %ymm1, %ymm2, %ymm3"); 8168c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps %zmm1, %zmm2, %zmm3"); 8178c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 8188c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 8198c2ecf20Sopenharmony_ci 8208c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd %xmm1, %xmm2, %xmm3"); 8218c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd %ymm1, %ymm2, %ymm3"); 8228c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd %zmm1, %zmm2, %zmm3"); 8238c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 8248c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 8258c2ecf20Sopenharmony_ci 8268c2ecf20Sopenharmony_ci asm volatile("v4fmaddps (%rax), %zmm0, %zmm4"); 8278c2ecf20Sopenharmony_ci asm volatile("v4fmaddps (%eax), %zmm0, %zmm4"); 8288c2ecf20Sopenharmony_ci asm volatile("v4fmaddps 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 8298c2ecf20Sopenharmony_ci asm volatile("v4fmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 8308c2ecf20Sopenharmony_ci 8318c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 9b */ 8328c2ecf20Sopenharmony_ci 8338c2ecf20Sopenharmony_ci asm volatile("vfmsub132ss %xmm1, %xmm2, %xmm3"); 8348c2ecf20Sopenharmony_ci asm volatile("vfmsub132ss 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 8358c2ecf20Sopenharmony_ci asm 
volatile("vfmsub132ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 8368c2ecf20Sopenharmony_ci 8378c2ecf20Sopenharmony_ci asm volatile("vfmsub132sd %xmm1, %xmm2, %xmm3"); 8388c2ecf20Sopenharmony_ci asm volatile("vfmsub132sd 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 8398c2ecf20Sopenharmony_ci asm volatile("vfmsub132sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 8408c2ecf20Sopenharmony_ci 8418c2ecf20Sopenharmony_ci asm volatile("v4fmaddss (%rax), %xmm0, %xmm4"); 8428c2ecf20Sopenharmony_ci asm volatile("v4fmaddss (%eax), %xmm0, %xmm4"); 8438c2ecf20Sopenharmony_ci asm volatile("v4fmaddss 0x12345678(%rax,%rcx,8),%xmm0,%xmm4"); 8448c2ecf20Sopenharmony_ci asm volatile("v4fmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 8458c2ecf20Sopenharmony_ci 8468c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a0 */ 8478c2ecf20Sopenharmony_ci 8488c2ecf20Sopenharmony_ci asm volatile("vpscatterdd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 8498c2ecf20Sopenharmony_ci asm volatile("vpscatterdq %zmm26,0x7b(%rbp,%ymm27,8){%k1}"); 8508c2ecf20Sopenharmony_ci 8518c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a1 */ 8528c2ecf20Sopenharmony_ci 8538c2ecf20Sopenharmony_ci asm volatile("vpscatterqd %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 8548c2ecf20Sopenharmony_ci asm volatile("vpscatterqq %ymm6,0x7b(%rbp,%ymm27,8){%k1}"); 8558c2ecf20Sopenharmony_ci 8568c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a2 */ 8578c2ecf20Sopenharmony_ci 8588c2ecf20Sopenharmony_ci asm volatile("vscatterdps %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 8598c2ecf20Sopenharmony_ci asm volatile("vscatterdpd %zmm28,0x7b(%rbp,%ymm27,8){%k1}"); 8608c2ecf20Sopenharmony_ci 8618c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a3 */ 8628c2ecf20Sopenharmony_ci 8638c2ecf20Sopenharmony_ci asm volatile("vscatterqps %ymm6,0x7b(%rbp,%zmm29,8){%k1}"); 8648c2ecf20Sopenharmony_ci asm volatile("vscatterqpd %zmm28,0x7b(%rbp,%zmm29,8){%k1}"); 8658c2ecf20Sopenharmony_ci 8668c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 aa */ 8678c2ecf20Sopenharmony_ci 8688c2ecf20Sopenharmony_ci 
asm volatile("vfmsub213ps %xmm1, %xmm2, %xmm3"); 8698c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps %ymm1, %ymm2, %ymm3"); 8708c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps %zmm1, %zmm2, %zmm3"); 8718c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 8728c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 8738c2ecf20Sopenharmony_ci 8748c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd %xmm1, %xmm2, %xmm3"); 8758c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd %ymm1, %ymm2, %ymm3"); 8768c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd %zmm1, %zmm2, %zmm3"); 8778c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 8788c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 8798c2ecf20Sopenharmony_ci 8808c2ecf20Sopenharmony_ci asm volatile("v4fnmaddps (%rax), %zmm0, %zmm4"); 8818c2ecf20Sopenharmony_ci asm volatile("v4fnmaddps (%eax), %zmm0, %zmm4"); 8828c2ecf20Sopenharmony_ci asm volatile("v4fnmaddps 0x12345678(%rax,%rcx,8),%zmm0,%zmm4"); 8838c2ecf20Sopenharmony_ci asm volatile("v4fnmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 8848c2ecf20Sopenharmony_ci 8858c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 ab */ 8868c2ecf20Sopenharmony_ci 8878c2ecf20Sopenharmony_ci asm volatile("vfmsub213ss %xmm1, %xmm2, %xmm3"); 8888c2ecf20Sopenharmony_ci asm volatile("vfmsub213ss 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 8898c2ecf20Sopenharmony_ci asm volatile("vfmsub213ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 8908c2ecf20Sopenharmony_ci 8918c2ecf20Sopenharmony_ci asm volatile("vfmsub213sd %xmm1, %xmm2, %xmm3"); 8928c2ecf20Sopenharmony_ci asm volatile("vfmsub213sd 0x12345678(%rax,%rcx,8),%xmm2,%xmm3"); 8938c2ecf20Sopenharmony_ci asm volatile("vfmsub213sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 8948c2ecf20Sopenharmony_ci 8958c2ecf20Sopenharmony_ci asm volatile("v4fnmaddss (%rax), %xmm0, %xmm4"); 8968c2ecf20Sopenharmony_ci asm volatile("v4fnmaddss 
(%eax), %xmm0, %xmm4"); 8978c2ecf20Sopenharmony_ci asm volatile("v4fnmaddss 0x12345678(%rax,%rcx,8),%xmm0,%xmm4"); 8988c2ecf20Sopenharmony_ci asm volatile("v4fnmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 8998c2ecf20Sopenharmony_ci 9008c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 b4 */ 9018c2ecf20Sopenharmony_ci 9028c2ecf20Sopenharmony_ci asm volatile("vpmadd52luq %zmm26,%zmm27,%zmm28"); 9038c2ecf20Sopenharmony_ci 9048c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 b5 */ 9058c2ecf20Sopenharmony_ci 9068c2ecf20Sopenharmony_ci asm volatile("vpmadd52huq %zmm26,%zmm27,%zmm28"); 9078c2ecf20Sopenharmony_ci 9088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c4 */ 9098c2ecf20Sopenharmony_ci 9108c2ecf20Sopenharmony_ci asm volatile("vpconflictd %zmm26,%zmm27"); 9118c2ecf20Sopenharmony_ci asm volatile("vpconflictq %zmm26,%zmm27"); 9128c2ecf20Sopenharmony_ci 9138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c8 */ 9148c2ecf20Sopenharmony_ci 9158c2ecf20Sopenharmony_ci asm volatile("vexp2ps %zmm29,%zmm30"); 9168c2ecf20Sopenharmony_ci asm volatile("vexp2pd %zmm26,%zmm27"); 9178c2ecf20Sopenharmony_ci 9188c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 ca */ 9198c2ecf20Sopenharmony_ci 9208c2ecf20Sopenharmony_ci asm volatile("vrcp28ps %zmm29,%zmm30"); 9218c2ecf20Sopenharmony_ci asm volatile("vrcp28pd %zmm26,%zmm27"); 9228c2ecf20Sopenharmony_ci 9238c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cb */ 9248c2ecf20Sopenharmony_ci 9258c2ecf20Sopenharmony_ci asm volatile("vrcp28ss %xmm28,%xmm29,%xmm30{%k7}"); 9268c2ecf20Sopenharmony_ci asm volatile("vrcp28sd %xmm25,%xmm26,%xmm27{%k7}"); 9278c2ecf20Sopenharmony_ci 9288c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cc */ 9298c2ecf20Sopenharmony_ci 9308c2ecf20Sopenharmony_ci asm volatile("vrsqrt28ps %zmm29,%zmm30"); 9318c2ecf20Sopenharmony_ci asm volatile("vrsqrt28pd %zmm26,%zmm27"); 9328c2ecf20Sopenharmony_ci 9338c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cd */ 9348c2ecf20Sopenharmony_ci 9358c2ecf20Sopenharmony_ci asm 
volatile("vrsqrt28ss %xmm28,%xmm29,%xmm30{%k7}"); 9368c2ecf20Sopenharmony_ci asm volatile("vrsqrt28sd %xmm25,%xmm26,%xmm27{%k7}"); 9378c2ecf20Sopenharmony_ci 9388c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cf */ 9398c2ecf20Sopenharmony_ci 9408c2ecf20Sopenharmony_ci asm volatile("gf2p8mulb %xmm1, %xmm3"); 9418c2ecf20Sopenharmony_ci asm volatile("gf2p8mulb 0x12345678(%rax,%rcx,8),%xmm3"); 9428c2ecf20Sopenharmony_ci asm volatile("gf2p8mulb 0x12345678(%eax,%ecx,8),%xmm3"); 9438c2ecf20Sopenharmony_ci 9448c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb %xmm1, %xmm2, %xmm3"); 9458c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb %ymm1, %ymm2, %ymm3"); 9468c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb %zmm1, %zmm2, %zmm3"); 9478c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 9488c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 9498c2ecf20Sopenharmony_ci 9508c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 dc */ 9518c2ecf20Sopenharmony_ci 9528c2ecf20Sopenharmony_ci asm volatile("vaesenc %xmm1, %xmm2, %xmm3"); 9538c2ecf20Sopenharmony_ci asm volatile("vaesenc %ymm1, %ymm2, %ymm3"); 9548c2ecf20Sopenharmony_ci asm volatile("vaesenc %zmm1, %zmm2, %zmm3"); 9558c2ecf20Sopenharmony_ci asm volatile("vaesenc 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 9568c2ecf20Sopenharmony_ci asm volatile("vaesenc 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 9578c2ecf20Sopenharmony_ci 9588c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 dd */ 9598c2ecf20Sopenharmony_ci 9608c2ecf20Sopenharmony_ci asm volatile("vaesenclast %xmm1, %xmm2, %xmm3"); 9618c2ecf20Sopenharmony_ci asm volatile("vaesenclast %ymm1, %ymm2, %ymm3"); 9628c2ecf20Sopenharmony_ci asm volatile("vaesenclast %zmm1, %zmm2, %zmm3"); 9638c2ecf20Sopenharmony_ci asm volatile("vaesenclast 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 9648c2ecf20Sopenharmony_ci asm volatile("vaesenclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 9658c2ecf20Sopenharmony_ci 9668c2ecf20Sopenharmony_ci /* 
AVX-512: Op code 0f 38 de */ 9678c2ecf20Sopenharmony_ci 9688c2ecf20Sopenharmony_ci asm volatile("vaesdec %xmm1, %xmm2, %xmm3"); 9698c2ecf20Sopenharmony_ci asm volatile("vaesdec %ymm1, %ymm2, %ymm3"); 9708c2ecf20Sopenharmony_ci asm volatile("vaesdec %zmm1, %zmm2, %zmm3"); 9718c2ecf20Sopenharmony_ci asm volatile("vaesdec 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 9728c2ecf20Sopenharmony_ci asm volatile("vaesdec 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 9738c2ecf20Sopenharmony_ci 9748c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 df */ 9758c2ecf20Sopenharmony_ci 9768c2ecf20Sopenharmony_ci asm volatile("vaesdeclast %xmm1, %xmm2, %xmm3"); 9778c2ecf20Sopenharmony_ci asm volatile("vaesdeclast %ymm1, %ymm2, %ymm3"); 9788c2ecf20Sopenharmony_ci asm volatile("vaesdeclast %zmm1, %zmm2, %zmm3"); 9798c2ecf20Sopenharmony_ci asm volatile("vaesdeclast 0x12345678(%rax,%rcx,8),%zmm2,%zmm3"); 9808c2ecf20Sopenharmony_ci asm volatile("vaesdeclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 9818c2ecf20Sopenharmony_ci 9828c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 03 */ 9838c2ecf20Sopenharmony_ci 9848c2ecf20Sopenharmony_ci asm volatile("valignd $0x12,%zmm28,%zmm29,%zmm30"); 9858c2ecf20Sopenharmony_ci asm volatile("valignq $0x12,%zmm25,%zmm26,%zmm27"); 9868c2ecf20Sopenharmony_ci 9878c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 08 */ 9888c2ecf20Sopenharmony_ci 9898c2ecf20Sopenharmony_ci asm volatile("vroundps $0x5,%ymm6,%ymm2"); 9908c2ecf20Sopenharmony_ci asm volatile("vrndscaleps $0x12,%zmm25,%zmm26"); 9918c2ecf20Sopenharmony_ci 9928c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 09 */ 9938c2ecf20Sopenharmony_ci 9948c2ecf20Sopenharmony_ci asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 9958c2ecf20Sopenharmony_ci asm volatile("vrndscalepd $0x12,%zmm25,%zmm26"); 9968c2ecf20Sopenharmony_ci 9978c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 0a */ 9988c2ecf20Sopenharmony_ci 9998c2ecf20Sopenharmony_ci asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 10008c2ecf20Sopenharmony_ci asm
volatile("vrndscaless $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 10018c2ecf20Sopenharmony_ci 10028c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 0b */ 10038c2ecf20Sopenharmony_ci 10048c2ecf20Sopenharmony_ci asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 10058c2ecf20Sopenharmony_ci asm volatile("vrndscalesd $0x12,%xmm24,%xmm25,%xmm26{%k7}"); 10068c2ecf20Sopenharmony_ci 10078c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 18 */ 10088c2ecf20Sopenharmony_ci 10098c2ecf20Sopenharmony_ci asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 10108c2ecf20Sopenharmony_ci asm volatile("vinsertf32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 10118c2ecf20Sopenharmony_ci asm volatile("vinsertf64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 10128c2ecf20Sopenharmony_ci 10138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 19 */ 10148c2ecf20Sopenharmony_ci 10158c2ecf20Sopenharmony_ci asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 10168c2ecf20Sopenharmony_ci asm volatile("vextractf32x4 $0x12,%zmm25,%xmm26{%k7}"); 10178c2ecf20Sopenharmony_ci asm volatile("vextractf64x2 $0x12,%zmm25,%xmm26{%k7}"); 10188c2ecf20Sopenharmony_ci 10198c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1a */ 10208c2ecf20Sopenharmony_ci 10218c2ecf20Sopenharmony_ci asm volatile("vinsertf32x8 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 10228c2ecf20Sopenharmony_ci asm volatile("vinsertf64x4 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 10238c2ecf20Sopenharmony_ci 10248c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1b */ 10258c2ecf20Sopenharmony_ci 10268c2ecf20Sopenharmony_ci asm volatile("vextractf32x8 $0x12,%zmm29,%ymm30{%k7}"); 10278c2ecf20Sopenharmony_ci asm volatile("vextractf64x4 $0x12,%zmm26,%ymm27{%k7}"); 10288c2ecf20Sopenharmony_ci 10298c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1e */ 10308c2ecf20Sopenharmony_ci 10318c2ecf20Sopenharmony_ci asm volatile("vpcmpud $0x12,%zmm29,%zmm30,%k5"); 10328c2ecf20Sopenharmony_ci asm volatile("vpcmpuq $0x12,%zmm26,%zmm27,%k5"); 10338c2ecf20Sopenharmony_ci 10348c2ecf20Sopenharmony_ci /* AVX-512: Op code 
0f 3a 1f */ 10358c2ecf20Sopenharmony_ci 10368c2ecf20Sopenharmony_ci asm volatile("vpcmpd $0x12,%zmm29,%zmm30,%k5"); 10378c2ecf20Sopenharmony_ci asm volatile("vpcmpq $0x12,%zmm26,%zmm27,%k5"); 10388c2ecf20Sopenharmony_ci 10398c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 23 */ 10408c2ecf20Sopenharmony_ci 10418c2ecf20Sopenharmony_ci asm volatile("vshuff32x4 $0x12,%zmm28,%zmm29,%zmm30"); 10428c2ecf20Sopenharmony_ci asm volatile("vshuff64x2 $0x12,%zmm25,%zmm26,%zmm27"); 10438c2ecf20Sopenharmony_ci 10448c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 25 */ 10458c2ecf20Sopenharmony_ci 10468c2ecf20Sopenharmony_ci asm volatile("vpternlogd $0x12,%zmm28,%zmm29,%zmm30"); 10478c2ecf20Sopenharmony_ci asm volatile("vpternlogq $0x12,%zmm28,%zmm29,%zmm30"); 10488c2ecf20Sopenharmony_ci 10498c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 26 */ 10508c2ecf20Sopenharmony_ci 10518c2ecf20Sopenharmony_ci asm volatile("vgetmantps $0x12,%zmm26,%zmm27"); 10528c2ecf20Sopenharmony_ci asm volatile("vgetmantpd $0x12,%zmm29,%zmm30"); 10538c2ecf20Sopenharmony_ci 10548c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 27 */ 10558c2ecf20Sopenharmony_ci 10568c2ecf20Sopenharmony_ci asm volatile("vgetmantss $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 10578c2ecf20Sopenharmony_ci asm volatile("vgetmantsd $0x12,%xmm28,%xmm29,%xmm30{%k7}"); 10588c2ecf20Sopenharmony_ci 10598c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 38 */ 10608c2ecf20Sopenharmony_ci 10618c2ecf20Sopenharmony_ci asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 10628c2ecf20Sopenharmony_ci asm volatile("vinserti32x4 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 10638c2ecf20Sopenharmony_ci asm volatile("vinserti64x2 $0x12,%xmm24,%zmm25,%zmm26{%k7}"); 10648c2ecf20Sopenharmony_ci 10658c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 39 */ 10668c2ecf20Sopenharmony_ci 10678c2ecf20Sopenharmony_ci asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 10688c2ecf20Sopenharmony_ci asm volatile("vextracti32x4 $0x12,%zmm25,%xmm26{%k7}"); 10698c2ecf20Sopenharmony_ci asm 
volatile("vextracti64x2 $0x12,%zmm25,%xmm26{%k7}"); 10708c2ecf20Sopenharmony_ci 10718c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3a */ 10728c2ecf20Sopenharmony_ci 10738c2ecf20Sopenharmony_ci asm volatile("vinserti32x8 $0x12,%ymm28,%zmm29,%zmm30{%k7}"); 10748c2ecf20Sopenharmony_ci asm volatile("vinserti64x4 $0x12,%ymm25,%zmm26,%zmm27{%k7}"); 10758c2ecf20Sopenharmony_ci 10768c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3b */ 10778c2ecf20Sopenharmony_ci 10788c2ecf20Sopenharmony_ci asm volatile("vextracti32x8 $0x12,%zmm29,%ymm30{%k7}"); 10798c2ecf20Sopenharmony_ci asm volatile("vextracti64x4 $0x12,%zmm26,%ymm27{%k7}"); 10808c2ecf20Sopenharmony_ci 10818c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3e */ 10828c2ecf20Sopenharmony_ci 10838c2ecf20Sopenharmony_ci asm volatile("vpcmpub $0x12,%zmm29,%zmm30,%k5"); 10848c2ecf20Sopenharmony_ci asm volatile("vpcmpuw $0x12,%zmm26,%zmm27,%k5"); 10858c2ecf20Sopenharmony_ci 10868c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3f */ 10878c2ecf20Sopenharmony_ci 10888c2ecf20Sopenharmony_ci asm volatile("vpcmpb $0x12,%zmm29,%zmm30,%k5"); 10898c2ecf20Sopenharmony_ci asm volatile("vpcmpw $0x12,%zmm26,%zmm27,%k5"); 10908c2ecf20Sopenharmony_ci 10918c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 42 */ 10928c2ecf20Sopenharmony_ci 10938c2ecf20Sopenharmony_ci asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 10948c2ecf20Sopenharmony_ci asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 10958c2ecf20Sopenharmony_ci 10968c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 43 */ 10978c2ecf20Sopenharmony_ci 10988c2ecf20Sopenharmony_ci asm volatile("vshufi32x4 $0x12,%zmm25,%zmm26,%zmm27"); 10998c2ecf20Sopenharmony_ci asm volatile("vshufi64x2 $0x12,%zmm28,%zmm29,%zmm30"); 11008c2ecf20Sopenharmony_ci 11018c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 44 */ 11028c2ecf20Sopenharmony_ci 11038c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%xmm1,%xmm2,%xmm3"); 11048c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%ymm1,%ymm2,%ymm3"); 
11058c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%zmm1,%zmm2,%zmm3"); 11068c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%zmm25,%zmm26,%zmm27"); 11078c2ecf20Sopenharmony_ci 11088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 50 */ 11098c2ecf20Sopenharmony_ci 11108c2ecf20Sopenharmony_ci asm volatile("vrangeps $0x12,%zmm25,%zmm26,%zmm27"); 11118c2ecf20Sopenharmony_ci asm volatile("vrangepd $0x12,%zmm28,%zmm29,%zmm30"); 11128c2ecf20Sopenharmony_ci 11138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 51 */ 11148c2ecf20Sopenharmony_ci 11158c2ecf20Sopenharmony_ci asm volatile("vrangess $0x12,%xmm25,%xmm26,%xmm27"); 11168c2ecf20Sopenharmony_ci asm volatile("vrangesd $0x12,%xmm28,%xmm29,%xmm30"); 11178c2ecf20Sopenharmony_ci 11188c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 54 */ 11198c2ecf20Sopenharmony_ci 11208c2ecf20Sopenharmony_ci asm volatile("vfixupimmps $0x12,%zmm28,%zmm29,%zmm30"); 11218c2ecf20Sopenharmony_ci asm volatile("vfixupimmpd $0x12,%zmm25,%zmm26,%zmm27"); 11228c2ecf20Sopenharmony_ci 11238c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 55 */ 11248c2ecf20Sopenharmony_ci 11258c2ecf20Sopenharmony_ci asm volatile("vfixupimmss $0x12,%xmm28,%xmm29,%xmm30{%k7}"); 11268c2ecf20Sopenharmony_ci asm volatile("vfixupimmsd $0x12,%xmm25,%xmm26,%xmm27{%k7}"); 11278c2ecf20Sopenharmony_ci 11288c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 56 */ 11298c2ecf20Sopenharmony_ci 11308c2ecf20Sopenharmony_ci asm volatile("vreduceps $0x12,%zmm26,%zmm27"); 11318c2ecf20Sopenharmony_ci asm volatile("vreducepd $0x12,%zmm29,%zmm30"); 11328c2ecf20Sopenharmony_ci 11338c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 57 */ 11348c2ecf20Sopenharmony_ci 11358c2ecf20Sopenharmony_ci asm volatile("vreducess $0x12,%xmm25,%xmm26,%xmm27"); 11368c2ecf20Sopenharmony_ci asm volatile("vreducesd $0x12,%xmm28,%xmm29,%xmm30"); 11378c2ecf20Sopenharmony_ci 11388c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 66 */ 11398c2ecf20Sopenharmony_ci 11408c2ecf20Sopenharmony_ci asm 
volatile("vfpclassps $0x12,%zmm27,%k5"); 11418c2ecf20Sopenharmony_ci asm volatile("vfpclasspd $0x12,%zmm30,%k5"); 11428c2ecf20Sopenharmony_ci 11438c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 67 */ 11448c2ecf20Sopenharmony_ci 11458c2ecf20Sopenharmony_ci asm volatile("vfpclassss $0x12,%xmm27,%k5"); 11468c2ecf20Sopenharmony_ci asm volatile("vfpclasssd $0x12,%xmm30,%k5"); 11478c2ecf20Sopenharmony_ci 11488c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 70 */ 11498c2ecf20Sopenharmony_ci 11508c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%xmm1,%xmm2,%xmm3"); 11518c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%ymm1,%ymm2,%ymm3"); 11528c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%zmm1,%zmm2,%zmm3"); 11538c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%zmm25,%zmm26,%zmm27"); 11548c2ecf20Sopenharmony_ci 11558c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 71 */ 11568c2ecf20Sopenharmony_ci 11578c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%xmm1,%xmm2,%xmm3"); 11588c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%ymm1,%ymm2,%ymm3"); 11598c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%zmm1,%zmm2,%zmm3"); 11608c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%zmm25,%zmm26,%zmm27"); 11618c2ecf20Sopenharmony_ci 11628c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%xmm1,%xmm2,%xmm3"); 11638c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%ymm1,%ymm2,%ymm3"); 11648c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%zmm1,%zmm2,%zmm3"); 11658c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%zmm25,%zmm26,%zmm27"); 11668c2ecf20Sopenharmony_ci 11678c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 72 */ 11688c2ecf20Sopenharmony_ci 11698c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%xmm1,%xmm2,%xmm3"); 11708c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%ymm1,%ymm2,%ymm3"); 11718c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%zmm1,%zmm2,%zmm3"); 11728c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%zmm25,%zmm26,%zmm27"); 
11738c2ecf20Sopenharmony_ci 11748c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 73 */ 11758c2ecf20Sopenharmony_ci 11768c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%xmm1,%xmm2,%xmm3"); 11778c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%ymm1,%ymm2,%ymm3"); 11788c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%zmm1,%zmm2,%zmm3"); 11798c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%zmm25,%zmm26,%zmm27"); 11808c2ecf20Sopenharmony_ci 11818c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%xmm1,%xmm2,%xmm3"); 11828c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%ymm1,%ymm2,%ymm3"); 11838c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%zmm1,%zmm2,%zmm3"); 11848c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%zmm25,%zmm26,%zmm27"); 11858c2ecf20Sopenharmony_ci 11868c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a ce */ 11878c2ecf20Sopenharmony_ci 11888c2ecf20Sopenharmony_ci asm volatile("gf2p8affineqb $0x12,%xmm1,%xmm3"); 11898c2ecf20Sopenharmony_ci 11908c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%xmm1,%xmm2,%xmm3"); 11918c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%ymm1,%ymm2,%ymm3"); 11928c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%zmm1,%zmm2,%zmm3"); 11938c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%zmm25,%zmm26,%zmm27"); 11948c2ecf20Sopenharmony_ci 11958c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a cf */ 11968c2ecf20Sopenharmony_ci 11978c2ecf20Sopenharmony_ci asm volatile("gf2p8affineinvqb $0x12,%xmm1,%xmm3"); 11988c2ecf20Sopenharmony_ci 11998c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%xmm1,%xmm2,%xmm3"); 12008c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%ymm1,%ymm2,%ymm3"); 12018c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%zmm1,%zmm2,%zmm3"); 12028c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%zmm25,%zmm26,%zmm27"); 12038c2ecf20Sopenharmony_ci 12048c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 72 (Grp13) */ 
12058c2ecf20Sopenharmony_ci 12068c2ecf20Sopenharmony_ci asm volatile("vprord $0x12,%zmm25,%zmm26"); 12078c2ecf20Sopenharmony_ci asm volatile("vprorq $0x12,%zmm25,%zmm26"); 12088c2ecf20Sopenharmony_ci asm volatile("vprold $0x12,%zmm29,%zmm30"); 12098c2ecf20Sopenharmony_ci asm volatile("vprolq $0x12,%zmm29,%zmm30"); 12108c2ecf20Sopenharmony_ci asm volatile("psrad $0x2,%mm6"); 12118c2ecf20Sopenharmony_ci asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 12128c2ecf20Sopenharmony_ci asm volatile("vpsrad $0x5,%zmm26,%zmm22"); 12138c2ecf20Sopenharmony_ci asm volatile("vpsraq $0x5,%zmm26,%zmm22"); 12148c2ecf20Sopenharmony_ci 12158c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c6 (Grp18) */ 12168c2ecf20Sopenharmony_ci 12178c2ecf20Sopenharmony_ci asm volatile("vgatherpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 12188c2ecf20Sopenharmony_ci asm volatile("vgatherpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 12198c2ecf20Sopenharmony_ci asm volatile("vgatherpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 12208c2ecf20Sopenharmony_ci asm volatile("vgatherpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 12218c2ecf20Sopenharmony_ci asm volatile("vscatterpf0dps 0x7b(%r14,%zmm31,8){%k1}"); 12228c2ecf20Sopenharmony_ci asm volatile("vscatterpf0dpd 0x7b(%r14,%ymm31,8){%k1}"); 12238c2ecf20Sopenharmony_ci asm volatile("vscatterpf1dps 0x7b(%r14,%zmm31,8){%k1}"); 12248c2ecf20Sopenharmony_ci asm volatile("vscatterpf1dpd 0x7b(%r14,%ymm31,8){%k1}"); 12258c2ecf20Sopenharmony_ci 12268c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c7 (Grp19) */ 12278c2ecf20Sopenharmony_ci 12288c2ecf20Sopenharmony_ci asm volatile("vgatherpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 12298c2ecf20Sopenharmony_ci asm volatile("vgatherpf0qpd 0x7b(%r14,%zmm31,8){%k1}"); 12308c2ecf20Sopenharmony_ci asm volatile("vgatherpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 12318c2ecf20Sopenharmony_ci asm volatile("vgatherpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 12328c2ecf20Sopenharmony_ci asm volatile("vscatterpf0qps 0x7b(%r14,%zmm31,8){%k1}"); 12338c2ecf20Sopenharmony_ci asm volatile("vscatterpf0qpd 
0x7b(%r14,%zmm31,8){%k1}"); 12348c2ecf20Sopenharmony_ci asm volatile("vscatterpf1qps 0x7b(%r14,%zmm31,8){%k1}"); 12358c2ecf20Sopenharmony_ci asm volatile("vscatterpf1qpd 0x7b(%r14,%zmm31,8){%k1}"); 12368c2ecf20Sopenharmony_ci 12378c2ecf20Sopenharmony_ci /* AVX-512: Examples */ 12388c2ecf20Sopenharmony_ci 12398c2ecf20Sopenharmony_ci asm volatile("vaddpd %zmm28,%zmm29,%zmm30"); 12408c2ecf20Sopenharmony_ci asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}"); 12418c2ecf20Sopenharmony_ci asm volatile("vaddpd %zmm28,%zmm29,%zmm30{%k7}{z}"); 12428c2ecf20Sopenharmony_ci asm volatile("vaddpd {rn-sae},%zmm28,%zmm29,%zmm30"); 12438c2ecf20Sopenharmony_ci asm volatile("vaddpd {ru-sae},%zmm28,%zmm29,%zmm30"); 12448c2ecf20Sopenharmony_ci asm volatile("vaddpd {rd-sae},%zmm28,%zmm29,%zmm30"); 12458c2ecf20Sopenharmony_ci asm volatile("vaddpd {rz-sae},%zmm28,%zmm29,%zmm30"); 12468c2ecf20Sopenharmony_ci asm volatile("vaddpd (%rcx),%zmm29,%zmm30"); 12478c2ecf20Sopenharmony_ci asm volatile("vaddpd 0x123(%rax,%r14,8),%zmm29,%zmm30"); 12488c2ecf20Sopenharmony_ci asm volatile("vaddpd (%rcx){1to8},%zmm29,%zmm30"); 12498c2ecf20Sopenharmony_ci asm volatile("vaddpd 0x1fc0(%rdx),%zmm29,%zmm30"); 12508c2ecf20Sopenharmony_ci asm volatile("vaddpd 0x3f8(%rdx){1to8},%zmm29,%zmm30"); 12518c2ecf20Sopenharmony_ci asm volatile("vcmpeq_uqps 0x1fc(%rdx){1to16},%zmm30,%k5"); 12528c2ecf20Sopenharmony_ci asm volatile("vcmpltsd 0x123(%rax,%r14,8),%xmm29,%k5{%k7}"); 12538c2ecf20Sopenharmony_ci asm volatile("vcmplesd {sae},%xmm28,%xmm29,%k5{%k7}"); 12548c2ecf20Sopenharmony_ci asm volatile("vgetmantss $0x5b,0x123(%rax,%r14,8),%xmm29,%xmm30{%k7}"); 12558c2ecf20Sopenharmony_ci 12568c2ecf20Sopenharmony_ci /* bndmk m64, bnd */ 12578c2ecf20Sopenharmony_ci 12588c2ecf20Sopenharmony_ci asm volatile("bndmk (%rax), %bnd0"); 12598c2ecf20Sopenharmony_ci asm volatile("bndmk (%r8), %bnd0"); 12608c2ecf20Sopenharmony_ci asm volatile("bndmk (0x12345678), %bnd0"); 12618c2ecf20Sopenharmony_ci asm volatile("bndmk (%rax), %bnd3"); 
12628c2ecf20Sopenharmony_ci asm volatile("bndmk (%rcx,%rax,1), %bnd0"); 12638c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(,%rax,1), %bnd0"); 12648c2ecf20Sopenharmony_ci asm volatile("bndmk (%rax,%rcx,1), %bnd0"); 12658c2ecf20Sopenharmony_ci asm volatile("bndmk (%rax,%rcx,8), %bnd0"); 12668c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%rax), %bnd0"); 12678c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%rbp), %bnd0"); 12688c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%rcx,%rax,1), %bnd0"); 12698c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%rbp,%rax,1), %bnd0"); 12708c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%rax,%rcx,1), %bnd0"); 12718c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%rax,%rcx,8), %bnd0"); 12728c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%rax), %bnd0"); 12738c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%rbp), %bnd0"); 12748c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%rcx,%rax,1), %bnd0"); 12758c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%rbp,%rax,1), %bnd0"); 12768c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%rax,%rcx,1), %bnd0"); 12778c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%rax,%rcx,8), %bnd0"); 12788c2ecf20Sopenharmony_ci 12798c2ecf20Sopenharmony_ci /* bndcl r/m64, bnd */ 12808c2ecf20Sopenharmony_ci 12818c2ecf20Sopenharmony_ci asm volatile("bndcl (%rax), %bnd0"); 12828c2ecf20Sopenharmony_ci asm volatile("bndcl (%r8), %bnd0"); 12838c2ecf20Sopenharmony_ci asm volatile("bndcl (0x12345678), %bnd0"); 12848c2ecf20Sopenharmony_ci asm volatile("bndcl (%rax), %bnd3"); 12858c2ecf20Sopenharmony_ci asm volatile("bndcl (%rcx,%rax,1), %bnd0"); 12868c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(,%rax,1), %bnd0"); 12878c2ecf20Sopenharmony_ci asm volatile("bndcl (%rax,%rcx,1), %bnd0"); 12888c2ecf20Sopenharmony_ci asm volatile("bndcl (%rax,%rcx,8), %bnd0"); 12898c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%rax), %bnd0"); 12908c2ecf20Sopenharmony_ci asm volatile("bndcl 
0x12(%rbp), %bnd0"); 12918c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%rcx,%rax,1), %bnd0"); 12928c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%rbp,%rax,1), %bnd0"); 12938c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%rax,%rcx,1), %bnd0"); 12948c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%rax,%rcx,8), %bnd0"); 12958c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%rax), %bnd0"); 12968c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%rbp), %bnd0"); 12978c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%rcx,%rax,1), %bnd0"); 12988c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%rbp,%rax,1), %bnd0"); 12998c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%rax,%rcx,1), %bnd0"); 13008c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%rax,%rcx,8), %bnd0"); 13018c2ecf20Sopenharmony_ci asm volatile("bndcl %rax, %bnd0"); 13028c2ecf20Sopenharmony_ci 13038c2ecf20Sopenharmony_ci /* bndcu r/m64, bnd */ 13048c2ecf20Sopenharmony_ci 13058c2ecf20Sopenharmony_ci asm volatile("bndcu (%rax), %bnd0"); 13068c2ecf20Sopenharmony_ci asm volatile("bndcu (%r8), %bnd0"); 13078c2ecf20Sopenharmony_ci asm volatile("bndcu (0x12345678), %bnd0"); 13088c2ecf20Sopenharmony_ci asm volatile("bndcu (%rax), %bnd3"); 13098c2ecf20Sopenharmony_ci asm volatile("bndcu (%rcx,%rax,1), %bnd0"); 13108c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(,%rax,1), %bnd0"); 13118c2ecf20Sopenharmony_ci asm volatile("bndcu (%rax,%rcx,1), %bnd0"); 13128c2ecf20Sopenharmony_ci asm volatile("bndcu (%rax,%rcx,8), %bnd0"); 13138c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%rax), %bnd0"); 13148c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%rbp), %bnd0"); 13158c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%rcx,%rax,1), %bnd0"); 13168c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%rbp,%rax,1), %bnd0"); 13178c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%rax,%rcx,1), %bnd0"); 13188c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%rax,%rcx,8), %bnd0"); 
13198c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%rax), %bnd0"); 13208c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%rbp), %bnd0"); 13218c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%rcx,%rax,1), %bnd0"); 13228c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%rbp,%rax,1), %bnd0"); 13238c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%rax,%rcx,1), %bnd0"); 13248c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%rax,%rcx,8), %bnd0"); 13258c2ecf20Sopenharmony_ci asm volatile("bndcu %rax, %bnd0"); 13268c2ecf20Sopenharmony_ci 13278c2ecf20Sopenharmony_ci /* bndcn r/m64, bnd */ 13288c2ecf20Sopenharmony_ci 13298c2ecf20Sopenharmony_ci asm volatile("bndcn (%rax), %bnd0"); 13308c2ecf20Sopenharmony_ci asm volatile("bndcn (%r8), %bnd0"); 13318c2ecf20Sopenharmony_ci asm volatile("bndcn (0x12345678), %bnd0"); 13328c2ecf20Sopenharmony_ci asm volatile("bndcn (%rax), %bnd3"); 13338c2ecf20Sopenharmony_ci asm volatile("bndcn (%rcx,%rax,1), %bnd0"); 13348c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(,%rax,1), %bnd0"); 13358c2ecf20Sopenharmony_ci asm volatile("bndcn (%rax,%rcx,1), %bnd0"); 13368c2ecf20Sopenharmony_ci asm volatile("bndcn (%rax,%rcx,8), %bnd0"); 13378c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%rax), %bnd0"); 13388c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%rbp), %bnd0"); 13398c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%rcx,%rax,1), %bnd0"); 13408c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%rbp,%rax,1), %bnd0"); 13418c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%rax,%rcx,1), %bnd0"); 13428c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%rax,%rcx,8), %bnd0"); 13438c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%rax), %bnd0"); 13448c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%rbp), %bnd0"); 13458c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%rcx,%rax,1), %bnd0"); 13468c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%rbp,%rax,1), %bnd0"); 13478c2ecf20Sopenharmony_ci asm 
volatile("bndcn 0x12345678(%rax,%rcx,1), %bnd0"); 13488c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%rax,%rcx,8), %bnd0"); 13498c2ecf20Sopenharmony_ci asm volatile("bndcn %rax, %bnd0"); 13508c2ecf20Sopenharmony_ci 13518c2ecf20Sopenharmony_ci /* bndmov m128, bnd */ 13528c2ecf20Sopenharmony_ci 13538c2ecf20Sopenharmony_ci asm volatile("bndmov (%rax), %bnd0"); 13548c2ecf20Sopenharmony_ci asm volatile("bndmov (%r8), %bnd0"); 13558c2ecf20Sopenharmony_ci asm volatile("bndmov (0x12345678), %bnd0"); 13568c2ecf20Sopenharmony_ci asm volatile("bndmov (%rax), %bnd3"); 13578c2ecf20Sopenharmony_ci asm volatile("bndmov (%rcx,%rax,1), %bnd0"); 13588c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(,%rax,1), %bnd0"); 13598c2ecf20Sopenharmony_ci asm volatile("bndmov (%rax,%rcx,1), %bnd0"); 13608c2ecf20Sopenharmony_ci asm volatile("bndmov (%rax,%rcx,8), %bnd0"); 13618c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%rax), %bnd0"); 13628c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%rbp), %bnd0"); 13638c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%rcx,%rax,1), %bnd0"); 13648c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%rbp,%rax,1), %bnd0"); 13658c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%rax,%rcx,1), %bnd0"); 13668c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%rax,%rcx,8), %bnd0"); 13678c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%rax), %bnd0"); 13688c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%rbp), %bnd0"); 13698c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%rcx,%rax,1), %bnd0"); 13708c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%rbp,%rax,1), %bnd0"); 13718c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%rax,%rcx,1), %bnd0"); 13728c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%rax,%rcx,8), %bnd0"); 13738c2ecf20Sopenharmony_ci 13748c2ecf20Sopenharmony_ci /* bndmov bnd, m128 */ 13758c2ecf20Sopenharmony_ci 13768c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%rax)"); 
13778c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%r8)"); 13788c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (0x12345678)"); 13798c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd3, (%rax)"); 13808c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%rcx,%rax,1)"); 13818c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(,%rax,1)"); 13828c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%rax,%rcx,1)"); 13838c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%rax,%rcx,8)"); 13848c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%rax)"); 13858c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%rbp)"); 13868c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%rcx,%rax,1)"); 13878c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%rbp,%rax,1)"); 13888c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,1)"); 13898c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%rax,%rcx,8)"); 13908c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%rax)"); 13918c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%rbp)"); 13928c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%rcx,%rax,1)"); 13938c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%rbp,%rax,1)"); 13948c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,1)"); 13958c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%rax,%rcx,8)"); 13968c2ecf20Sopenharmony_ci 13978c2ecf20Sopenharmony_ci /* bndmov bnd2, bnd1 */ 13988c2ecf20Sopenharmony_ci 13998c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, %bnd1"); 14008c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd1, %bnd0"); 14018c2ecf20Sopenharmony_ci 14028c2ecf20Sopenharmony_ci /* bndldx mib, bnd */ 14038c2ecf20Sopenharmony_ci 14048c2ecf20Sopenharmony_ci asm volatile("bndldx (%rax), %bnd0"); 14058c2ecf20Sopenharmony_ci asm volatile("bndldx (%r8), %bnd0"); 14068c2ecf20Sopenharmony_ci asm volatile("bndldx (0x12345678), %bnd0"); 
14078c2ecf20Sopenharmony_ci asm volatile("bndldx (%rax), %bnd3"); 14088c2ecf20Sopenharmony_ci asm volatile("bndldx (%rcx,%rax,1), %bnd0"); 14098c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(,%rax,1), %bnd0"); 14108c2ecf20Sopenharmony_ci asm volatile("bndldx (%rax,%rcx,1), %bnd0"); 14118c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%rax), %bnd0"); 14128c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%rbp), %bnd0"); 14138c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%rcx,%rax,1), %bnd0"); 14148c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%rbp,%rax,1), %bnd0"); 14158c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%rax,%rcx,1), %bnd0"); 14168c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%rax), %bnd0"); 14178c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%rbp), %bnd0"); 14188c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%rcx,%rax,1), %bnd0"); 14198c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%rbp,%rax,1), %bnd0"); 14208c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%rax,%rcx,1), %bnd0"); 14218c2ecf20Sopenharmony_ci 14228c2ecf20Sopenharmony_ci /* bndstx bnd, mib */ 14238c2ecf20Sopenharmony_ci 14248c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%rax)"); 14258c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%r8)"); 14268c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (0x12345678)"); 14278c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd3, (%rax)"); 14288c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%rcx,%rax,1)"); 14298c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(,%rax,1)"); 14308c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%rax,%rcx,1)"); 14318c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%rax)"); 14328c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%rbp)"); 14338c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%rcx,%rax,1)"); 14348c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%rbp,%rax,1)"); 14358c2ecf20Sopenharmony_ci asm 
volatile("bndstx %bnd0, 0x12(%rax,%rcx,1)"); 14368c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%rax)"); 14378c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%rbp)"); 14388c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%rcx,%rax,1)"); 14398c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%rbp,%rax,1)"); 14408c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%rax,%rcx,1)"); 14418c2ecf20Sopenharmony_ci 14428c2ecf20Sopenharmony_ci /* bnd prefix on call, ret, jmp and all jcc */ 14438c2ecf20Sopenharmony_ci 14448c2ecf20Sopenharmony_ci asm volatile("bnd call label1"); /* Expecting: call unconditional 0 */ 14458c2ecf20Sopenharmony_ci asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 14468c2ecf20Sopenharmony_ci asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 14478c2ecf20Sopenharmony_ci asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 14488c2ecf20Sopenharmony_ci asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0 */ 14498c2ecf20Sopenharmony_ci asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 14508c2ecf20Sopenharmony_ci asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0 */ 14518c2ecf20Sopenharmony_ci 14528c2ecf20Sopenharmony_ci /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 14538c2ecf20Sopenharmony_ci 14548c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 14558c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 14568c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, %xmm8, %xmm0"); 14578c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, %xmm7, %xmm8"); 14588c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, %xmm15, %xmm8"); 14598c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%rax), %xmm0"); 14608c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%r8), %xmm0"); 14618c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 14628c2ecf20Sopenharmony_ci asm 
volatile("sha1rnds4 $0x91, (%rax), %xmm3"); 14638c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%rcx,%rax,1), %xmm0"); 14648c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(,%rax,1), %xmm0"); 14658c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%rax,%rcx,1), %xmm0"); 14668c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%rax,%rcx,8), %xmm0"); 14678c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%rax), %xmm0"); 14688c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%rbp), %xmm0"); 14698c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%rcx,%rax,1), %xmm0"); 14708c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%rbp,%rax,1), %xmm0"); 14718c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,1), %xmm0"); 14728c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%rax,%rcx,8), %xmm0"); 14738c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rax), %xmm0"); 14748c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp), %xmm0"); 14758c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rcx,%rax,1), %xmm0"); 14768c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rbp,%rax,1), %xmm0"); 14778c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,1), %xmm0"); 14788c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm0"); 14798c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%rax,%rcx,8), %xmm15"); 14808c2ecf20Sopenharmony_ci 14818c2ecf20Sopenharmony_ci /* sha1nexte xmm2/m128, xmm1 */ 14828c2ecf20Sopenharmony_ci 14838c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm1, %xmm0"); 14848c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm7, %xmm2"); 14858c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm8, %xmm0"); 14868c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm7, %xmm8"); 14878c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm15, %xmm8"); 
14888c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%rax), %xmm0"); 14898c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%r8), %xmm0"); 14908c2ecf20Sopenharmony_ci asm volatile("sha1nexte (0x12345678), %xmm0"); 14918c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%rax), %xmm3"); 14928c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%rcx,%rax,1), %xmm0"); 14938c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(,%rax,1), %xmm0"); 14948c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%rax,%rcx,1), %xmm0"); 14958c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%rax,%rcx,8), %xmm0"); 14968c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%rax), %xmm0"); 14978c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%rbp), %xmm0"); 14988c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%rcx,%rax,1), %xmm0"); 14998c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%rbp,%rax,1), %xmm0"); 15008c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%rax,%rcx,1), %xmm0"); 15018c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%rax,%rcx,8), %xmm0"); 15028c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rax), %xmm0"); 15038c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rbp), %xmm0"); 15048c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rcx,%rax,1), %xmm0"); 15058c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rbp,%rax,1), %xmm0"); 15068c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rax,%rcx,1), %xmm0"); 15078c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm0"); 15088c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%rax,%rcx,8), %xmm15"); 15098c2ecf20Sopenharmony_ci 15108c2ecf20Sopenharmony_ci /* sha1msg1 xmm2/m128, xmm1 */ 15118c2ecf20Sopenharmony_ci 15128c2ecf20Sopenharmony_ci asm volatile("sha1msg1 %xmm1, %xmm0"); 15138c2ecf20Sopenharmony_ci asm volatile("sha1msg1 %xmm7, %xmm2"); 15148c2ecf20Sopenharmony_ci asm volatile("sha1msg1 %xmm8, %xmm0"); 15158c2ecf20Sopenharmony_ci asm 
volatile("sha1msg1 %xmm7, %xmm8"); 15168c2ecf20Sopenharmony_ci asm volatile("sha1msg1 %xmm15, %xmm8"); 15178c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%rax), %xmm0"); 15188c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%r8), %xmm0"); 15198c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (0x12345678), %xmm0"); 15208c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%rax), %xmm3"); 15218c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%rcx,%rax,1), %xmm0"); 15228c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(,%rax,1), %xmm0"); 15238c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%rax,%rcx,1), %xmm0"); 15248c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%rax,%rcx,8), %xmm0"); 15258c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%rax), %xmm0"); 15268c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%rbp), %xmm0"); 15278c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%rcx,%rax,1), %xmm0"); 15288c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%rbp,%rax,1), %xmm0"); 15298c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%rax,%rcx,1), %xmm0"); 15308c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%rax,%rcx,8), %xmm0"); 15318c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rax), %xmm0"); 15328c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rbp), %xmm0"); 15338c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rcx,%rax,1), %xmm0"); 15348c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rbp,%rax,1), %xmm0"); 15358c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rax,%rcx,1), %xmm0"); 15368c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm0"); 15378c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%rax,%rcx,8), %xmm15"); 15388c2ecf20Sopenharmony_ci 15398c2ecf20Sopenharmony_ci /* sha1msg2 xmm2/m128, xmm1 */ 15408c2ecf20Sopenharmony_ci 15418c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm1, %xmm0"); 15428c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm7, %xmm2"); 
15438c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm8, %xmm0"); 15448c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm7, %xmm8"); 15458c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm15, %xmm8"); 15468c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%rax), %xmm0"); 15478c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%r8), %xmm0"); 15488c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (0x12345678), %xmm0"); 15498c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%rax), %xmm3"); 15508c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%rcx,%rax,1), %xmm0"); 15518c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(,%rax,1), %xmm0"); 15528c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%rax,%rcx,1), %xmm0"); 15538c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%rax,%rcx,8), %xmm0"); 15548c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%rax), %xmm0"); 15558c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%rbp), %xmm0"); 15568c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%rcx,%rax,1), %xmm0"); 15578c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%rbp,%rax,1), %xmm0"); 15588c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%rax,%rcx,1), %xmm0"); 15598c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%rax,%rcx,8), %xmm0"); 15608c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rax), %xmm0"); 15618c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rbp), %xmm0"); 15628c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rcx,%rax,1), %xmm0"); 15638c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rbp,%rax,1), %xmm0"); 15648c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rax,%rcx,1), %xmm0"); 15658c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm0"); 15668c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%rax,%rcx,8), %xmm15"); 15678c2ecf20Sopenharmony_ci 15688c2ecf20Sopenharmony_ci /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 15698c2ecf20Sopenharmony_ci /* Note sha256rnds2 has an implicit operand 
'xmm0' */ 15708c2ecf20Sopenharmony_ci 15718c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm4, %xmm1"); 15728c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm7, %xmm2"); 15738c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm8, %xmm1"); 15748c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm7, %xmm8"); 15758c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm15, %xmm8"); 15768c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%rax), %xmm1"); 15778c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%r8), %xmm1"); 15788c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (0x12345678), %xmm1"); 15798c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%rax), %xmm3"); 15808c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%rcx,%rax,1), %xmm1"); 15818c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(,%rax,1), %xmm1"); 15828c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%rax,%rcx,1), %xmm1"); 15838c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%rax,%rcx,8), %xmm1"); 15848c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%rax), %xmm1"); 15858c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%rbp), %xmm1"); 15868c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%rcx,%rax,1), %xmm1"); 15878c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%rbp,%rax,1), %xmm1"); 15888c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%rax,%rcx,1), %xmm1"); 15898c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%rax,%rcx,8), %xmm1"); 15908c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rax), %xmm1"); 15918c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rbp), %xmm1"); 15928c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rcx,%rax,1), %xmm1"); 15938c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rbp,%rax,1), %xmm1"); 15948c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rax,%rcx,1), %xmm1"); 15958c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm1"); 
15968c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%rax,%rcx,8), %xmm15"); 15978c2ecf20Sopenharmony_ci 15988c2ecf20Sopenharmony_ci /* sha256msg1 xmm2/m128, xmm1 */ 15998c2ecf20Sopenharmony_ci 16008c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm1, %xmm0"); 16018c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm7, %xmm2"); 16028c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm8, %xmm0"); 16038c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm7, %xmm8"); 16048c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm15, %xmm8"); 16058c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%rax), %xmm0"); 16068c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%r8), %xmm0"); 16078c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (0x12345678), %xmm0"); 16088c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%rax), %xmm3"); 16098c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%rcx,%rax,1), %xmm0"); 16108c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(,%rax,1), %xmm0"); 16118c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%rax,%rcx,1), %xmm0"); 16128c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%rax,%rcx,8), %xmm0"); 16138c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%rax), %xmm0"); 16148c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%rbp), %xmm0"); 16158c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%rcx,%rax,1), %xmm0"); 16168c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%rbp,%rax,1), %xmm0"); 16178c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%rax,%rcx,1), %xmm0"); 16188c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%rax,%rcx,8), %xmm0"); 16198c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%rax), %xmm0"); 16208c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%rbp), %xmm0"); 16218c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%rcx,%rax,1), %xmm0"); 16228c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%rbp,%rax,1), %xmm0"); 16238c2ecf20Sopenharmony_ci asm 
volatile("sha256msg1 0x12345678(%rax,%rcx,1), %xmm0"); 16248c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm0"); 16258c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%rax,%rcx,8), %xmm15"); 16268c2ecf20Sopenharmony_ci 16278c2ecf20Sopenharmony_ci /* sha256msg2 xmm2/m128, xmm1 */ 16288c2ecf20Sopenharmony_ci 16298c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm1, %xmm0"); 16308c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm7, %xmm2"); 16318c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm8, %xmm0"); 16328c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm7, %xmm8"); 16338c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm15, %xmm8"); 16348c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%rax), %xmm0"); 16358c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%r8), %xmm0"); 16368c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (0x12345678), %xmm0"); 16378c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%rax), %xmm3"); 16388c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%rcx,%rax,1), %xmm0"); 16398c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(,%rax,1), %xmm0"); 16408c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%rax,%rcx,1), %xmm0"); 16418c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%rax,%rcx,8), %xmm0"); 16428c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%rax), %xmm0"); 16438c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%rbp), %xmm0"); 16448c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%rcx,%rax,1), %xmm0"); 16458c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%rbp,%rax,1), %xmm0"); 16468c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%rax,%rcx,1), %xmm0"); 16478c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%rax,%rcx,8), %xmm0"); 16488c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%rax), %xmm0"); 16498c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%rbp), %xmm0"); 16508c2ecf20Sopenharmony_ci asm volatile("sha256msg2 
0x12345678(%rcx,%rax,1), %xmm0"); 16518c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%rbp,%rax,1), %xmm0"); 16528c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%rax,%rcx,1), %xmm0"); 16538c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm0"); 16548c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%rax,%rcx,8), %xmm15"); 16558c2ecf20Sopenharmony_ci 16568c2ecf20Sopenharmony_ci /* clflushopt m8 */ 16578c2ecf20Sopenharmony_ci 16588c2ecf20Sopenharmony_ci asm volatile("clflushopt (%rax)"); 16598c2ecf20Sopenharmony_ci asm volatile("clflushopt (%r8)"); 16608c2ecf20Sopenharmony_ci asm volatile("clflushopt (0x12345678)"); 16618c2ecf20Sopenharmony_ci asm volatile("clflushopt 0x12345678(%rax,%rcx,8)"); 16628c2ecf20Sopenharmony_ci asm volatile("clflushopt 0x12345678(%r8,%rcx,8)"); 16638c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as clflushopt */ 16648c2ecf20Sopenharmony_ci asm volatile("clflush (%rax)"); 16658c2ecf20Sopenharmony_ci asm volatile("clflush (%r8)"); 16668c2ecf20Sopenharmony_ci asm volatile("sfence"); 16678c2ecf20Sopenharmony_ci 16688c2ecf20Sopenharmony_ci /* clwb m8 */ 16698c2ecf20Sopenharmony_ci 16708c2ecf20Sopenharmony_ci asm volatile("clwb (%rax)"); 16718c2ecf20Sopenharmony_ci asm volatile("clwb (%r8)"); 16728c2ecf20Sopenharmony_ci asm volatile("clwb (0x12345678)"); 16738c2ecf20Sopenharmony_ci asm volatile("clwb 0x12345678(%rax,%rcx,8)"); 16748c2ecf20Sopenharmony_ci asm volatile("clwb 0x12345678(%r8,%rcx,8)"); 16758c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as clwb */ 16768c2ecf20Sopenharmony_ci asm volatile("xsaveopt (%rax)"); 16778c2ecf20Sopenharmony_ci asm volatile("xsaveopt (%r8)"); 16788c2ecf20Sopenharmony_ci asm volatile("mfence"); 16798c2ecf20Sopenharmony_ci 16808c2ecf20Sopenharmony_ci /* cldemote m8 */ 16818c2ecf20Sopenharmony_ci 16828c2ecf20Sopenharmony_ci asm volatile("cldemote (%rax)"); 16838c2ecf20Sopenharmony_ci asm 
volatile("cldemote (%r8)"); 16848c2ecf20Sopenharmony_ci asm volatile("cldemote (0x12345678)"); 16858c2ecf20Sopenharmony_ci asm volatile("cldemote 0x12345678(%rax,%rcx,8)"); 16868c2ecf20Sopenharmony_ci asm volatile("cldemote 0x12345678(%r8,%rcx,8)"); 16878c2ecf20Sopenharmony_ci 16888c2ecf20Sopenharmony_ci /* xsavec mem */ 16898c2ecf20Sopenharmony_ci 16908c2ecf20Sopenharmony_ci asm volatile("xsavec (%rax)"); 16918c2ecf20Sopenharmony_ci asm volatile("xsavec (%r8)"); 16928c2ecf20Sopenharmony_ci asm volatile("xsavec (0x12345678)"); 16938c2ecf20Sopenharmony_ci asm volatile("xsavec 0x12345678(%rax,%rcx,8)"); 16948c2ecf20Sopenharmony_ci asm volatile("xsavec 0x12345678(%r8,%rcx,8)"); 16958c2ecf20Sopenharmony_ci 16968c2ecf20Sopenharmony_ci /* xsaves mem */ 16978c2ecf20Sopenharmony_ci 16988c2ecf20Sopenharmony_ci asm volatile("xsaves (%rax)"); 16998c2ecf20Sopenharmony_ci asm volatile("xsaves (%r8)"); 17008c2ecf20Sopenharmony_ci asm volatile("xsaves (0x12345678)"); 17018c2ecf20Sopenharmony_ci asm volatile("xsaves 0x12345678(%rax,%rcx,8)"); 17028c2ecf20Sopenharmony_ci asm volatile("xsaves 0x12345678(%r8,%rcx,8)"); 17038c2ecf20Sopenharmony_ci 17048c2ecf20Sopenharmony_ci /* xrstors mem */ 17058c2ecf20Sopenharmony_ci 17068c2ecf20Sopenharmony_ci asm volatile("xrstors (%rax)"); 17078c2ecf20Sopenharmony_ci asm volatile("xrstors (%r8)"); 17088c2ecf20Sopenharmony_ci asm volatile("xrstors (0x12345678)"); 17098c2ecf20Sopenharmony_ci asm volatile("xrstors 0x12345678(%rax,%rcx,8)"); 17108c2ecf20Sopenharmony_ci asm volatile("xrstors 0x12345678(%r8,%rcx,8)"); 17118c2ecf20Sopenharmony_ci 17128c2ecf20Sopenharmony_ci /* ptwrite */ 17138c2ecf20Sopenharmony_ci 17148c2ecf20Sopenharmony_ci asm volatile("ptwrite (%rax)"); 17158c2ecf20Sopenharmony_ci asm volatile("ptwrite (%r8)"); 17168c2ecf20Sopenharmony_ci asm volatile("ptwrite (0x12345678)"); 17178c2ecf20Sopenharmony_ci asm volatile("ptwrite 0x12345678(%rax,%rcx,8)"); 17188c2ecf20Sopenharmony_ci asm volatile("ptwrite 0x12345678(%r8,%rcx,8)"); 
17198c2ecf20Sopenharmony_ci 17208c2ecf20Sopenharmony_ci asm volatile("ptwritel (%rax)"); 17218c2ecf20Sopenharmony_ci asm volatile("ptwritel (%r8)"); 17228c2ecf20Sopenharmony_ci asm volatile("ptwritel (0x12345678)"); 17238c2ecf20Sopenharmony_ci asm volatile("ptwritel 0x12345678(%rax,%rcx,8)"); 17248c2ecf20Sopenharmony_ci asm volatile("ptwritel 0x12345678(%r8,%rcx,8)"); 17258c2ecf20Sopenharmony_ci 17268c2ecf20Sopenharmony_ci asm volatile("ptwriteq (%rax)"); 17278c2ecf20Sopenharmony_ci asm volatile("ptwriteq (%r8)"); 17288c2ecf20Sopenharmony_ci asm volatile("ptwriteq (0x12345678)"); 17298c2ecf20Sopenharmony_ci asm volatile("ptwriteq 0x12345678(%rax,%rcx,8)"); 17308c2ecf20Sopenharmony_ci asm volatile("ptwriteq 0x12345678(%r8,%rcx,8)"); 17318c2ecf20Sopenharmony_ci 17328c2ecf20Sopenharmony_ci /* tpause */ 17338c2ecf20Sopenharmony_ci 17348c2ecf20Sopenharmony_ci asm volatile("tpause %ebx"); 17358c2ecf20Sopenharmony_ci asm volatile("tpause %r8d"); 17368c2ecf20Sopenharmony_ci 17378c2ecf20Sopenharmony_ci /* umonitor */ 17388c2ecf20Sopenharmony_ci 17398c2ecf20Sopenharmony_ci asm volatile("umonitor %eax"); 17408c2ecf20Sopenharmony_ci asm volatile("umonitor %rax"); 17418c2ecf20Sopenharmony_ci asm volatile("umonitor %r8d"); 17428c2ecf20Sopenharmony_ci 17438c2ecf20Sopenharmony_ci /* umwait */ 17448c2ecf20Sopenharmony_ci 17458c2ecf20Sopenharmony_ci asm volatile("umwait %eax"); 17468c2ecf20Sopenharmony_ci asm volatile("umwait %r8d"); 17478c2ecf20Sopenharmony_ci 17488c2ecf20Sopenharmony_ci /* movdiri */ 17498c2ecf20Sopenharmony_ci 17508c2ecf20Sopenharmony_ci asm volatile("movdiri %rax,(%rbx)"); 17518c2ecf20Sopenharmony_ci asm volatile("movdiri %rcx,0x12345678(%rax)"); 17528c2ecf20Sopenharmony_ci 17538c2ecf20Sopenharmony_ci /* movdir64b */ 17548c2ecf20Sopenharmony_ci 17558c2ecf20Sopenharmony_ci asm volatile("movdir64b (%rax),%rbx"); 17568c2ecf20Sopenharmony_ci asm volatile("movdir64b 0x12345678(%rax),%rcx"); 17578c2ecf20Sopenharmony_ci asm volatile("movdir64b (%eax),%ebx"); 
17588c2ecf20Sopenharmony_ci asm volatile("movdir64b 0x12345678(%eax),%ecx"); 17598c2ecf20Sopenharmony_ci 17608c2ecf20Sopenharmony_ci /* enqcmd */ 17618c2ecf20Sopenharmony_ci 17628c2ecf20Sopenharmony_ci asm volatile("enqcmd (%rax),%rbx"); 17638c2ecf20Sopenharmony_ci asm volatile("enqcmd 0x12345678(%rax),%rcx"); 17648c2ecf20Sopenharmony_ci asm volatile("enqcmd (%eax),%ebx"); 17658c2ecf20Sopenharmony_ci asm volatile("enqcmd 0x12345678(%eax),%ecx"); 17668c2ecf20Sopenharmony_ci 17678c2ecf20Sopenharmony_ci /* enqcmds */ 17688c2ecf20Sopenharmony_ci 17698c2ecf20Sopenharmony_ci asm volatile("enqcmds (%rax),%rbx"); 17708c2ecf20Sopenharmony_ci asm volatile("enqcmds 0x12345678(%rax),%rcx"); 17718c2ecf20Sopenharmony_ci asm volatile("enqcmds (%eax),%ebx"); 17728c2ecf20Sopenharmony_ci asm volatile("enqcmds 0x12345678(%eax),%ecx"); 17738c2ecf20Sopenharmony_ci 17748c2ecf20Sopenharmony_ci /* incsspd/q */ 17758c2ecf20Sopenharmony_ci 17768c2ecf20Sopenharmony_ci asm volatile("incsspd %eax"); 17778c2ecf20Sopenharmony_ci asm volatile("incsspd %r8d"); 17788c2ecf20Sopenharmony_ci asm volatile("incsspq %rax"); 17798c2ecf20Sopenharmony_ci asm volatile("incsspq %r8"); 17808c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as incsspd/q */ 17818c2ecf20Sopenharmony_ci asm volatile("xrstor (%rax)"); 17828c2ecf20Sopenharmony_ci asm volatile("xrstor (%r8)"); 17838c2ecf20Sopenharmony_ci asm volatile("xrstor (0x12345678)"); 17848c2ecf20Sopenharmony_ci asm volatile("xrstor 0x12345678(%rax,%rcx,8)"); 17858c2ecf20Sopenharmony_ci asm volatile("xrstor 0x12345678(%r8,%rcx,8)"); 17868c2ecf20Sopenharmony_ci asm volatile("lfence"); 17878c2ecf20Sopenharmony_ci 17888c2ecf20Sopenharmony_ci /* rdsspd/q */ 17898c2ecf20Sopenharmony_ci 17908c2ecf20Sopenharmony_ci asm volatile("rdsspd %eax"); 17918c2ecf20Sopenharmony_ci asm volatile("rdsspd %r8d"); 17928c2ecf20Sopenharmony_ci asm volatile("rdsspq %rax"); 17938c2ecf20Sopenharmony_ci asm volatile("rdsspq %r8"); 17948c2ecf20Sopenharmony_ci 
17958c2ecf20Sopenharmony_ci /* saveprevssp */ 17968c2ecf20Sopenharmony_ci 17978c2ecf20Sopenharmony_ci asm volatile("saveprevssp"); 17988c2ecf20Sopenharmony_ci 17998c2ecf20Sopenharmony_ci /* rstorssp */ 18008c2ecf20Sopenharmony_ci 18018c2ecf20Sopenharmony_ci asm volatile("rstorssp (%rax)"); 18028c2ecf20Sopenharmony_ci asm volatile("rstorssp (%r8)"); 18038c2ecf20Sopenharmony_ci asm volatile("rstorssp (0x12345678)"); 18048c2ecf20Sopenharmony_ci asm volatile("rstorssp 0x12345678(%rax,%rcx,8)"); 18058c2ecf20Sopenharmony_ci asm volatile("rstorssp 0x12345678(%r8,%rcx,8)"); 18068c2ecf20Sopenharmony_ci 18078c2ecf20Sopenharmony_ci /* wrssd/q */ 18088c2ecf20Sopenharmony_ci 18098c2ecf20Sopenharmony_ci asm volatile("wrssd %ecx,(%rax)"); 18108c2ecf20Sopenharmony_ci asm volatile("wrssd %edx,(%r8)"); 18118c2ecf20Sopenharmony_ci asm volatile("wrssd %edx,(0x12345678)"); 18128c2ecf20Sopenharmony_ci asm volatile("wrssd %edx,0x12345678(%rax,%rcx,8)"); 18138c2ecf20Sopenharmony_ci asm volatile("wrssd %edx,0x12345678(%r8,%rcx,8)"); 18148c2ecf20Sopenharmony_ci asm volatile("wrssq %rcx,(%rax)"); 18158c2ecf20Sopenharmony_ci asm volatile("wrssq %rdx,(%r8)"); 18168c2ecf20Sopenharmony_ci asm volatile("wrssq %rdx,(0x12345678)"); 18178c2ecf20Sopenharmony_ci asm volatile("wrssq %rdx,0x12345678(%rax,%rcx,8)"); 18188c2ecf20Sopenharmony_ci asm volatile("wrssq %rdx,0x12345678(%r8,%rcx,8)"); 18198c2ecf20Sopenharmony_ci 18208c2ecf20Sopenharmony_ci /* wrussd/q */ 18218c2ecf20Sopenharmony_ci 18228c2ecf20Sopenharmony_ci asm volatile("wrussd %ecx,(%rax)"); 18238c2ecf20Sopenharmony_ci asm volatile("wrussd %edx,(%r8)"); 18248c2ecf20Sopenharmony_ci asm volatile("wrussd %edx,(0x12345678)"); 18258c2ecf20Sopenharmony_ci asm volatile("wrussd %edx,0x12345678(%rax,%rcx,8)"); 18268c2ecf20Sopenharmony_ci asm volatile("wrussd %edx,0x12345678(%r8,%rcx,8)"); 18278c2ecf20Sopenharmony_ci asm volatile("wrussq %rcx,(%rax)"); 18288c2ecf20Sopenharmony_ci asm volatile("wrussq %rdx,(%r8)"); 18298c2ecf20Sopenharmony_ci asm 
volatile("wrussq %rdx,(0x12345678)"); 18308c2ecf20Sopenharmony_ci asm volatile("wrussq %rdx,0x12345678(%rax,%rcx,8)"); 18318c2ecf20Sopenharmony_ci asm volatile("wrussq %rdx,0x12345678(%r8,%rcx,8)"); 18328c2ecf20Sopenharmony_ci 18338c2ecf20Sopenharmony_ci /* setssbsy */ 18348c2ecf20Sopenharmony_ci 18358c2ecf20Sopenharmony_ci asm volatile("setssbsy"); 18368c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as setssbsy */ 18378c2ecf20Sopenharmony_ci asm volatile("rdpkru"); 18388c2ecf20Sopenharmony_ci asm volatile("wrpkru"); 18398c2ecf20Sopenharmony_ci 18408c2ecf20Sopenharmony_ci /* clrssbsy */ 18418c2ecf20Sopenharmony_ci 18428c2ecf20Sopenharmony_ci asm volatile("clrssbsy (%rax)"); 18438c2ecf20Sopenharmony_ci asm volatile("clrssbsy (%r8)"); 18448c2ecf20Sopenharmony_ci asm volatile("clrssbsy (0x12345678)"); 18458c2ecf20Sopenharmony_ci asm volatile("clrssbsy 0x12345678(%rax,%rcx,8)"); 18468c2ecf20Sopenharmony_ci asm volatile("clrssbsy 0x12345678(%r8,%rcx,8)"); 18478c2ecf20Sopenharmony_ci 18488c2ecf20Sopenharmony_ci /* endbr32/64 */ 18498c2ecf20Sopenharmony_ci 18508c2ecf20Sopenharmony_ci asm volatile("endbr32"); 18518c2ecf20Sopenharmony_ci asm volatile("endbr64"); 18528c2ecf20Sopenharmony_ci 18538c2ecf20Sopenharmony_ci /* call with/without notrack prefix */ 18548c2ecf20Sopenharmony_ci 18558c2ecf20Sopenharmony_ci asm volatile("callq *%rax"); /* Expecting: call indirect 0 */ 18568c2ecf20Sopenharmony_ci asm volatile("callq *(%rax)"); /* Expecting: call indirect 0 */ 18578c2ecf20Sopenharmony_ci asm volatile("callq *(%r8)"); /* Expecting: call indirect 0 */ 18588c2ecf20Sopenharmony_ci asm volatile("callq *(0x12345678)"); /* Expecting: call indirect 0 */ 18598c2ecf20Sopenharmony_ci asm volatile("callq *0x12345678(%rax,%rcx,8)"); /* Expecting: call indirect 0 */ 18608c2ecf20Sopenharmony_ci asm volatile("callq *0x12345678(%r8,%rcx,8)"); /* Expecting: call indirect 0 */ 18618c2ecf20Sopenharmony_ci 18628c2ecf20Sopenharmony_ci asm volatile("bnd callq 
*%rax"); /* Expecting: call indirect 0 */ 18638c2ecf20Sopenharmony_ci asm volatile("bnd callq *(%rax)"); /* Expecting: call indirect 0 */ 18648c2ecf20Sopenharmony_ci asm volatile("bnd callq *(%r8)"); /* Expecting: call indirect 0 */ 18658c2ecf20Sopenharmony_ci asm volatile("bnd callq *(0x12345678)"); /* Expecting: call indirect 0 */ 18668c2ecf20Sopenharmony_ci asm volatile("bnd callq *0x12345678(%rax,%rcx,8)"); /* Expecting: call indirect 0 */ 18678c2ecf20Sopenharmony_ci asm volatile("bnd callq *0x12345678(%r8,%rcx,8)"); /* Expecting: call indirect 0 */ 18688c2ecf20Sopenharmony_ci 18698c2ecf20Sopenharmony_ci asm volatile("notrack callq *%rax"); /* Expecting: call indirect 0 */ 18708c2ecf20Sopenharmony_ci asm volatile("notrack callq *(%rax)"); /* Expecting: call indirect 0 */ 18718c2ecf20Sopenharmony_ci asm volatile("notrack callq *(%r8)"); /* Expecting: call indirect 0 */ 18728c2ecf20Sopenharmony_ci asm volatile("notrack callq *(0x12345678)"); /* Expecting: call indirect 0 */ 18738c2ecf20Sopenharmony_ci asm volatile("notrack callq *0x12345678(%rax,%rcx,8)"); /* Expecting: call indirect 0 */ 18748c2ecf20Sopenharmony_ci asm volatile("notrack callq *0x12345678(%r8,%rcx,8)"); /* Expecting: call indirect 0 */ 18758c2ecf20Sopenharmony_ci 18768c2ecf20Sopenharmony_ci asm volatile("notrack bnd callq *%rax"); /* Expecting: call indirect 0 */ 18778c2ecf20Sopenharmony_ci asm volatile("notrack bnd callq *(%rax)"); /* Expecting: call indirect 0 */ 18788c2ecf20Sopenharmony_ci asm volatile("notrack bnd callq *(%r8)"); /* Expecting: call indirect 0 */ 18798c2ecf20Sopenharmony_ci asm volatile("notrack bnd callq *(0x12345678)"); /* Expecting: call indirect 0 */ 18808c2ecf20Sopenharmony_ci asm volatile("notrack bnd callq *0x12345678(%rax,%rcx,8)"); /* Expecting: call indirect 0 */ 18818c2ecf20Sopenharmony_ci asm volatile("notrack bnd callq *0x12345678(%r8,%rcx,8)"); /* Expecting: call indirect 0 */ 18828c2ecf20Sopenharmony_ci 18838c2ecf20Sopenharmony_ci /* jmp with/without notrack 
prefix */ 18848c2ecf20Sopenharmony_ci 18858c2ecf20Sopenharmony_ci asm volatile("jmpq *%rax"); /* Expecting: jmp indirect 0 */ 18868c2ecf20Sopenharmony_ci asm volatile("jmpq *(%rax)"); /* Expecting: jmp indirect 0 */ 18878c2ecf20Sopenharmony_ci asm volatile("jmpq *(%r8)"); /* Expecting: jmp indirect 0 */ 18888c2ecf20Sopenharmony_ci asm volatile("jmpq *(0x12345678)"); /* Expecting: jmp indirect 0 */ 18898c2ecf20Sopenharmony_ci asm volatile("jmpq *0x12345678(%rax,%rcx,8)"); /* Expecting: jmp indirect 0 */ 18908c2ecf20Sopenharmony_ci asm volatile("jmpq *0x12345678(%r8,%rcx,8)"); /* Expecting: jmp indirect 0 */ 18918c2ecf20Sopenharmony_ci 18928c2ecf20Sopenharmony_ci asm volatile("bnd jmpq *%rax"); /* Expecting: jmp indirect 0 */ 18938c2ecf20Sopenharmony_ci asm volatile("bnd jmpq *(%rax)"); /* Expecting: jmp indirect 0 */ 18948c2ecf20Sopenharmony_ci asm volatile("bnd jmpq *(%r8)"); /* Expecting: jmp indirect 0 */ 18958c2ecf20Sopenharmony_ci asm volatile("bnd jmpq *(0x12345678)"); /* Expecting: jmp indirect 0 */ 18968c2ecf20Sopenharmony_ci asm volatile("bnd jmpq *0x12345678(%rax,%rcx,8)"); /* Expecting: jmp indirect 0 */ 18978c2ecf20Sopenharmony_ci asm volatile("bnd jmpq *0x12345678(%r8,%rcx,8)"); /* Expecting: jmp indirect 0 */ 18988c2ecf20Sopenharmony_ci 18998c2ecf20Sopenharmony_ci asm volatile("notrack jmpq *%rax"); /* Expecting: jmp indirect 0 */ 19008c2ecf20Sopenharmony_ci asm volatile("notrack jmpq *(%rax)"); /* Expecting: jmp indirect 0 */ 19018c2ecf20Sopenharmony_ci asm volatile("notrack jmpq *(%r8)"); /* Expecting: jmp indirect 0 */ 19028c2ecf20Sopenharmony_ci asm volatile("notrack jmpq *(0x12345678)"); /* Expecting: jmp indirect 0 */ 19038c2ecf20Sopenharmony_ci asm volatile("notrack jmpq *0x12345678(%rax,%rcx,8)"); /* Expecting: jmp indirect 0 */ 19048c2ecf20Sopenharmony_ci asm volatile("notrack jmpq *0x12345678(%r8,%rcx,8)"); /* Expecting: jmp indirect 0 */ 19058c2ecf20Sopenharmony_ci 19068c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmpq *%rax"); /* 
Expecting: jmp indirect 0 */ 19078c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmpq *(%rax)"); /* Expecting: jmp indirect 0 */ 19088c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmpq *(%r8)"); /* Expecting: jmp indirect 0 */ 19098c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmpq *(0x12345678)"); /* Expecting: jmp indirect 0 */ 19108c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmpq *0x12345678(%rax,%rcx,8)"); /* Expecting: jmp indirect 0 */ 19118c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmpq *0x12345678(%r8,%rcx,8)"); /* Expecting: jmp indirect 0 */ 19128c2ecf20Sopenharmony_ci 19138c2ecf20Sopenharmony_ci#else /* #ifdef __x86_64__ */ 19148c2ecf20Sopenharmony_ci 19158c2ecf20Sopenharmony_ci /* bound r32, mem (same op code as EVEX prefix) */ 19168c2ecf20Sopenharmony_ci 19178c2ecf20Sopenharmony_ci asm volatile("bound %eax, 0x12345678(%ecx)"); 19188c2ecf20Sopenharmony_ci asm volatile("bound %ecx, 0x12345678(%eax)"); 19198c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%eax)"); 19208c2ecf20Sopenharmony_ci asm volatile("bound %ebx, 0x12345678(%eax)"); 19218c2ecf20Sopenharmony_ci asm volatile("bound %esp, 0x12345678(%eax)"); 19228c2ecf20Sopenharmony_ci asm volatile("bound %ebp, 0x12345678(%eax)"); 19238c2ecf20Sopenharmony_ci asm volatile("bound %esi, 0x12345678(%eax)"); 19248c2ecf20Sopenharmony_ci asm volatile("bound %edi, 0x12345678(%eax)"); 19258c2ecf20Sopenharmony_ci asm volatile("bound %ecx, (%eax)"); 19268c2ecf20Sopenharmony_ci asm volatile("bound %eax, (0x12345678)"); 19278c2ecf20Sopenharmony_ci asm volatile("bound %edx, (%ecx,%eax,1)"); 19288c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(,%eax,1)"); 19298c2ecf20Sopenharmony_ci asm volatile("bound %edx, (%eax,%ecx,1)"); 19308c2ecf20Sopenharmony_ci asm volatile("bound %edx, (%eax,%ecx,8)"); 19318c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12(%eax)"); 19328c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12(%ebp)"); 19338c2ecf20Sopenharmony_ci asm volatile("bound 
%edx, 0x12(%ecx,%eax,1)"); 19348c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12(%ebp,%eax,1)"); 19358c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12(%eax,%ecx,1)"); 19368c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12(%eax,%ecx,8)"); 19378c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%eax)"); 19388c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%ebp)"); 19398c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%ecx,%eax,1)"); 19408c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%ebp,%eax,1)"); 19418c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%eax,%ecx,1)"); 19428c2ecf20Sopenharmony_ci asm volatile("bound %edx, 0x12345678(%eax,%ecx,8)"); 19438c2ecf20Sopenharmony_ci 19448c2ecf20Sopenharmony_ci /* bound r16, mem (same op code as EVEX prefix) */ 19458c2ecf20Sopenharmony_ci 19468c2ecf20Sopenharmony_ci asm volatile("bound %ax, 0x12345678(%ecx)"); 19478c2ecf20Sopenharmony_ci asm volatile("bound %cx, 0x12345678(%eax)"); 19488c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%eax)"); 19498c2ecf20Sopenharmony_ci asm volatile("bound %bx, 0x12345678(%eax)"); 19508c2ecf20Sopenharmony_ci asm volatile("bound %sp, 0x12345678(%eax)"); 19518c2ecf20Sopenharmony_ci asm volatile("bound %bp, 0x12345678(%eax)"); 19528c2ecf20Sopenharmony_ci asm volatile("bound %si, 0x12345678(%eax)"); 19538c2ecf20Sopenharmony_ci asm volatile("bound %di, 0x12345678(%eax)"); 19548c2ecf20Sopenharmony_ci asm volatile("bound %cx, (%eax)"); 19558c2ecf20Sopenharmony_ci asm volatile("bound %ax, (0x12345678)"); 19568c2ecf20Sopenharmony_ci asm volatile("bound %dx, (%ecx,%eax,1)"); 19578c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(,%eax,1)"); 19588c2ecf20Sopenharmony_ci asm volatile("bound %dx, (%eax,%ecx,1)"); 19598c2ecf20Sopenharmony_ci asm volatile("bound %dx, (%eax,%ecx,8)"); 19608c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12(%eax)"); 19618c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12(%ebp)"); 
19628c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12(%ecx,%eax,1)"); 19638c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12(%ebp,%eax,1)"); 19648c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12(%eax,%ecx,1)"); 19658c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12(%eax,%ecx,8)"); 19668c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%eax)"); 19678c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%ebp)"); 19688c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%ecx,%eax,1)"); 19698c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%ebp,%eax,1)"); 19708c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%eax,%ecx,1)"); 19718c2ecf20Sopenharmony_ci asm volatile("bound %dx, 0x12345678(%eax,%ecx,8)"); 19728c2ecf20Sopenharmony_ci 19738c2ecf20Sopenharmony_ci /* AVX-512: Instructions with the same op codes as Mask Instructions */ 19748c2ecf20Sopenharmony_ci 19758c2ecf20Sopenharmony_ci asm volatile("cmovno %eax,%ebx"); 19768c2ecf20Sopenharmony_ci asm volatile("cmovno 0x12345678(%eax),%ecx"); 19778c2ecf20Sopenharmony_ci asm volatile("cmovno 0x12345678(%eax),%cx"); 19788c2ecf20Sopenharmony_ci 19798c2ecf20Sopenharmony_ci asm volatile("cmove %eax,%ebx"); 19808c2ecf20Sopenharmony_ci asm volatile("cmove 0x12345678(%eax),%ecx"); 19818c2ecf20Sopenharmony_ci asm volatile("cmove 0x12345678(%eax),%cx"); 19828c2ecf20Sopenharmony_ci 19838c2ecf20Sopenharmony_ci asm volatile("seto 0x12345678(%eax)"); 19848c2ecf20Sopenharmony_ci asm volatile("setno 0x12345678(%eax)"); 19858c2ecf20Sopenharmony_ci asm volatile("setb 0x12345678(%eax)"); 19868c2ecf20Sopenharmony_ci asm volatile("setc 0x12345678(%eax)"); 19878c2ecf20Sopenharmony_ci asm volatile("setnae 0x12345678(%eax)"); 19888c2ecf20Sopenharmony_ci asm volatile("setae 0x12345678(%eax)"); 19898c2ecf20Sopenharmony_ci asm volatile("setnb 0x12345678(%eax)"); 19908c2ecf20Sopenharmony_ci asm volatile("setnc 0x12345678(%eax)"); 19918c2ecf20Sopenharmony_ci asm volatile("sets 0x12345678(%eax)"); 
19928c2ecf20Sopenharmony_ci asm volatile("setns 0x12345678(%eax)"); 19938c2ecf20Sopenharmony_ci 19948c2ecf20Sopenharmony_ci /* AVX-512: Mask Instructions */ 19958c2ecf20Sopenharmony_ci 19968c2ecf20Sopenharmony_ci asm volatile("kandw %k7,%k6,%k5"); 19978c2ecf20Sopenharmony_ci asm volatile("kandq %k7,%k6,%k5"); 19988c2ecf20Sopenharmony_ci asm volatile("kandb %k7,%k6,%k5"); 19998c2ecf20Sopenharmony_ci asm volatile("kandd %k7,%k6,%k5"); 20008c2ecf20Sopenharmony_ci 20018c2ecf20Sopenharmony_ci asm volatile("kandnw %k7,%k6,%k5"); 20028c2ecf20Sopenharmony_ci asm volatile("kandnq %k7,%k6,%k5"); 20038c2ecf20Sopenharmony_ci asm volatile("kandnb %k7,%k6,%k5"); 20048c2ecf20Sopenharmony_ci asm volatile("kandnd %k7,%k6,%k5"); 20058c2ecf20Sopenharmony_ci 20068c2ecf20Sopenharmony_ci asm volatile("knotw %k7,%k6"); 20078c2ecf20Sopenharmony_ci asm volatile("knotq %k7,%k6"); 20088c2ecf20Sopenharmony_ci asm volatile("knotb %k7,%k6"); 20098c2ecf20Sopenharmony_ci asm volatile("knotd %k7,%k6"); 20108c2ecf20Sopenharmony_ci 20118c2ecf20Sopenharmony_ci asm volatile("korw %k7,%k6,%k5"); 20128c2ecf20Sopenharmony_ci asm volatile("korq %k7,%k6,%k5"); 20138c2ecf20Sopenharmony_ci asm volatile("korb %k7,%k6,%k5"); 20148c2ecf20Sopenharmony_ci asm volatile("kord %k7,%k6,%k5"); 20158c2ecf20Sopenharmony_ci 20168c2ecf20Sopenharmony_ci asm volatile("kxnorw %k7,%k6,%k5"); 20178c2ecf20Sopenharmony_ci asm volatile("kxnorq %k7,%k6,%k5"); 20188c2ecf20Sopenharmony_ci asm volatile("kxnorb %k7,%k6,%k5"); 20198c2ecf20Sopenharmony_ci asm volatile("kxnord %k7,%k6,%k5"); 20208c2ecf20Sopenharmony_ci 20218c2ecf20Sopenharmony_ci asm volatile("kxorw %k7,%k6,%k5"); 20228c2ecf20Sopenharmony_ci asm volatile("kxorq %k7,%k6,%k5"); 20238c2ecf20Sopenharmony_ci asm volatile("kxorb %k7,%k6,%k5"); 20248c2ecf20Sopenharmony_ci asm volatile("kxord %k7,%k6,%k5"); 20258c2ecf20Sopenharmony_ci 20268c2ecf20Sopenharmony_ci asm volatile("kaddw %k7,%k6,%k5"); 20278c2ecf20Sopenharmony_ci asm volatile("kaddq %k7,%k6,%k5"); 
20288c2ecf20Sopenharmony_ci asm volatile("kaddb %k7,%k6,%k5"); 20298c2ecf20Sopenharmony_ci asm volatile("kaddd %k7,%k6,%k5"); 20308c2ecf20Sopenharmony_ci 20318c2ecf20Sopenharmony_ci asm volatile("kunpckbw %k7,%k6,%k5"); 20328c2ecf20Sopenharmony_ci asm volatile("kunpckwd %k7,%k6,%k5"); 20338c2ecf20Sopenharmony_ci asm volatile("kunpckdq %k7,%k6,%k5"); 20348c2ecf20Sopenharmony_ci 20358c2ecf20Sopenharmony_ci asm volatile("kmovw %k6,%k5"); 20368c2ecf20Sopenharmony_ci asm volatile("kmovw (%ecx),%k5"); 20378c2ecf20Sopenharmony_ci asm volatile("kmovw 0x123(%eax,%ecx,8),%k5"); 20388c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,(%ecx)"); 20398c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,0x123(%eax,%ecx,8)"); 20408c2ecf20Sopenharmony_ci asm volatile("kmovw %eax,%k5"); 20418c2ecf20Sopenharmony_ci asm volatile("kmovw %ebp,%k5"); 20428c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,%eax"); 20438c2ecf20Sopenharmony_ci asm volatile("kmovw %k5,%ebp"); 20448c2ecf20Sopenharmony_ci 20458c2ecf20Sopenharmony_ci asm volatile("kmovq %k6,%k5"); 20468c2ecf20Sopenharmony_ci asm volatile("kmovq (%ecx),%k5"); 20478c2ecf20Sopenharmony_ci asm volatile("kmovq 0x123(%eax,%ecx,8),%k5"); 20488c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,(%ecx)"); 20498c2ecf20Sopenharmony_ci asm volatile("kmovq %k5,0x123(%eax,%ecx,8)"); 20508c2ecf20Sopenharmony_ci 20518c2ecf20Sopenharmony_ci asm volatile("kmovb %k6,%k5"); 20528c2ecf20Sopenharmony_ci asm volatile("kmovb (%ecx),%k5"); 20538c2ecf20Sopenharmony_ci asm volatile("kmovb 0x123(%eax,%ecx,8),%k5"); 20548c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,(%ecx)"); 20558c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,0x123(%eax,%ecx,8)"); 20568c2ecf20Sopenharmony_ci asm volatile("kmovb %eax,%k5"); 20578c2ecf20Sopenharmony_ci asm volatile("kmovb %ebp,%k5"); 20588c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,%eax"); 20598c2ecf20Sopenharmony_ci asm volatile("kmovb %k5,%ebp"); 20608c2ecf20Sopenharmony_ci 20618c2ecf20Sopenharmony_ci asm volatile("kmovd %k6,%k5"); 
20628c2ecf20Sopenharmony_ci asm volatile("kmovd (%ecx),%k5"); 20638c2ecf20Sopenharmony_ci asm volatile("kmovd 0x123(%eax,%ecx,8),%k5"); 20648c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,(%ecx)"); 20658c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,0x123(%eax,%ecx,8)"); 20668c2ecf20Sopenharmony_ci asm volatile("kmovd %eax,%k5"); 20678c2ecf20Sopenharmony_ci asm volatile("kmovd %ebp,%k5"); 20688c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,%eax"); 20698c2ecf20Sopenharmony_ci asm volatile("kmovd %k5,%ebp"); 20708c2ecf20Sopenharmony_ci 20718c2ecf20Sopenharmony_ci asm volatile("kortestw %k6,%k5"); 20728c2ecf20Sopenharmony_ci asm volatile("kortestq %k6,%k5"); 20738c2ecf20Sopenharmony_ci asm volatile("kortestb %k6,%k5"); 20748c2ecf20Sopenharmony_ci asm volatile("kortestd %k6,%k5"); 20758c2ecf20Sopenharmony_ci 20768c2ecf20Sopenharmony_ci asm volatile("ktestw %k6,%k5"); 20778c2ecf20Sopenharmony_ci asm volatile("ktestq %k6,%k5"); 20788c2ecf20Sopenharmony_ci asm volatile("ktestb %k6,%k5"); 20798c2ecf20Sopenharmony_ci asm volatile("ktestd %k6,%k5"); 20808c2ecf20Sopenharmony_ci 20818c2ecf20Sopenharmony_ci asm volatile("kshiftrw $0x12,%k6,%k5"); 20828c2ecf20Sopenharmony_ci asm volatile("kshiftrq $0x5b,%k6,%k5"); 20838c2ecf20Sopenharmony_ci asm volatile("kshiftlw $0x12,%k6,%k5"); 20848c2ecf20Sopenharmony_ci asm volatile("kshiftlq $0x5b,%k6,%k5"); 20858c2ecf20Sopenharmony_ci 20868c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 5b */ 20878c2ecf20Sopenharmony_ci asm volatile("vcvtdq2ps %xmm5,%xmm6"); 20888c2ecf20Sopenharmony_ci asm volatile("vcvtqq2ps %zmm5,%ymm6{%k7}"); 20898c2ecf20Sopenharmony_ci asm volatile("vcvtps2dq %xmm5,%xmm6"); 20908c2ecf20Sopenharmony_ci asm volatile("vcvttps2dq %xmm5,%xmm6"); 20918c2ecf20Sopenharmony_ci 20928c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 6f */ 20938c2ecf20Sopenharmony_ci 20948c2ecf20Sopenharmony_ci asm volatile("movq %mm0,%mm4"); 20958c2ecf20Sopenharmony_ci asm volatile("vmovdqa %ymm4,%ymm6"); 20968c2ecf20Sopenharmony_ci asm 
volatile("vmovdqa32 %zmm5,%zmm6"); 20978c2ecf20Sopenharmony_ci asm volatile("vmovdqa64 %zmm5,%zmm6"); 20988c2ecf20Sopenharmony_ci asm volatile("vmovdqu %ymm4,%ymm6"); 20998c2ecf20Sopenharmony_ci asm volatile("vmovdqu32 %zmm5,%zmm6"); 21008c2ecf20Sopenharmony_ci asm volatile("vmovdqu64 %zmm5,%zmm6"); 21018c2ecf20Sopenharmony_ci asm volatile("vmovdqu8 %zmm5,%zmm6"); 21028c2ecf20Sopenharmony_ci asm volatile("vmovdqu16 %zmm5,%zmm6"); 21038c2ecf20Sopenharmony_ci 21048c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 78 */ 21058c2ecf20Sopenharmony_ci 21068c2ecf20Sopenharmony_ci asm volatile("vmread %eax,%ebx"); 21078c2ecf20Sopenharmony_ci asm volatile("vcvttps2udq %zmm5,%zmm6"); 21088c2ecf20Sopenharmony_ci asm volatile("vcvttpd2udq %zmm5,%ymm6{%k7}"); 21098c2ecf20Sopenharmony_ci asm volatile("vcvttsd2usi %xmm6,%eax"); 21108c2ecf20Sopenharmony_ci asm volatile("vcvttss2usi %xmm6,%eax"); 21118c2ecf20Sopenharmony_ci asm volatile("vcvttps2uqq %ymm5,%zmm6{%k7}"); 21128c2ecf20Sopenharmony_ci asm volatile("vcvttpd2uqq %zmm5,%zmm6"); 21138c2ecf20Sopenharmony_ci 21148c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 79 */ 21158c2ecf20Sopenharmony_ci 21168c2ecf20Sopenharmony_ci asm volatile("vmwrite %eax,%ebx"); 21178c2ecf20Sopenharmony_ci asm volatile("vcvtps2udq %zmm5,%zmm6"); 21188c2ecf20Sopenharmony_ci asm volatile("vcvtpd2udq %zmm5,%ymm6{%k7}"); 21198c2ecf20Sopenharmony_ci asm volatile("vcvtsd2usi %xmm6,%eax"); 21208c2ecf20Sopenharmony_ci asm volatile("vcvtss2usi %xmm6,%eax"); 21218c2ecf20Sopenharmony_ci asm volatile("vcvtps2uqq %ymm5,%zmm6{%k7}"); 21228c2ecf20Sopenharmony_ci asm volatile("vcvtpd2uqq %zmm5,%zmm6"); 21238c2ecf20Sopenharmony_ci 21248c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 7a */ 21258c2ecf20Sopenharmony_ci 21268c2ecf20Sopenharmony_ci asm volatile("vcvtudq2pd %ymm5,%zmm6{%k7}"); 21278c2ecf20Sopenharmony_ci asm volatile("vcvtuqq2pd %zmm5,%zmm6"); 21288c2ecf20Sopenharmony_ci asm volatile("vcvtudq2ps %zmm5,%zmm6"); 21298c2ecf20Sopenharmony_ci asm volatile("vcvtuqq2ps 
%zmm5,%ymm6{%k7}"); 21308c2ecf20Sopenharmony_ci asm volatile("vcvttps2qq %ymm5,%zmm6{%k7}"); 21318c2ecf20Sopenharmony_ci asm volatile("vcvttpd2qq %zmm5,%zmm6"); 21328c2ecf20Sopenharmony_ci 21338c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 7b */ 21348c2ecf20Sopenharmony_ci 21358c2ecf20Sopenharmony_ci asm volatile("vcvtusi2sd %eax,%xmm5,%xmm6"); 21368c2ecf20Sopenharmony_ci asm volatile("vcvtusi2ss %eax,%xmm5,%xmm6"); 21378c2ecf20Sopenharmony_ci asm volatile("vcvtps2qq %ymm5,%zmm6{%k7}"); 21388c2ecf20Sopenharmony_ci asm volatile("vcvtpd2qq %zmm5,%zmm6"); 21398c2ecf20Sopenharmony_ci 21408c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 7f */ 21418c2ecf20Sopenharmony_ci 21428c2ecf20Sopenharmony_ci asm volatile("movq.s %mm0,%mm4"); 21438c2ecf20Sopenharmony_ci asm volatile("vmovdqa.s %ymm5,%ymm6"); 21448c2ecf20Sopenharmony_ci asm volatile("vmovdqa32.s %zmm5,%zmm6"); 21458c2ecf20Sopenharmony_ci asm volatile("vmovdqa64.s %zmm5,%zmm6"); 21468c2ecf20Sopenharmony_ci asm volatile("vmovdqu.s %ymm5,%ymm6"); 21478c2ecf20Sopenharmony_ci asm volatile("vmovdqu32.s %zmm5,%zmm6"); 21488c2ecf20Sopenharmony_ci asm volatile("vmovdqu64.s %zmm5,%zmm6"); 21498c2ecf20Sopenharmony_ci asm volatile("vmovdqu8.s %zmm5,%zmm6"); 21508c2ecf20Sopenharmony_ci asm volatile("vmovdqu16.s %zmm5,%zmm6"); 21518c2ecf20Sopenharmony_ci 21528c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f db */ 21538c2ecf20Sopenharmony_ci 21548c2ecf20Sopenharmony_ci asm volatile("pand %mm1,%mm2"); 21558c2ecf20Sopenharmony_ci asm volatile("pand %xmm1,%xmm2"); 21568c2ecf20Sopenharmony_ci asm volatile("vpand %ymm4,%ymm6,%ymm2"); 21578c2ecf20Sopenharmony_ci asm volatile("vpandd %zmm4,%zmm5,%zmm6"); 21588c2ecf20Sopenharmony_ci asm volatile("vpandq %zmm4,%zmm5,%zmm6"); 21598c2ecf20Sopenharmony_ci 21608c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f df */ 21618c2ecf20Sopenharmony_ci 21628c2ecf20Sopenharmony_ci asm volatile("pandn %mm1,%mm2"); 21638c2ecf20Sopenharmony_ci asm volatile("pandn %xmm1,%xmm2"); 21648c2ecf20Sopenharmony_ci asm 
volatile("vpandn %ymm4,%ymm6,%ymm2"); 21658c2ecf20Sopenharmony_ci asm volatile("vpandnd %zmm4,%zmm5,%zmm6"); 21668c2ecf20Sopenharmony_ci asm volatile("vpandnq %zmm4,%zmm5,%zmm6"); 21678c2ecf20Sopenharmony_ci 21688c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f e6 */ 21698c2ecf20Sopenharmony_ci 21708c2ecf20Sopenharmony_ci asm volatile("vcvttpd2dq %xmm1,%xmm2"); 21718c2ecf20Sopenharmony_ci asm volatile("vcvtdq2pd %xmm5,%xmm6"); 21728c2ecf20Sopenharmony_ci asm volatile("vcvtdq2pd %ymm5,%zmm6{%k7}"); 21738c2ecf20Sopenharmony_ci asm volatile("vcvtqq2pd %zmm5,%zmm6"); 21748c2ecf20Sopenharmony_ci asm volatile("vcvtpd2dq %xmm1,%xmm2"); 21758c2ecf20Sopenharmony_ci 21768c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f eb */ 21778c2ecf20Sopenharmony_ci 21788c2ecf20Sopenharmony_ci asm volatile("por %mm4,%mm6"); 21798c2ecf20Sopenharmony_ci asm volatile("vpor %ymm4,%ymm6,%ymm2"); 21808c2ecf20Sopenharmony_ci asm volatile("vpord %zmm4,%zmm5,%zmm6"); 21818c2ecf20Sopenharmony_ci asm volatile("vporq %zmm4,%zmm5,%zmm6"); 21828c2ecf20Sopenharmony_ci 21838c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f ef */ 21848c2ecf20Sopenharmony_ci 21858c2ecf20Sopenharmony_ci asm volatile("pxor %mm4,%mm6"); 21868c2ecf20Sopenharmony_ci asm volatile("vpxor %ymm4,%ymm6,%ymm2"); 21878c2ecf20Sopenharmony_ci asm volatile("vpxord %zmm4,%zmm5,%zmm6"); 21888c2ecf20Sopenharmony_ci asm volatile("vpxorq %zmm4,%zmm5,%zmm6"); 21898c2ecf20Sopenharmony_ci 21908c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 10 */ 21918c2ecf20Sopenharmony_ci 21928c2ecf20Sopenharmony_ci asm volatile("pblendvb %xmm1,%xmm0"); 21938c2ecf20Sopenharmony_ci asm volatile("vpsrlvw %zmm4,%zmm5,%zmm6"); 21948c2ecf20Sopenharmony_ci asm volatile("vpmovuswb %zmm5,%ymm6{%k7}"); 21958c2ecf20Sopenharmony_ci 21968c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 11 */ 21978c2ecf20Sopenharmony_ci 21988c2ecf20Sopenharmony_ci asm volatile("vpmovusdb %zmm5,%xmm6{%k7}"); 21998c2ecf20Sopenharmony_ci asm volatile("vpsravw %zmm4,%zmm5,%zmm6"); 
22008c2ecf20Sopenharmony_ci 22018c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 12 */ 22028c2ecf20Sopenharmony_ci 22038c2ecf20Sopenharmony_ci asm volatile("vpmovusqb %zmm5,%xmm6{%k7}"); 22048c2ecf20Sopenharmony_ci asm volatile("vpsllvw %zmm4,%zmm5,%zmm6"); 22058c2ecf20Sopenharmony_ci 22068c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 13 */ 22078c2ecf20Sopenharmony_ci 22088c2ecf20Sopenharmony_ci asm volatile("vcvtph2ps %xmm3,%ymm5"); 22098c2ecf20Sopenharmony_ci asm volatile("vcvtph2ps %ymm5,%zmm6{%k7}"); 22108c2ecf20Sopenharmony_ci asm volatile("vpmovusdw %zmm5,%ymm6{%k7}"); 22118c2ecf20Sopenharmony_ci 22128c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 14 */ 22138c2ecf20Sopenharmony_ci 22148c2ecf20Sopenharmony_ci asm volatile("blendvps %xmm1,%xmm0"); 22158c2ecf20Sopenharmony_ci asm volatile("vpmovusqw %zmm5,%xmm6{%k7}"); 22168c2ecf20Sopenharmony_ci asm volatile("vprorvd %zmm4,%zmm5,%zmm6"); 22178c2ecf20Sopenharmony_ci asm volatile("vprorvq %zmm4,%zmm5,%zmm6"); 22188c2ecf20Sopenharmony_ci 22198c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 15 */ 22208c2ecf20Sopenharmony_ci 22218c2ecf20Sopenharmony_ci asm volatile("blendvpd %xmm1,%xmm0"); 22228c2ecf20Sopenharmony_ci asm volatile("vpmovusqd %zmm5,%ymm6{%k7}"); 22238c2ecf20Sopenharmony_ci asm volatile("vprolvd %zmm4,%zmm5,%zmm6"); 22248c2ecf20Sopenharmony_ci asm volatile("vprolvq %zmm4,%zmm5,%zmm6"); 22258c2ecf20Sopenharmony_ci 22268c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 16 */ 22278c2ecf20Sopenharmony_ci 22288c2ecf20Sopenharmony_ci asm volatile("vpermps %ymm4,%ymm6,%ymm2"); 22298c2ecf20Sopenharmony_ci asm volatile("vpermps %ymm4,%ymm6,%ymm2{%k7}"); 22308c2ecf20Sopenharmony_ci asm volatile("vpermpd %ymm4,%ymm6,%ymm2{%k7}"); 22318c2ecf20Sopenharmony_ci 22328c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 19 */ 22338c2ecf20Sopenharmony_ci 22348c2ecf20Sopenharmony_ci asm volatile("vbroadcastsd %xmm4,%ymm6"); 22358c2ecf20Sopenharmony_ci asm volatile("vbroadcastf32x2 %xmm7,%zmm6"); 
22368c2ecf20Sopenharmony_ci 22378c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 1a */ 22388c2ecf20Sopenharmony_ci 22398c2ecf20Sopenharmony_ci asm volatile("vbroadcastf128 (%ecx),%ymm4"); 22408c2ecf20Sopenharmony_ci asm volatile("vbroadcastf32x4 (%ecx),%zmm6"); 22418c2ecf20Sopenharmony_ci asm volatile("vbroadcastf64x2 (%ecx),%zmm6"); 22428c2ecf20Sopenharmony_ci 22438c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 1b */ 22448c2ecf20Sopenharmony_ci 22458c2ecf20Sopenharmony_ci asm volatile("vbroadcastf32x8 (%ecx),%zmm6"); 22468c2ecf20Sopenharmony_ci asm volatile("vbroadcastf64x4 (%ecx),%zmm6"); 22478c2ecf20Sopenharmony_ci 22488c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 1f */ 22498c2ecf20Sopenharmony_ci 22508c2ecf20Sopenharmony_ci asm volatile("vpabsq %zmm4,%zmm6"); 22518c2ecf20Sopenharmony_ci 22528c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 20 */ 22538c2ecf20Sopenharmony_ci 22548c2ecf20Sopenharmony_ci asm volatile("vpmovsxbw %xmm4,%xmm5"); 22558c2ecf20Sopenharmony_ci asm volatile("vpmovswb %zmm5,%ymm6{%k7}"); 22568c2ecf20Sopenharmony_ci 22578c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 21 */ 22588c2ecf20Sopenharmony_ci 22598c2ecf20Sopenharmony_ci asm volatile("vpmovsxbd %xmm4,%ymm6"); 22608c2ecf20Sopenharmony_ci asm volatile("vpmovsdb %zmm5,%xmm6{%k7}"); 22618c2ecf20Sopenharmony_ci 22628c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 22 */ 22638c2ecf20Sopenharmony_ci 22648c2ecf20Sopenharmony_ci asm volatile("vpmovsxbq %xmm4,%ymm4"); 22658c2ecf20Sopenharmony_ci asm volatile("vpmovsqb %zmm5,%xmm6{%k7}"); 22668c2ecf20Sopenharmony_ci 22678c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 23 */ 22688c2ecf20Sopenharmony_ci 22698c2ecf20Sopenharmony_ci asm volatile("vpmovsxwd %xmm4,%ymm4"); 22708c2ecf20Sopenharmony_ci asm volatile("vpmovsdw %zmm5,%ymm6{%k7}"); 22718c2ecf20Sopenharmony_ci 22728c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 24 */ 22738c2ecf20Sopenharmony_ci 22748c2ecf20Sopenharmony_ci asm volatile("vpmovsxwq %xmm4,%ymm6"); 
22758c2ecf20Sopenharmony_ci asm volatile("vpmovsqw %zmm5,%xmm6{%k7}"); 22768c2ecf20Sopenharmony_ci 22778c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 25 */ 22788c2ecf20Sopenharmony_ci 22798c2ecf20Sopenharmony_ci asm volatile("vpmovsxdq %xmm4,%ymm4"); 22808c2ecf20Sopenharmony_ci asm volatile("vpmovsqd %zmm5,%ymm6{%k7}"); 22818c2ecf20Sopenharmony_ci 22828c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 26 */ 22838c2ecf20Sopenharmony_ci 22848c2ecf20Sopenharmony_ci asm volatile("vptestmb %zmm5,%zmm6,%k5"); 22858c2ecf20Sopenharmony_ci asm volatile("vptestmw %zmm5,%zmm6,%k5"); 22868c2ecf20Sopenharmony_ci asm volatile("vptestnmb %zmm4,%zmm5,%k5"); 22878c2ecf20Sopenharmony_ci asm volatile("vptestnmw %zmm4,%zmm5,%k5"); 22888c2ecf20Sopenharmony_ci 22898c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 27 */ 22908c2ecf20Sopenharmony_ci 22918c2ecf20Sopenharmony_ci asm volatile("vptestmd %zmm5,%zmm6,%k5"); 22928c2ecf20Sopenharmony_ci asm volatile("vptestmq %zmm5,%zmm6,%k5"); 22938c2ecf20Sopenharmony_ci asm volatile("vptestnmd %zmm4,%zmm5,%k5"); 22948c2ecf20Sopenharmony_ci asm volatile("vptestnmq %zmm4,%zmm5,%k5"); 22958c2ecf20Sopenharmony_ci 22968c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 28 */ 22978c2ecf20Sopenharmony_ci 22988c2ecf20Sopenharmony_ci asm volatile("vpmuldq %ymm4,%ymm6,%ymm2"); 22998c2ecf20Sopenharmony_ci asm volatile("vpmovm2b %k5,%zmm6"); 23008c2ecf20Sopenharmony_ci asm volatile("vpmovm2w %k5,%zmm6"); 23018c2ecf20Sopenharmony_ci 23028c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 29 */ 23038c2ecf20Sopenharmony_ci 23048c2ecf20Sopenharmony_ci asm volatile("vpcmpeqq %ymm4,%ymm6,%ymm2"); 23058c2ecf20Sopenharmony_ci asm volatile("vpmovb2m %zmm6,%k5"); 23068c2ecf20Sopenharmony_ci asm volatile("vpmovw2m %zmm6,%k5"); 23078c2ecf20Sopenharmony_ci 23088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 2a */ 23098c2ecf20Sopenharmony_ci 23108c2ecf20Sopenharmony_ci asm volatile("vmovntdqa (%ecx),%ymm4"); 23118c2ecf20Sopenharmony_ci asm volatile("vpbroadcastmb2q 
%k6,%zmm1"); 23128c2ecf20Sopenharmony_ci 23138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 2c */ 23148c2ecf20Sopenharmony_ci 23158c2ecf20Sopenharmony_ci asm volatile("vmaskmovps (%ecx),%ymm4,%ymm6"); 23168c2ecf20Sopenharmony_ci asm volatile("vscalefps %zmm4,%zmm5,%zmm6"); 23178c2ecf20Sopenharmony_ci asm volatile("vscalefpd %zmm4,%zmm5,%zmm6"); 23188c2ecf20Sopenharmony_ci 23198c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 2d */ 23208c2ecf20Sopenharmony_ci 23218c2ecf20Sopenharmony_ci asm volatile("vmaskmovpd (%ecx),%ymm4,%ymm6"); 23228c2ecf20Sopenharmony_ci asm volatile("vscalefss %xmm4,%xmm5,%xmm6{%k7}"); 23238c2ecf20Sopenharmony_ci asm volatile("vscalefsd %xmm4,%xmm5,%xmm6{%k7}"); 23248c2ecf20Sopenharmony_ci 23258c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 30 */ 23268c2ecf20Sopenharmony_ci 23278c2ecf20Sopenharmony_ci asm volatile("vpmovzxbw %xmm4,%ymm4"); 23288c2ecf20Sopenharmony_ci asm volatile("vpmovwb %zmm5,%ymm6{%k7}"); 23298c2ecf20Sopenharmony_ci 23308c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 31 */ 23318c2ecf20Sopenharmony_ci 23328c2ecf20Sopenharmony_ci asm volatile("vpmovzxbd %xmm4,%ymm6"); 23338c2ecf20Sopenharmony_ci asm volatile("vpmovdb %zmm5,%xmm6{%k7}"); 23348c2ecf20Sopenharmony_ci 23358c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 32 */ 23368c2ecf20Sopenharmony_ci 23378c2ecf20Sopenharmony_ci asm volatile("vpmovzxbq %xmm4,%ymm4"); 23388c2ecf20Sopenharmony_ci asm volatile("vpmovqb %zmm5,%xmm6{%k7}"); 23398c2ecf20Sopenharmony_ci 23408c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 33 */ 23418c2ecf20Sopenharmony_ci 23428c2ecf20Sopenharmony_ci asm volatile("vpmovzxwd %xmm4,%ymm4"); 23438c2ecf20Sopenharmony_ci asm volatile("vpmovdw %zmm5,%ymm6{%k7}"); 23448c2ecf20Sopenharmony_ci 23458c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 34 */ 23468c2ecf20Sopenharmony_ci 23478c2ecf20Sopenharmony_ci asm volatile("vpmovzxwq %xmm4,%ymm6"); 23488c2ecf20Sopenharmony_ci asm volatile("vpmovqw %zmm5,%xmm6{%k7}"); 23498c2ecf20Sopenharmony_ci 
23508c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 35 */ 23518c2ecf20Sopenharmony_ci 23528c2ecf20Sopenharmony_ci asm volatile("vpmovzxdq %xmm4,%ymm4"); 23538c2ecf20Sopenharmony_ci asm volatile("vpmovqd %zmm5,%ymm6{%k7}"); 23548c2ecf20Sopenharmony_ci 23558c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 36 */ 23568c2ecf20Sopenharmony_ci 23578c2ecf20Sopenharmony_ci asm volatile("vpermd %ymm4,%ymm6,%ymm2"); 23588c2ecf20Sopenharmony_ci asm volatile("vpermd %ymm4,%ymm6,%ymm2{%k7}"); 23598c2ecf20Sopenharmony_ci asm volatile("vpermq %ymm4,%ymm6,%ymm2{%k7}"); 23608c2ecf20Sopenharmony_ci 23618c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 38 */ 23628c2ecf20Sopenharmony_ci 23638c2ecf20Sopenharmony_ci asm volatile("vpminsb %ymm4,%ymm6,%ymm2"); 23648c2ecf20Sopenharmony_ci asm volatile("vpmovm2d %k5,%zmm6"); 23658c2ecf20Sopenharmony_ci asm volatile("vpmovm2q %k5,%zmm6"); 23668c2ecf20Sopenharmony_ci 23678c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 39 */ 23688c2ecf20Sopenharmony_ci 23698c2ecf20Sopenharmony_ci asm volatile("vpminsd %xmm1,%xmm2,%xmm3"); 23708c2ecf20Sopenharmony_ci asm volatile("vpminsd %zmm4,%zmm5,%zmm6"); 23718c2ecf20Sopenharmony_ci asm volatile("vpminsq %zmm4,%zmm5,%zmm6"); 23728c2ecf20Sopenharmony_ci asm volatile("vpmovd2m %zmm6,%k5"); 23738c2ecf20Sopenharmony_ci asm volatile("vpmovq2m %zmm6,%k5"); 23748c2ecf20Sopenharmony_ci 23758c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3a */ 23768c2ecf20Sopenharmony_ci 23778c2ecf20Sopenharmony_ci asm volatile("vpminuw %ymm4,%ymm6,%ymm2"); 23788c2ecf20Sopenharmony_ci asm volatile("vpbroadcastmw2d %k6,%zmm6"); 23798c2ecf20Sopenharmony_ci 23808c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3b */ 23818c2ecf20Sopenharmony_ci 23828c2ecf20Sopenharmony_ci asm volatile("vpminud %ymm4,%ymm6,%ymm2"); 23838c2ecf20Sopenharmony_ci asm volatile("vpminud %zmm4,%zmm5,%zmm6"); 23848c2ecf20Sopenharmony_ci asm volatile("vpminuq %zmm4,%zmm5,%zmm6"); 23858c2ecf20Sopenharmony_ci 23868c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 
38 3d */ 23878c2ecf20Sopenharmony_ci 23888c2ecf20Sopenharmony_ci asm volatile("vpmaxsd %ymm4,%ymm6,%ymm2"); 23898c2ecf20Sopenharmony_ci asm volatile("vpmaxsd %zmm4,%zmm5,%zmm6"); 23908c2ecf20Sopenharmony_ci asm volatile("vpmaxsq %zmm4,%zmm5,%zmm6"); 23918c2ecf20Sopenharmony_ci 23928c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 3f */ 23938c2ecf20Sopenharmony_ci 23948c2ecf20Sopenharmony_ci asm volatile("vpmaxud %ymm4,%ymm6,%ymm2"); 23958c2ecf20Sopenharmony_ci asm volatile("vpmaxud %zmm4,%zmm5,%zmm6"); 23968c2ecf20Sopenharmony_ci asm volatile("vpmaxuq %zmm4,%zmm5,%zmm6"); 23978c2ecf20Sopenharmony_ci 23988c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 40 */ 23998c2ecf20Sopenharmony_ci 24008c2ecf20Sopenharmony_ci asm volatile("vpmulld %ymm4,%ymm6,%ymm2"); 24018c2ecf20Sopenharmony_ci asm volatile("vpmulld %zmm4,%zmm5,%zmm6"); 24028c2ecf20Sopenharmony_ci asm volatile("vpmullq %zmm4,%zmm5,%zmm6"); 24038c2ecf20Sopenharmony_ci 24048c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 42 */ 24058c2ecf20Sopenharmony_ci 24068c2ecf20Sopenharmony_ci asm volatile("vgetexpps %zmm5,%zmm6"); 24078c2ecf20Sopenharmony_ci asm volatile("vgetexppd %zmm5,%zmm6"); 24088c2ecf20Sopenharmony_ci 24098c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 43 */ 24108c2ecf20Sopenharmony_ci 24118c2ecf20Sopenharmony_ci asm volatile("vgetexpss %xmm4,%xmm5,%xmm6{%k7}"); 24128c2ecf20Sopenharmony_ci asm volatile("vgetexpsd %xmm2,%xmm3,%xmm4{%k7}"); 24138c2ecf20Sopenharmony_ci 24148c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 44 */ 24158c2ecf20Sopenharmony_ci 24168c2ecf20Sopenharmony_ci asm volatile("vplzcntd %zmm5,%zmm6"); 24178c2ecf20Sopenharmony_ci asm volatile("vplzcntq %zmm5,%zmm6"); 24188c2ecf20Sopenharmony_ci 24198c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 46 */ 24208c2ecf20Sopenharmony_ci 24218c2ecf20Sopenharmony_ci asm volatile("vpsravd %ymm4,%ymm6,%ymm2"); 24228c2ecf20Sopenharmony_ci asm volatile("vpsravd %zmm4,%zmm5,%zmm6"); 24238c2ecf20Sopenharmony_ci asm volatile("vpsravq 
%zmm4,%zmm5,%zmm6"); 24248c2ecf20Sopenharmony_ci 24258c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4c */ 24268c2ecf20Sopenharmony_ci 24278c2ecf20Sopenharmony_ci asm volatile("vrcp14ps %zmm5,%zmm6"); 24288c2ecf20Sopenharmony_ci asm volatile("vrcp14pd %zmm5,%zmm6"); 24298c2ecf20Sopenharmony_ci 24308c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4d */ 24318c2ecf20Sopenharmony_ci 24328c2ecf20Sopenharmony_ci asm volatile("vrcp14ss %xmm4,%xmm5,%xmm6{%k7}"); 24338c2ecf20Sopenharmony_ci asm volatile("vrcp14sd %xmm4,%xmm5,%xmm6{%k7}"); 24348c2ecf20Sopenharmony_ci 24358c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4e */ 24368c2ecf20Sopenharmony_ci 24378c2ecf20Sopenharmony_ci asm volatile("vrsqrt14ps %zmm5,%zmm6"); 24388c2ecf20Sopenharmony_ci asm volatile("vrsqrt14pd %zmm5,%zmm6"); 24398c2ecf20Sopenharmony_ci 24408c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 4f */ 24418c2ecf20Sopenharmony_ci 24428c2ecf20Sopenharmony_ci asm volatile("vrsqrt14ss %xmm4,%xmm5,%xmm6{%k7}"); 24438c2ecf20Sopenharmony_ci asm volatile("vrsqrt14sd %xmm4,%xmm5,%xmm6{%k7}"); 24448c2ecf20Sopenharmony_ci 24458c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 50 */ 24468c2ecf20Sopenharmony_ci 24478c2ecf20Sopenharmony_ci asm volatile("vpdpbusd %xmm1, %xmm2, %xmm3"); 24488c2ecf20Sopenharmony_ci asm volatile("vpdpbusd %ymm1, %ymm2, %ymm3"); 24498c2ecf20Sopenharmony_ci asm volatile("vpdpbusd %zmm1, %zmm2, %zmm3"); 24508c2ecf20Sopenharmony_ci asm volatile("vpdpbusd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 24518c2ecf20Sopenharmony_ci 24528c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 51 */ 24538c2ecf20Sopenharmony_ci 24548c2ecf20Sopenharmony_ci asm volatile("vpdpbusds %xmm1, %xmm2, %xmm3"); 24558c2ecf20Sopenharmony_ci asm volatile("vpdpbusds %ymm1, %ymm2, %ymm3"); 24568c2ecf20Sopenharmony_ci asm volatile("vpdpbusds %zmm1, %zmm2, %zmm3"); 24578c2ecf20Sopenharmony_ci asm volatile("vpdpbusds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 24588c2ecf20Sopenharmony_ci 24598c2ecf20Sopenharmony_ci /* AVX-512: Op 
code 0f 38 52 */ 24608c2ecf20Sopenharmony_ci 24618c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps %xmm1, %xmm2, %xmm3"); 24628c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps %ymm1, %ymm2, %ymm3"); 24638c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps %zmm1, %zmm2, %zmm3"); 24648c2ecf20Sopenharmony_ci asm volatile("vdpbf16ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 24658c2ecf20Sopenharmony_ci 24668c2ecf20Sopenharmony_ci asm volatile("vpdpwssd %xmm1, %xmm2, %xmm3"); 24678c2ecf20Sopenharmony_ci asm volatile("vpdpwssd %ymm1, %ymm2, %ymm3"); 24688c2ecf20Sopenharmony_ci asm volatile("vpdpwssd %zmm1, %zmm2, %zmm3"); 24698c2ecf20Sopenharmony_ci asm volatile("vpdpwssd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 24708c2ecf20Sopenharmony_ci 24718c2ecf20Sopenharmony_ci asm volatile("vp4dpwssd (%eax), %zmm0, %zmm4"); 24728c2ecf20Sopenharmony_ci asm volatile("vp4dpwssd 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 24738c2ecf20Sopenharmony_ci 24748c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 53 */ 24758c2ecf20Sopenharmony_ci 24768c2ecf20Sopenharmony_ci asm volatile("vpdpwssds %xmm1, %xmm2, %xmm3"); 24778c2ecf20Sopenharmony_ci asm volatile("vpdpwssds %ymm1, %ymm2, %ymm3"); 24788c2ecf20Sopenharmony_ci asm volatile("vpdpwssds %zmm1, %zmm2, %zmm3"); 24798c2ecf20Sopenharmony_ci asm volatile("vpdpwssds 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 24808c2ecf20Sopenharmony_ci 24818c2ecf20Sopenharmony_ci asm volatile("vp4dpwssds (%eax), %zmm0, %zmm4"); 24828c2ecf20Sopenharmony_ci asm volatile("vp4dpwssds 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 24838c2ecf20Sopenharmony_ci 24848c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 54 */ 24858c2ecf20Sopenharmony_ci 24868c2ecf20Sopenharmony_ci asm volatile("vpopcntb %xmm1, %xmm2"); 24878c2ecf20Sopenharmony_ci asm volatile("vpopcntb %ymm1, %ymm2"); 24888c2ecf20Sopenharmony_ci asm volatile("vpopcntb %zmm1, %zmm2"); 24898c2ecf20Sopenharmony_ci asm volatile("vpopcntb 0x12345678(%eax,%ecx,8),%zmm2"); 24908c2ecf20Sopenharmony_ci 24918c2ecf20Sopenharmony_ci asm 
volatile("vpopcntw %xmm1, %xmm2"); 24928c2ecf20Sopenharmony_ci asm volatile("vpopcntw %ymm1, %ymm2"); 24938c2ecf20Sopenharmony_ci asm volatile("vpopcntw %zmm1, %zmm2"); 24948c2ecf20Sopenharmony_ci asm volatile("vpopcntw 0x12345678(%eax,%ecx,8),%zmm2"); 24958c2ecf20Sopenharmony_ci 24968c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 55 */ 24978c2ecf20Sopenharmony_ci 24988c2ecf20Sopenharmony_ci asm volatile("vpopcntd %xmm1, %xmm2"); 24998c2ecf20Sopenharmony_ci asm volatile("vpopcntd %ymm1, %ymm2"); 25008c2ecf20Sopenharmony_ci asm volatile("vpopcntd %zmm1, %zmm2"); 25018c2ecf20Sopenharmony_ci asm volatile("vpopcntd 0x12345678(%eax,%ecx,8),%zmm2"); 25028c2ecf20Sopenharmony_ci 25038c2ecf20Sopenharmony_ci asm volatile("vpopcntq %xmm1, %xmm2"); 25048c2ecf20Sopenharmony_ci asm volatile("vpopcntq %ymm1, %ymm2"); 25058c2ecf20Sopenharmony_ci asm volatile("vpopcntq %zmm1, %zmm2"); 25068c2ecf20Sopenharmony_ci asm volatile("vpopcntq 0x12345678(%eax,%ecx,8),%zmm2"); 25078c2ecf20Sopenharmony_ci 25088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 59 */ 25098c2ecf20Sopenharmony_ci 25108c2ecf20Sopenharmony_ci asm volatile("vpbroadcastq %xmm4,%xmm6"); 25118c2ecf20Sopenharmony_ci asm volatile("vbroadcasti32x2 %xmm7,%zmm6"); 25128c2ecf20Sopenharmony_ci 25138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 5a */ 25148c2ecf20Sopenharmony_ci 25158c2ecf20Sopenharmony_ci asm volatile("vbroadcasti128 (%ecx),%ymm4"); 25168c2ecf20Sopenharmony_ci asm volatile("vbroadcasti32x4 (%ecx),%zmm6"); 25178c2ecf20Sopenharmony_ci asm volatile("vbroadcasti64x2 (%ecx),%zmm6"); 25188c2ecf20Sopenharmony_ci 25198c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 5b */ 25208c2ecf20Sopenharmony_ci 25218c2ecf20Sopenharmony_ci asm volatile("vbroadcasti32x8 (%ecx),%zmm6"); 25228c2ecf20Sopenharmony_ci asm volatile("vbroadcasti64x4 (%ecx),%zmm6"); 25238c2ecf20Sopenharmony_ci 25248c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 62 */ 25258c2ecf20Sopenharmony_ci 25268c2ecf20Sopenharmony_ci asm volatile("vpexpandb 
%xmm1, %xmm2"); 25278c2ecf20Sopenharmony_ci asm volatile("vpexpandb %ymm1, %ymm2"); 25288c2ecf20Sopenharmony_ci asm volatile("vpexpandb %zmm1, %zmm2"); 25298c2ecf20Sopenharmony_ci asm volatile("vpexpandb 0x12345678(%eax,%ecx,8),%zmm2"); 25308c2ecf20Sopenharmony_ci 25318c2ecf20Sopenharmony_ci asm volatile("vpexpandw %xmm1, %xmm2"); 25328c2ecf20Sopenharmony_ci asm volatile("vpexpandw %ymm1, %ymm2"); 25338c2ecf20Sopenharmony_ci asm volatile("vpexpandw %zmm1, %zmm2"); 25348c2ecf20Sopenharmony_ci asm volatile("vpexpandw 0x12345678(%eax,%ecx,8),%zmm2"); 25358c2ecf20Sopenharmony_ci 25368c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 63 */ 25378c2ecf20Sopenharmony_ci 25388c2ecf20Sopenharmony_ci asm volatile("vpcompressb %xmm1, %xmm2"); 25398c2ecf20Sopenharmony_ci asm volatile("vpcompressb %ymm1, %ymm2"); 25408c2ecf20Sopenharmony_ci asm volatile("vpcompressb %zmm1, %zmm2"); 25418c2ecf20Sopenharmony_ci asm volatile("vpcompressb %zmm2,0x12345678(%eax,%ecx,8)"); 25428c2ecf20Sopenharmony_ci 25438c2ecf20Sopenharmony_ci asm volatile("vpcompressw %xmm1, %xmm2"); 25448c2ecf20Sopenharmony_ci asm volatile("vpcompressw %ymm1, %ymm2"); 25458c2ecf20Sopenharmony_ci asm volatile("vpcompressw %zmm1, %zmm2"); 25468c2ecf20Sopenharmony_ci asm volatile("vpcompressw %zmm2,0x12345678(%eax,%ecx,8)"); 25478c2ecf20Sopenharmony_ci 25488c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 64 */ 25498c2ecf20Sopenharmony_ci 25508c2ecf20Sopenharmony_ci asm volatile("vpblendmd %zmm4,%zmm5,%zmm6"); 25518c2ecf20Sopenharmony_ci asm volatile("vpblendmq %zmm4,%zmm5,%zmm6"); 25528c2ecf20Sopenharmony_ci 25538c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 65 */ 25548c2ecf20Sopenharmony_ci 25558c2ecf20Sopenharmony_ci asm volatile("vblendmps %zmm4,%zmm5,%zmm6"); 25568c2ecf20Sopenharmony_ci asm volatile("vblendmpd %zmm4,%zmm5,%zmm6"); 25578c2ecf20Sopenharmony_ci 25588c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 66 */ 25598c2ecf20Sopenharmony_ci 25608c2ecf20Sopenharmony_ci asm volatile("vpblendmb 
%zmm4,%zmm5,%zmm6"); 25618c2ecf20Sopenharmony_ci asm volatile("vpblendmw %zmm4,%zmm5,%zmm6"); 25628c2ecf20Sopenharmony_ci 25638c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 68 */ 25648c2ecf20Sopenharmony_ci 25658c2ecf20Sopenharmony_ci asm volatile("vp2intersectd %xmm1, %xmm2, %k3"); 25668c2ecf20Sopenharmony_ci asm volatile("vp2intersectd %ymm1, %ymm2, %k3"); 25678c2ecf20Sopenharmony_ci asm volatile("vp2intersectd %zmm1, %zmm2, %k3"); 25688c2ecf20Sopenharmony_ci asm volatile("vp2intersectd 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 25698c2ecf20Sopenharmony_ci 25708c2ecf20Sopenharmony_ci asm volatile("vp2intersectq %xmm1, %xmm2, %k3"); 25718c2ecf20Sopenharmony_ci asm volatile("vp2intersectq %ymm1, %ymm2, %k3"); 25728c2ecf20Sopenharmony_ci asm volatile("vp2intersectq %zmm1, %zmm2, %k3"); 25738c2ecf20Sopenharmony_ci asm volatile("vp2intersectq 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 25748c2ecf20Sopenharmony_ci 25758c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 70 */ 25768c2ecf20Sopenharmony_ci 25778c2ecf20Sopenharmony_ci asm volatile("vpshldvw %xmm1, %xmm2, %xmm3"); 25788c2ecf20Sopenharmony_ci asm volatile("vpshldvw %ymm1, %ymm2, %ymm3"); 25798c2ecf20Sopenharmony_ci asm volatile("vpshldvw %zmm1, %zmm2, %zmm3"); 25808c2ecf20Sopenharmony_ci asm volatile("vpshldvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 25818c2ecf20Sopenharmony_ci 25828c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 71 */ 25838c2ecf20Sopenharmony_ci 25848c2ecf20Sopenharmony_ci asm volatile("vpshldvd %xmm1, %xmm2, %xmm3"); 25858c2ecf20Sopenharmony_ci asm volatile("vpshldvd %ymm1, %ymm2, %ymm3"); 25868c2ecf20Sopenharmony_ci asm volatile("vpshldvd %zmm1, %zmm2, %zmm3"); 25878c2ecf20Sopenharmony_ci asm volatile("vpshldvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 25888c2ecf20Sopenharmony_ci 25898c2ecf20Sopenharmony_ci asm volatile("vpshldvq %xmm1, %xmm2, %xmm3"); 25908c2ecf20Sopenharmony_ci asm volatile("vpshldvq %ymm1, %ymm2, %ymm3"); 25918c2ecf20Sopenharmony_ci asm volatile("vpshldvq %zmm1, %zmm2, %zmm3"); 
25928c2ecf20Sopenharmony_ci asm volatile("vpshldvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 25938c2ecf20Sopenharmony_ci 25948c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 72 */ 25958c2ecf20Sopenharmony_ci 25968c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 %xmm1, %xmm2, %xmm3"); 25978c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 %ymm1, %ymm2, %ymm3"); 25988c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 %zmm1, %zmm2, %zmm3"); 25998c2ecf20Sopenharmony_ci asm volatile("vcvtne2ps2bf16 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 26008c2ecf20Sopenharmony_ci 26018c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 %xmm1, %xmm2"); 26028c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 %ymm1, %xmm2"); 26038c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 %zmm1, %ymm2"); 26048c2ecf20Sopenharmony_ci asm volatile("vcvtneps2bf16 0x12345678(%eax,%ecx,8),%ymm2"); 26058c2ecf20Sopenharmony_ci 26068c2ecf20Sopenharmony_ci asm volatile("vpshrdvw %xmm1, %xmm2, %xmm3"); 26078c2ecf20Sopenharmony_ci asm volatile("vpshrdvw %ymm1, %ymm2, %ymm3"); 26088c2ecf20Sopenharmony_ci asm volatile("vpshrdvw %zmm1, %zmm2, %zmm3"); 26098c2ecf20Sopenharmony_ci asm volatile("vpshrdvw 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 26108c2ecf20Sopenharmony_ci 26118c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 73 */ 26128c2ecf20Sopenharmony_ci 26138c2ecf20Sopenharmony_ci asm volatile("vpshrdvd %xmm1, %xmm2, %xmm3"); 26148c2ecf20Sopenharmony_ci asm volatile("vpshrdvd %ymm1, %ymm2, %ymm3"); 26158c2ecf20Sopenharmony_ci asm volatile("vpshrdvd %zmm1, %zmm2, %zmm3"); 26168c2ecf20Sopenharmony_ci asm volatile("vpshrdvd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 26178c2ecf20Sopenharmony_ci 26188c2ecf20Sopenharmony_ci asm volatile("vpshrdvq %xmm1, %xmm2, %xmm3"); 26198c2ecf20Sopenharmony_ci asm volatile("vpshrdvq %ymm1, %ymm2, %ymm3"); 26208c2ecf20Sopenharmony_ci asm volatile("vpshrdvq %zmm1, %zmm2, %zmm3"); 26218c2ecf20Sopenharmony_ci asm volatile("vpshrdvq 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 
26228c2ecf20Sopenharmony_ci 26238c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 75 */ 26248c2ecf20Sopenharmony_ci 26258c2ecf20Sopenharmony_ci asm volatile("vpermi2b %zmm4,%zmm5,%zmm6"); 26268c2ecf20Sopenharmony_ci asm volatile("vpermi2w %zmm4,%zmm5,%zmm6"); 26278c2ecf20Sopenharmony_ci 26288c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 76 */ 26298c2ecf20Sopenharmony_ci 26308c2ecf20Sopenharmony_ci asm volatile("vpermi2d %zmm4,%zmm5,%zmm6"); 26318c2ecf20Sopenharmony_ci asm volatile("vpermi2q %zmm4,%zmm5,%zmm6"); 26328c2ecf20Sopenharmony_ci 26338c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 77 */ 26348c2ecf20Sopenharmony_ci 26358c2ecf20Sopenharmony_ci asm volatile("vpermi2ps %zmm4,%zmm5,%zmm6"); 26368c2ecf20Sopenharmony_ci asm volatile("vpermi2pd %zmm4,%zmm5,%zmm6"); 26378c2ecf20Sopenharmony_ci 26388c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7a */ 26398c2ecf20Sopenharmony_ci 26408c2ecf20Sopenharmony_ci asm volatile("vpbroadcastb %eax,%xmm3"); 26418c2ecf20Sopenharmony_ci 26428c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7b */ 26438c2ecf20Sopenharmony_ci 26448c2ecf20Sopenharmony_ci asm volatile("vpbroadcastw %eax,%xmm3"); 26458c2ecf20Sopenharmony_ci 26468c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7c */ 26478c2ecf20Sopenharmony_ci 26488c2ecf20Sopenharmony_ci asm volatile("vpbroadcastd %eax,%xmm3"); 26498c2ecf20Sopenharmony_ci 26508c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7d */ 26518c2ecf20Sopenharmony_ci 26528c2ecf20Sopenharmony_ci asm volatile("vpermt2b %zmm4,%zmm5,%zmm6"); 26538c2ecf20Sopenharmony_ci asm volatile("vpermt2w %zmm4,%zmm5,%zmm6"); 26548c2ecf20Sopenharmony_ci 26558c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7e */ 26568c2ecf20Sopenharmony_ci 26578c2ecf20Sopenharmony_ci asm volatile("vpermt2d %zmm4,%zmm5,%zmm6"); 26588c2ecf20Sopenharmony_ci asm volatile("vpermt2q %zmm4,%zmm5,%zmm6"); 26598c2ecf20Sopenharmony_ci 26608c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 7f */ 26618c2ecf20Sopenharmony_ci 
26628c2ecf20Sopenharmony_ci asm volatile("vpermt2ps %zmm4,%zmm5,%zmm6"); 26638c2ecf20Sopenharmony_ci asm volatile("vpermt2pd %zmm4,%zmm5,%zmm6"); 26648c2ecf20Sopenharmony_ci 26658c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 83 */ 26668c2ecf20Sopenharmony_ci 26678c2ecf20Sopenharmony_ci asm volatile("vpmultishiftqb %zmm4,%zmm5,%zmm6"); 26688c2ecf20Sopenharmony_ci 26698c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 88 */ 26708c2ecf20Sopenharmony_ci 26718c2ecf20Sopenharmony_ci asm volatile("vexpandps (%ecx),%zmm6"); 26728c2ecf20Sopenharmony_ci asm volatile("vexpandpd (%ecx),%zmm6"); 26738c2ecf20Sopenharmony_ci 26748c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 89 */ 26758c2ecf20Sopenharmony_ci 26768c2ecf20Sopenharmony_ci asm volatile("vpexpandd (%ecx),%zmm6"); 26778c2ecf20Sopenharmony_ci asm volatile("vpexpandq (%ecx),%zmm6"); 26788c2ecf20Sopenharmony_ci 26798c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8a */ 26808c2ecf20Sopenharmony_ci 26818c2ecf20Sopenharmony_ci asm volatile("vcompressps %zmm6,(%ecx)"); 26828c2ecf20Sopenharmony_ci asm volatile("vcompresspd %zmm6,(%ecx)"); 26838c2ecf20Sopenharmony_ci 26848c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8b */ 26858c2ecf20Sopenharmony_ci 26868c2ecf20Sopenharmony_ci asm volatile("vpcompressd %zmm6,(%ecx)"); 26878c2ecf20Sopenharmony_ci asm volatile("vpcompressq %zmm6,(%ecx)"); 26888c2ecf20Sopenharmony_ci 26898c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8d */ 26908c2ecf20Sopenharmony_ci 26918c2ecf20Sopenharmony_ci asm volatile("vpermb %zmm4,%zmm5,%zmm6"); 26928c2ecf20Sopenharmony_ci asm volatile("vpermw %zmm4,%zmm5,%zmm6"); 26938c2ecf20Sopenharmony_ci 26948c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 8f */ 26958c2ecf20Sopenharmony_ci 26968c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb %xmm1, %xmm2, %k3"); 26978c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb %ymm1, %ymm2, %k3"); 26988c2ecf20Sopenharmony_ci asm volatile("vpshufbitqmb %zmm1, %zmm2, %k3"); 26998c2ecf20Sopenharmony_ci asm 
volatile("vpshufbitqmb 0x12345678(%eax,%ecx,8),%zmm2,%k3"); 27008c2ecf20Sopenharmony_ci 27018c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 90 */ 27028c2ecf20Sopenharmony_ci 27038c2ecf20Sopenharmony_ci asm volatile("vpgatherdd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 27048c2ecf20Sopenharmony_ci asm volatile("vpgatherdq %xmm2,0x04(%ebp,%xmm7,2),%xmm1"); 27058c2ecf20Sopenharmony_ci asm volatile("vpgatherdd 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 27068c2ecf20Sopenharmony_ci asm volatile("vpgatherdq 0x7b(%ebp,%ymm7,8),%zmm6{%k1}"); 27078c2ecf20Sopenharmony_ci 27088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 91 */ 27098c2ecf20Sopenharmony_ci 27108c2ecf20Sopenharmony_ci asm volatile("vpgatherqd %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 27118c2ecf20Sopenharmony_ci asm volatile("vpgatherqq %xmm2,0x02(%ebp,%xmm7,2),%xmm1"); 27128c2ecf20Sopenharmony_ci asm volatile("vpgatherqd 0x7b(%ebp,%zmm7,8),%ymm6{%k1}"); 27138c2ecf20Sopenharmony_ci asm volatile("vpgatherqq 0x7b(%ebp,%zmm7,8),%zmm6{%k1}"); 27148c2ecf20Sopenharmony_ci 27158c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 9a */ 27168c2ecf20Sopenharmony_ci 27178c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps %xmm1, %xmm2, %xmm3"); 27188c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps %ymm1, %ymm2, %ymm3"); 27198c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps %zmm1, %zmm2, %zmm3"); 27208c2ecf20Sopenharmony_ci asm volatile("vfmsub132ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 27218c2ecf20Sopenharmony_ci 27228c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd %xmm1, %xmm2, %xmm3"); 27238c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd %ymm1, %ymm2, %ymm3"); 27248c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd %zmm1, %zmm2, %zmm3"); 27258c2ecf20Sopenharmony_ci asm volatile("vfmsub132pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 27268c2ecf20Sopenharmony_ci 27278c2ecf20Sopenharmony_ci asm volatile("v4fmaddps (%eax), %zmm0, %zmm4"); 27288c2ecf20Sopenharmony_ci asm volatile("v4fmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 27298c2ecf20Sopenharmony_ci 
27308c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 9b */ 27318c2ecf20Sopenharmony_ci 27328c2ecf20Sopenharmony_ci asm volatile("vfmsub132ss %xmm1, %xmm2, %xmm3"); 27338c2ecf20Sopenharmony_ci asm volatile("vfmsub132ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 27348c2ecf20Sopenharmony_ci 27358c2ecf20Sopenharmony_ci asm volatile("vfmsub132sd %xmm1, %xmm2, %xmm3"); 27368c2ecf20Sopenharmony_ci asm volatile("vfmsub132sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 27378c2ecf20Sopenharmony_ci 27388c2ecf20Sopenharmony_ci asm volatile("v4fmaddss (%eax), %xmm0, %xmm4"); 27398c2ecf20Sopenharmony_ci asm volatile("v4fmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 27408c2ecf20Sopenharmony_ci 27418c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a0 */ 27428c2ecf20Sopenharmony_ci 27438c2ecf20Sopenharmony_ci asm volatile("vpscatterdd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 27448c2ecf20Sopenharmony_ci asm volatile("vpscatterdq %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 27458c2ecf20Sopenharmony_ci 27468c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a1 */ 27478c2ecf20Sopenharmony_ci 27488c2ecf20Sopenharmony_ci asm volatile("vpscatterqd %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 27498c2ecf20Sopenharmony_ci asm volatile("vpscatterqq %ymm6,0x7b(%ebp,%ymm7,8){%k1}"); 27508c2ecf20Sopenharmony_ci 27518c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a2 */ 27528c2ecf20Sopenharmony_ci 27538c2ecf20Sopenharmony_ci asm volatile("vscatterdps %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 27548c2ecf20Sopenharmony_ci asm volatile("vscatterdpd %zmm6,0x7b(%ebp,%ymm7,8){%k1}"); 27558c2ecf20Sopenharmony_ci 27568c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 a3 */ 27578c2ecf20Sopenharmony_ci 27588c2ecf20Sopenharmony_ci asm volatile("vscatterqps %ymm6,0x7b(%ebp,%zmm7,8){%k1}"); 27598c2ecf20Sopenharmony_ci asm volatile("vscatterqpd %zmm6,0x7b(%ebp,%zmm7,8){%k1}"); 27608c2ecf20Sopenharmony_ci 27618c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 aa */ 27628c2ecf20Sopenharmony_ci 27638c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps %xmm1, %xmm2, 
%xmm3"); 27648c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps %ymm1, %ymm2, %ymm3"); 27658c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps %zmm1, %zmm2, %zmm3"); 27668c2ecf20Sopenharmony_ci asm volatile("vfmsub213ps 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 27678c2ecf20Sopenharmony_ci 27688c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd %xmm1, %xmm2, %xmm3"); 27698c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd %ymm1, %ymm2, %ymm3"); 27708c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd %zmm1, %zmm2, %zmm3"); 27718c2ecf20Sopenharmony_ci asm volatile("vfmsub213pd 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 27728c2ecf20Sopenharmony_ci 27738c2ecf20Sopenharmony_ci asm volatile("v4fnmaddps (%eax), %zmm0, %zmm4"); 27748c2ecf20Sopenharmony_ci asm volatile("v4fnmaddps 0x12345678(%eax,%ecx,8),%zmm0,%zmm4"); 27758c2ecf20Sopenharmony_ci 27768c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 ab */ 27778c2ecf20Sopenharmony_ci 27788c2ecf20Sopenharmony_ci asm volatile("vfmsub213ss %xmm1, %xmm2, %xmm3"); 27798c2ecf20Sopenharmony_ci asm volatile("vfmsub213ss 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 27808c2ecf20Sopenharmony_ci 27818c2ecf20Sopenharmony_ci asm volatile("vfmsub213sd %xmm1, %xmm2, %xmm3"); 27828c2ecf20Sopenharmony_ci asm volatile("vfmsub213sd 0x12345678(%eax,%ecx,8),%xmm2,%xmm3"); 27838c2ecf20Sopenharmony_ci 27848c2ecf20Sopenharmony_ci asm volatile("v4fnmaddss (%eax), %xmm0, %xmm4"); 27858c2ecf20Sopenharmony_ci asm volatile("v4fnmaddss 0x12345678(%eax,%ecx,8),%xmm0,%xmm4"); 27868c2ecf20Sopenharmony_ci 27878c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 b4 */ 27888c2ecf20Sopenharmony_ci 27898c2ecf20Sopenharmony_ci asm volatile("vpmadd52luq %zmm4,%zmm5,%zmm6"); 27908c2ecf20Sopenharmony_ci 27918c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 b5 */ 27928c2ecf20Sopenharmony_ci 27938c2ecf20Sopenharmony_ci asm volatile("vpmadd52huq %zmm4,%zmm5,%zmm6"); 27948c2ecf20Sopenharmony_ci 27958c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c4 */ 27968c2ecf20Sopenharmony_ci 
27978c2ecf20Sopenharmony_ci asm volatile("vpconflictd %zmm5,%zmm6"); 27988c2ecf20Sopenharmony_ci asm volatile("vpconflictq %zmm5,%zmm6"); 27998c2ecf20Sopenharmony_ci 28008c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c8 */ 28018c2ecf20Sopenharmony_ci 28028c2ecf20Sopenharmony_ci asm volatile("vexp2ps %zmm6,%zmm7"); 28038c2ecf20Sopenharmony_ci asm volatile("vexp2pd %zmm6,%zmm7"); 28048c2ecf20Sopenharmony_ci 28058c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 ca */ 28068c2ecf20Sopenharmony_ci 28078c2ecf20Sopenharmony_ci asm volatile("vrcp28ps %zmm6,%zmm7"); 28088c2ecf20Sopenharmony_ci asm volatile("vrcp28pd %zmm6,%zmm7"); 28098c2ecf20Sopenharmony_ci 28108c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cb */ 28118c2ecf20Sopenharmony_ci 28128c2ecf20Sopenharmony_ci asm volatile("vrcp28ss %xmm5,%xmm6,%xmm7{%k7}"); 28138c2ecf20Sopenharmony_ci asm volatile("vrcp28sd %xmm5,%xmm6,%xmm7{%k7}"); 28148c2ecf20Sopenharmony_ci 28158c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cc */ 28168c2ecf20Sopenharmony_ci 28178c2ecf20Sopenharmony_ci asm volatile("vrsqrt28ps %zmm6,%zmm7"); 28188c2ecf20Sopenharmony_ci asm volatile("vrsqrt28pd %zmm6,%zmm7"); 28198c2ecf20Sopenharmony_ci 28208c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cd */ 28218c2ecf20Sopenharmony_ci 28228c2ecf20Sopenharmony_ci asm volatile("vrsqrt28ss %xmm5,%xmm6,%xmm7{%k7}"); 28238c2ecf20Sopenharmony_ci asm volatile("vrsqrt28sd %xmm5,%xmm6,%xmm7{%k7}"); 28248c2ecf20Sopenharmony_ci 28258c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 cf */ 28268c2ecf20Sopenharmony_ci 28278c2ecf20Sopenharmony_ci asm volatile("gf2p8mulb %xmm1, %xmm3"); 28288c2ecf20Sopenharmony_ci asm volatile("gf2p8mulb 0x12345678(%eax,%ecx,8),%xmm3"); 28298c2ecf20Sopenharmony_ci 28308c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb %xmm1, %xmm2, %xmm3"); 28318c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb %ymm1, %ymm2, %ymm3"); 28328c2ecf20Sopenharmony_ci asm volatile("vgf2p8mulb %zmm1, %zmm2, %zmm3"); 28338c2ecf20Sopenharmony_ci asm 
volatile("vgf2p8mulb 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 28348c2ecf20Sopenharmony_ci 28358c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 dc */ 28368c2ecf20Sopenharmony_ci 28378c2ecf20Sopenharmony_ci asm volatile("vaesenc %xmm1, %xmm2, %xmm3"); 28388c2ecf20Sopenharmony_ci asm volatile("vaesenc %ymm1, %ymm2, %ymm3"); 28398c2ecf20Sopenharmony_ci asm volatile("vaesenc %zmm1, %zmm2, %zmm3"); 28408c2ecf20Sopenharmony_ci asm volatile("vaesenc 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 28418c2ecf20Sopenharmony_ci 28428c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 dd */ 28438c2ecf20Sopenharmony_ci 28448c2ecf20Sopenharmony_ci asm volatile("vaesenclast %xmm1, %xmm2, %xmm3"); 28458c2ecf20Sopenharmony_ci asm volatile("vaesenclast %ymm1, %ymm2, %ymm3"); 28468c2ecf20Sopenharmony_ci asm volatile("vaesenclast %zmm1, %zmm2, %zmm3"); 28478c2ecf20Sopenharmony_ci asm volatile("vaesenclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 28488c2ecf20Sopenharmony_ci 28498c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 de */ 28508c2ecf20Sopenharmony_ci 28518c2ecf20Sopenharmony_ci asm volatile("vaesdec %xmm1, %xmm2, %xmm3"); 28528c2ecf20Sopenharmony_ci asm volatile("vaesdec %ymm1, %ymm2, %ymm3"); 28538c2ecf20Sopenharmony_ci asm volatile("vaesdec %zmm1, %zmm2, %zmm3"); 28548c2ecf20Sopenharmony_ci asm volatile("vaesdec 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 28558c2ecf20Sopenharmony_ci 28568c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 df */ 28578c2ecf20Sopenharmony_ci 28588c2ecf20Sopenharmony_ci asm volatile("vaesdeclast %xmm1, %xmm2, %xmm3"); 28598c2ecf20Sopenharmony_ci asm volatile("vaesdeclast %ymm1, %ymm2, %ymm3"); 28608c2ecf20Sopenharmony_ci asm volatile("vaesdeclast %zmm1, %zmm2, %zmm3"); 28618c2ecf20Sopenharmony_ci asm volatile("vaesdeclast 0x12345678(%eax,%ecx,8),%zmm2,%zmm3"); 28628c2ecf20Sopenharmony_ci 28638c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 03 */ 28648c2ecf20Sopenharmony_ci 28658c2ecf20Sopenharmony_ci asm volatile("valignd $0x12,%zmm5,%zmm6,%zmm7"); 
28668c2ecf20Sopenharmony_ci asm volatile("valignq $0x12,%zmm5,%zmm6,%zmm7"); 28678c2ecf20Sopenharmony_ci 28688c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 08 */ 28698c2ecf20Sopenharmony_ci 28708c2ecf20Sopenharmony_ci asm volatile("vroundps $0x5,%ymm6,%ymm2"); 28718c2ecf20Sopenharmony_ci asm volatile("vrndscaleps $0x12,%zmm5,%zmm6"); 28728c2ecf20Sopenharmony_ci 28738c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 09 */ 28748c2ecf20Sopenharmony_ci 28758c2ecf20Sopenharmony_ci asm volatile("vroundpd $0x5,%ymm6,%ymm2"); 28768c2ecf20Sopenharmony_ci asm volatile("vrndscalepd $0x12,%zmm5,%zmm6"); 28778c2ecf20Sopenharmony_ci 28788c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 0a */ 28798c2ecf20Sopenharmony_ci 28808c2ecf20Sopenharmony_ci asm volatile("vroundss $0x5,%xmm4,%xmm6,%xmm2"); 28818c2ecf20Sopenharmony_ci asm volatile("vrndscaless $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 28828c2ecf20Sopenharmony_ci 28838c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 0b */ 28848c2ecf20Sopenharmony_ci 28858c2ecf20Sopenharmony_ci asm volatile("vroundsd $0x5,%xmm4,%xmm6,%xmm2"); 28868c2ecf20Sopenharmony_ci asm volatile("vrndscalesd $0x12,%xmm4,%xmm5,%xmm6{%k7}"); 28878c2ecf20Sopenharmony_ci 28888c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 18 */ 28898c2ecf20Sopenharmony_ci 28908c2ecf20Sopenharmony_ci asm volatile("vinsertf128 $0x5,%xmm4,%ymm4,%ymm6"); 28918c2ecf20Sopenharmony_ci asm volatile("vinsertf32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 28928c2ecf20Sopenharmony_ci asm volatile("vinsertf64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 28938c2ecf20Sopenharmony_ci 28948c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 19 */ 28958c2ecf20Sopenharmony_ci 28968c2ecf20Sopenharmony_ci asm volatile("vextractf128 $0x5,%ymm4,%xmm4"); 28978c2ecf20Sopenharmony_ci asm volatile("vextractf32x4 $0x12,%zmm5,%xmm6{%k7}"); 28988c2ecf20Sopenharmony_ci asm volatile("vextractf64x2 $0x12,%zmm5,%xmm6{%k7}"); 28998c2ecf20Sopenharmony_ci 29008c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1a */ 29018c2ecf20Sopenharmony_ci 
29028c2ecf20Sopenharmony_ci asm volatile("vinsertf32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 29038c2ecf20Sopenharmony_ci asm volatile("vinsertf64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 29048c2ecf20Sopenharmony_ci 29058c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1b */ 29068c2ecf20Sopenharmony_ci 29078c2ecf20Sopenharmony_ci asm volatile("vextractf32x8 $0x12,%zmm6,%ymm7{%k7}"); 29088c2ecf20Sopenharmony_ci asm volatile("vextractf64x4 $0x12,%zmm6,%ymm7{%k7}"); 29098c2ecf20Sopenharmony_ci 29108c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1e */ 29118c2ecf20Sopenharmony_ci 29128c2ecf20Sopenharmony_ci asm volatile("vpcmpud $0x12,%zmm6,%zmm7,%k5"); 29138c2ecf20Sopenharmony_ci asm volatile("vpcmpuq $0x12,%zmm6,%zmm7,%k5"); 29148c2ecf20Sopenharmony_ci 29158c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 1f */ 29168c2ecf20Sopenharmony_ci 29178c2ecf20Sopenharmony_ci asm volatile("vpcmpd $0x12,%zmm6,%zmm7,%k5"); 29188c2ecf20Sopenharmony_ci asm volatile("vpcmpq $0x12,%zmm6,%zmm7,%k5"); 29198c2ecf20Sopenharmony_ci 29208c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 23 */ 29218c2ecf20Sopenharmony_ci 29228c2ecf20Sopenharmony_ci asm volatile("vshuff32x4 $0x12,%zmm5,%zmm6,%zmm7"); 29238c2ecf20Sopenharmony_ci asm volatile("vshuff64x2 $0x12,%zmm5,%zmm6,%zmm7"); 29248c2ecf20Sopenharmony_ci 29258c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 25 */ 29268c2ecf20Sopenharmony_ci 29278c2ecf20Sopenharmony_ci asm volatile("vpternlogd $0x12,%zmm5,%zmm6,%zmm7"); 29288c2ecf20Sopenharmony_ci asm volatile("vpternlogq $0x12,%zmm5,%zmm6,%zmm7"); 29298c2ecf20Sopenharmony_ci 29308c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 26 */ 29318c2ecf20Sopenharmony_ci 29328c2ecf20Sopenharmony_ci asm volatile("vgetmantps $0x12,%zmm6,%zmm7"); 29338c2ecf20Sopenharmony_ci asm volatile("vgetmantpd $0x12,%zmm6,%zmm7"); 29348c2ecf20Sopenharmony_ci 29358c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 27 */ 29368c2ecf20Sopenharmony_ci 29378c2ecf20Sopenharmony_ci asm volatile("vgetmantss 
$0x12,%xmm5,%xmm6,%xmm7{%k7}"); 29388c2ecf20Sopenharmony_ci asm volatile("vgetmantsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 29398c2ecf20Sopenharmony_ci 29408c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 38 */ 29418c2ecf20Sopenharmony_ci 29428c2ecf20Sopenharmony_ci asm volatile("vinserti128 $0x5,%xmm4,%ymm4,%ymm6"); 29438c2ecf20Sopenharmony_ci asm volatile("vinserti32x4 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 29448c2ecf20Sopenharmony_ci asm volatile("vinserti64x2 $0x12,%xmm4,%zmm5,%zmm6{%k7}"); 29458c2ecf20Sopenharmony_ci 29468c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 39 */ 29478c2ecf20Sopenharmony_ci 29488c2ecf20Sopenharmony_ci asm volatile("vextracti128 $0x5,%ymm4,%xmm6"); 29498c2ecf20Sopenharmony_ci asm volatile("vextracti32x4 $0x12,%zmm5,%xmm6{%k7}"); 29508c2ecf20Sopenharmony_ci asm volatile("vextracti64x2 $0x12,%zmm5,%xmm6{%k7}"); 29518c2ecf20Sopenharmony_ci 29528c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3a */ 29538c2ecf20Sopenharmony_ci 29548c2ecf20Sopenharmony_ci asm volatile("vinserti32x8 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 29558c2ecf20Sopenharmony_ci asm volatile("vinserti64x4 $0x12,%ymm5,%zmm6,%zmm7{%k7}"); 29568c2ecf20Sopenharmony_ci 29578c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3b */ 29588c2ecf20Sopenharmony_ci 29598c2ecf20Sopenharmony_ci asm volatile("vextracti32x8 $0x12,%zmm6,%ymm7{%k7}"); 29608c2ecf20Sopenharmony_ci asm volatile("vextracti64x4 $0x12,%zmm6,%ymm7{%k7}"); 29618c2ecf20Sopenharmony_ci 29628c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3e */ 29638c2ecf20Sopenharmony_ci 29648c2ecf20Sopenharmony_ci asm volatile("vpcmpub $0x12,%zmm6,%zmm7,%k5"); 29658c2ecf20Sopenharmony_ci asm volatile("vpcmpuw $0x12,%zmm6,%zmm7,%k5"); 29668c2ecf20Sopenharmony_ci 29678c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 3f */ 29688c2ecf20Sopenharmony_ci 29698c2ecf20Sopenharmony_ci asm volatile("vpcmpb $0x12,%zmm6,%zmm7,%k5"); 29708c2ecf20Sopenharmony_ci asm volatile("vpcmpw $0x12,%zmm6,%zmm7,%k5"); 29718c2ecf20Sopenharmony_ci 29728c2ecf20Sopenharmony_ci 
/* AVX-512: Op code 0f 3a 42 */ 29738c2ecf20Sopenharmony_ci 29748c2ecf20Sopenharmony_ci asm volatile("vmpsadbw $0x5,%ymm4,%ymm6,%ymm2"); 29758c2ecf20Sopenharmony_ci asm volatile("vdbpsadbw $0x12,%zmm4,%zmm5,%zmm6"); 29768c2ecf20Sopenharmony_ci 29778c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 43 */ 29788c2ecf20Sopenharmony_ci 29798c2ecf20Sopenharmony_ci asm volatile("vshufi32x4 $0x12,%zmm5,%zmm6,%zmm7"); 29808c2ecf20Sopenharmony_ci asm volatile("vshufi64x2 $0x12,%zmm5,%zmm6,%zmm7"); 29818c2ecf20Sopenharmony_ci 29828c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 44 */ 29838c2ecf20Sopenharmony_ci 29848c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%xmm1,%xmm2,%xmm3"); 29858c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%ymm1,%ymm2,%ymm3"); 29868c2ecf20Sopenharmony_ci asm volatile("vpclmulqdq $0x12,%zmm1,%zmm2,%zmm3"); 29878c2ecf20Sopenharmony_ci 29888c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 50 */ 29898c2ecf20Sopenharmony_ci 29908c2ecf20Sopenharmony_ci asm volatile("vrangeps $0x12,%zmm5,%zmm6,%zmm7"); 29918c2ecf20Sopenharmony_ci asm volatile("vrangepd $0x12,%zmm5,%zmm6,%zmm7"); 29928c2ecf20Sopenharmony_ci 29938c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 51 */ 29948c2ecf20Sopenharmony_ci 29958c2ecf20Sopenharmony_ci asm volatile("vrangess $0x12,%xmm5,%xmm6,%xmm7"); 29968c2ecf20Sopenharmony_ci asm volatile("vrangesd $0x12,%xmm5,%xmm6,%xmm7"); 29978c2ecf20Sopenharmony_ci 29988c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 54 */ 29998c2ecf20Sopenharmony_ci 30008c2ecf20Sopenharmony_ci asm volatile("vfixupimmps $0x12,%zmm5,%zmm6,%zmm7"); 30018c2ecf20Sopenharmony_ci asm volatile("vfixupimmpd $0x12,%zmm5,%zmm6,%zmm7"); 30028c2ecf20Sopenharmony_ci 30038c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 55 */ 30048c2ecf20Sopenharmony_ci 30058c2ecf20Sopenharmony_ci asm volatile("vfixupimmss $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 30068c2ecf20Sopenharmony_ci asm volatile("vfixupimmsd $0x12,%xmm5,%xmm6,%xmm7{%k7}"); 30078c2ecf20Sopenharmony_ci 
30088c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 56 */ 30098c2ecf20Sopenharmony_ci 30108c2ecf20Sopenharmony_ci asm volatile("vreduceps $0x12,%zmm6,%zmm7"); 30118c2ecf20Sopenharmony_ci asm volatile("vreducepd $0x12,%zmm6,%zmm7"); 30128c2ecf20Sopenharmony_ci 30138c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 57 */ 30148c2ecf20Sopenharmony_ci 30158c2ecf20Sopenharmony_ci asm volatile("vreducess $0x12,%xmm5,%xmm6,%xmm7"); 30168c2ecf20Sopenharmony_ci asm volatile("vreducesd $0x12,%xmm5,%xmm6,%xmm7"); 30178c2ecf20Sopenharmony_ci 30188c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 66 */ 30198c2ecf20Sopenharmony_ci 30208c2ecf20Sopenharmony_ci asm volatile("vfpclassps $0x12,%zmm7,%k5"); 30218c2ecf20Sopenharmony_ci asm volatile("vfpclasspd $0x12,%zmm7,%k5"); 30228c2ecf20Sopenharmony_ci 30238c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 67 */ 30248c2ecf20Sopenharmony_ci 30258c2ecf20Sopenharmony_ci asm volatile("vfpclassss $0x12,%xmm7,%k5"); 30268c2ecf20Sopenharmony_ci asm volatile("vfpclasssd $0x12,%xmm7,%k5"); 30278c2ecf20Sopenharmony_ci 30288c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 70 */ 30298c2ecf20Sopenharmony_ci 30308c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%xmm1,%xmm2,%xmm3"); 30318c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%ymm1,%ymm2,%ymm3"); 30328c2ecf20Sopenharmony_ci asm volatile("vpshldw $0x12,%zmm1,%zmm2,%zmm3"); 30338c2ecf20Sopenharmony_ci 30348c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 71 */ 30358c2ecf20Sopenharmony_ci 30368c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%xmm1,%xmm2,%xmm3"); 30378c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%ymm1,%ymm2,%ymm3"); 30388c2ecf20Sopenharmony_ci asm volatile("vpshldd $0x12,%zmm1,%zmm2,%zmm3"); 30398c2ecf20Sopenharmony_ci 30408c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%xmm1,%xmm2,%xmm3"); 30418c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%ymm1,%ymm2,%ymm3"); 30428c2ecf20Sopenharmony_ci asm volatile("vpshldq $0x12,%zmm1,%zmm2,%zmm3"); 
30438c2ecf20Sopenharmony_ci 30448c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 72 */ 30458c2ecf20Sopenharmony_ci 30468c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%xmm1,%xmm2,%xmm3"); 30478c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%ymm1,%ymm2,%ymm3"); 30488c2ecf20Sopenharmony_ci asm volatile("vpshrdw $0x12,%zmm1,%zmm2,%zmm3"); 30498c2ecf20Sopenharmony_ci 30508c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a 73 */ 30518c2ecf20Sopenharmony_ci 30528c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%xmm1,%xmm2,%xmm3"); 30538c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%ymm1,%ymm2,%ymm3"); 30548c2ecf20Sopenharmony_ci asm volatile("vpshrdd $0x12,%zmm1,%zmm2,%zmm3"); 30558c2ecf20Sopenharmony_ci 30568c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%xmm1,%xmm2,%xmm3"); 30578c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%ymm1,%ymm2,%ymm3"); 30588c2ecf20Sopenharmony_ci asm volatile("vpshrdq $0x12,%zmm1,%zmm2,%zmm3"); 30598c2ecf20Sopenharmony_ci 30608c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a ce */ 30618c2ecf20Sopenharmony_ci 30628c2ecf20Sopenharmony_ci asm volatile("gf2p8affineqb $0x12,%xmm1,%xmm3"); 30638c2ecf20Sopenharmony_ci 30648c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%xmm1,%xmm2,%xmm3"); 30658c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%ymm1,%ymm2,%ymm3"); 30668c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineqb $0x12,%zmm1,%zmm2,%zmm3"); 30678c2ecf20Sopenharmony_ci 30688c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 3a cf */ 30698c2ecf20Sopenharmony_ci 30708c2ecf20Sopenharmony_ci asm volatile("gf2p8affineinvqb $0x12,%xmm1,%xmm3"); 30718c2ecf20Sopenharmony_ci 30728c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%xmm1,%xmm2,%xmm3"); 30738c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%ymm1,%ymm2,%ymm3"); 30748c2ecf20Sopenharmony_ci asm volatile("vgf2p8affineinvqb $0x12,%zmm1,%zmm2,%zmm3"); 30758c2ecf20Sopenharmony_ci 30768c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 72 
(Grp13) */ 30778c2ecf20Sopenharmony_ci 30788c2ecf20Sopenharmony_ci asm volatile("vprord $0x12,%zmm5,%zmm6"); 30798c2ecf20Sopenharmony_ci asm volatile("vprorq $0x12,%zmm5,%zmm6"); 30808c2ecf20Sopenharmony_ci asm volatile("vprold $0x12,%zmm5,%zmm6"); 30818c2ecf20Sopenharmony_ci asm volatile("vprolq $0x12,%zmm5,%zmm6"); 30828c2ecf20Sopenharmony_ci asm volatile("psrad $0x2,%mm6"); 30838c2ecf20Sopenharmony_ci asm volatile("vpsrad $0x5,%ymm6,%ymm2"); 30848c2ecf20Sopenharmony_ci asm volatile("vpsrad $0x5,%zmm6,%zmm2"); 30858c2ecf20Sopenharmony_ci asm volatile("vpsraq $0x5,%zmm6,%zmm2"); 30868c2ecf20Sopenharmony_ci 30878c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c6 (Grp18) */ 30888c2ecf20Sopenharmony_ci 30898c2ecf20Sopenharmony_ci asm volatile("vgatherpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 30908c2ecf20Sopenharmony_ci asm volatile("vgatherpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 30918c2ecf20Sopenharmony_ci asm volatile("vgatherpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 30928c2ecf20Sopenharmony_ci asm volatile("vgatherpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 30938c2ecf20Sopenharmony_ci asm volatile("vscatterpf0dps 0x7b(%ebp,%zmm7,8){%k1}"); 30948c2ecf20Sopenharmony_ci asm volatile("vscatterpf0dpd 0x7b(%ebp,%ymm7,8){%k1}"); 30958c2ecf20Sopenharmony_ci asm volatile("vscatterpf1dps 0x7b(%ebp,%zmm7,8){%k1}"); 30968c2ecf20Sopenharmony_ci asm volatile("vscatterpf1dpd 0x7b(%ebp,%ymm7,8){%k1}"); 30978c2ecf20Sopenharmony_ci 30988c2ecf20Sopenharmony_ci /* AVX-512: Op code 0f 38 c7 (Grp19) */ 30998c2ecf20Sopenharmony_ci 31008c2ecf20Sopenharmony_ci asm volatile("vgatherpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 31018c2ecf20Sopenharmony_ci asm volatile("vgatherpf0qpd 0x7b(%ebp,%zmm7,8){%k1}"); 31028c2ecf20Sopenharmony_ci asm volatile("vgatherpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 31038c2ecf20Sopenharmony_ci asm volatile("vgatherpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 31048c2ecf20Sopenharmony_ci asm volatile("vscatterpf0qps 0x7b(%ebp,%zmm7,8){%k1}"); 31058c2ecf20Sopenharmony_ci asm volatile("vscatterpf0qpd 
0x7b(%ebp,%zmm7,8){%k1}"); 31068c2ecf20Sopenharmony_ci asm volatile("vscatterpf1qps 0x7b(%ebp,%zmm7,8){%k1}"); 31078c2ecf20Sopenharmony_ci asm volatile("vscatterpf1qpd 0x7b(%ebp,%zmm7,8){%k1}"); 31088c2ecf20Sopenharmony_ci 31098c2ecf20Sopenharmony_ci /* AVX-512: Examples */ 31108c2ecf20Sopenharmony_ci 31118c2ecf20Sopenharmony_ci asm volatile("vaddpd %zmm4,%zmm5,%zmm6"); 31128c2ecf20Sopenharmony_ci asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}"); 31138c2ecf20Sopenharmony_ci asm volatile("vaddpd %zmm4,%zmm5,%zmm6{%k7}{z}"); 31148c2ecf20Sopenharmony_ci asm volatile("vaddpd {rn-sae},%zmm4,%zmm5,%zmm6"); 31158c2ecf20Sopenharmony_ci asm volatile("vaddpd {ru-sae},%zmm4,%zmm5,%zmm6"); 31168c2ecf20Sopenharmony_ci asm volatile("vaddpd {rd-sae},%zmm4,%zmm5,%zmm6"); 31178c2ecf20Sopenharmony_ci asm volatile("vaddpd {rz-sae},%zmm4,%zmm5,%zmm6"); 31188c2ecf20Sopenharmony_ci asm volatile("vaddpd (%ecx),%zmm5,%zmm6"); 31198c2ecf20Sopenharmony_ci asm volatile("vaddpd 0x123(%eax,%ecx,8),%zmm5,%zmm6"); 31208c2ecf20Sopenharmony_ci asm volatile("vaddpd (%ecx){1to8},%zmm5,%zmm6"); 31218c2ecf20Sopenharmony_ci asm volatile("vaddpd 0x1fc0(%edx),%zmm5,%zmm6"); 31228c2ecf20Sopenharmony_ci asm volatile("vaddpd 0x3f8(%edx){1to8},%zmm5,%zmm6"); 31238c2ecf20Sopenharmony_ci asm volatile("vcmpeq_uqps 0x1fc(%edx){1to16},%zmm6,%k5"); 31248c2ecf20Sopenharmony_ci asm volatile("vcmpltsd 0x123(%eax,%ecx,8),%xmm3,%k5{%k7}"); 31258c2ecf20Sopenharmony_ci asm volatile("vcmplesd {sae},%xmm4,%xmm5,%k5{%k7}"); 31268c2ecf20Sopenharmony_ci asm volatile("vgetmantss $0x5b,0x123(%eax,%ecx,8),%xmm4,%xmm5{%k7}"); 31278c2ecf20Sopenharmony_ci 31288c2ecf20Sopenharmony_ci /* bndmk m32, bnd */ 31298c2ecf20Sopenharmony_ci 31308c2ecf20Sopenharmony_ci asm volatile("bndmk (%eax), %bnd0"); 31318c2ecf20Sopenharmony_ci asm volatile("bndmk (0x12345678), %bnd0"); 31328c2ecf20Sopenharmony_ci asm volatile("bndmk (%eax), %bnd3"); 31338c2ecf20Sopenharmony_ci asm volatile("bndmk (%ecx,%eax,1), %bnd0"); 31348c2ecf20Sopenharmony_ci asm 
volatile("bndmk 0x12345678(,%eax,1), %bnd0"); 31358c2ecf20Sopenharmony_ci asm volatile("bndmk (%eax,%ecx,1), %bnd0"); 31368c2ecf20Sopenharmony_ci asm volatile("bndmk (%eax,%ecx,8), %bnd0"); 31378c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%eax), %bnd0"); 31388c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%ebp), %bnd0"); 31398c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%ecx,%eax,1), %bnd0"); 31408c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%ebp,%eax,1), %bnd0"); 31418c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%eax,%ecx,1), %bnd0"); 31428c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12(%eax,%ecx,8), %bnd0"); 31438c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%eax), %bnd0"); 31448c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%ebp), %bnd0"); 31458c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%ecx,%eax,1), %bnd0"); 31468c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%ebp,%eax,1), %bnd0"); 31478c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%eax,%ecx,1), %bnd0"); 31488c2ecf20Sopenharmony_ci asm volatile("bndmk 0x12345678(%eax,%ecx,8), %bnd0"); 31498c2ecf20Sopenharmony_ci 31508c2ecf20Sopenharmony_ci /* bndcl r/m32, bnd */ 31518c2ecf20Sopenharmony_ci 31528c2ecf20Sopenharmony_ci asm volatile("bndcl (%eax), %bnd0"); 31538c2ecf20Sopenharmony_ci asm volatile("bndcl (0x12345678), %bnd0"); 31548c2ecf20Sopenharmony_ci asm volatile("bndcl (%eax), %bnd3"); 31558c2ecf20Sopenharmony_ci asm volatile("bndcl (%ecx,%eax,1), %bnd0"); 31568c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(,%eax,1), %bnd0"); 31578c2ecf20Sopenharmony_ci asm volatile("bndcl (%eax,%ecx,1), %bnd0"); 31588c2ecf20Sopenharmony_ci asm volatile("bndcl (%eax,%ecx,8), %bnd0"); 31598c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%eax), %bnd0"); 31608c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%ebp), %bnd0"); 31618c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%ecx,%eax,1), %bnd0"); 31628c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%ebp,%eax,1), 
%bnd0"); 31638c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%eax,%ecx,1), %bnd0"); 31648c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12(%eax,%ecx,8), %bnd0"); 31658c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%eax), %bnd0"); 31668c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%ebp), %bnd0"); 31678c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%ecx,%eax,1), %bnd0"); 31688c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%ebp,%eax,1), %bnd0"); 31698c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%eax,%ecx,1), %bnd0"); 31708c2ecf20Sopenharmony_ci asm volatile("bndcl 0x12345678(%eax,%ecx,8), %bnd0"); 31718c2ecf20Sopenharmony_ci asm volatile("bndcl %eax, %bnd0"); 31728c2ecf20Sopenharmony_ci 31738c2ecf20Sopenharmony_ci /* bndcu r/m32, bnd */ 31748c2ecf20Sopenharmony_ci 31758c2ecf20Sopenharmony_ci asm volatile("bndcu (%eax), %bnd0"); 31768c2ecf20Sopenharmony_ci asm volatile("bndcu (0x12345678), %bnd0"); 31778c2ecf20Sopenharmony_ci asm volatile("bndcu (%eax), %bnd3"); 31788c2ecf20Sopenharmony_ci asm volatile("bndcu (%ecx,%eax,1), %bnd0"); 31798c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(,%eax,1), %bnd0"); 31808c2ecf20Sopenharmony_ci asm volatile("bndcu (%eax,%ecx,1), %bnd0"); 31818c2ecf20Sopenharmony_ci asm volatile("bndcu (%eax,%ecx,8), %bnd0"); 31828c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%eax), %bnd0"); 31838c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%ebp), %bnd0"); 31848c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%ecx,%eax,1), %bnd0"); 31858c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%ebp,%eax,1), %bnd0"); 31868c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%eax,%ecx,1), %bnd0"); 31878c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12(%eax,%ecx,8), %bnd0"); 31888c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%eax), %bnd0"); 31898c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%ebp), %bnd0"); 31908c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%ecx,%eax,1), %bnd0"); 
31918c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%ebp,%eax,1), %bnd0"); 31928c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%eax,%ecx,1), %bnd0"); 31938c2ecf20Sopenharmony_ci asm volatile("bndcu 0x12345678(%eax,%ecx,8), %bnd0"); 31948c2ecf20Sopenharmony_ci asm volatile("bndcu %eax, %bnd0"); 31958c2ecf20Sopenharmony_ci 31968c2ecf20Sopenharmony_ci /* bndcn r/m32, bnd */ 31978c2ecf20Sopenharmony_ci 31988c2ecf20Sopenharmony_ci asm volatile("bndcn (%eax), %bnd0"); 31998c2ecf20Sopenharmony_ci asm volatile("bndcn (0x12345678), %bnd0"); 32008c2ecf20Sopenharmony_ci asm volatile("bndcn (%eax), %bnd3"); 32018c2ecf20Sopenharmony_ci asm volatile("bndcn (%ecx,%eax,1), %bnd0"); 32028c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(,%eax,1), %bnd0"); 32038c2ecf20Sopenharmony_ci asm volatile("bndcn (%eax,%ecx,1), %bnd0"); 32048c2ecf20Sopenharmony_ci asm volatile("bndcn (%eax,%ecx,8), %bnd0"); 32058c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%eax), %bnd0"); 32068c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%ebp), %bnd0"); 32078c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%ecx,%eax,1), %bnd0"); 32088c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%ebp,%eax,1), %bnd0"); 32098c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%eax,%ecx,1), %bnd0"); 32108c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12(%eax,%ecx,8), %bnd0"); 32118c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%eax), %bnd0"); 32128c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%ebp), %bnd0"); 32138c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%ecx,%eax,1), %bnd0"); 32148c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%ebp,%eax,1), %bnd0"); 32158c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%eax,%ecx,1), %bnd0"); 32168c2ecf20Sopenharmony_ci asm volatile("bndcn 0x12345678(%eax,%ecx,8), %bnd0"); 32178c2ecf20Sopenharmony_ci asm volatile("bndcn %eax, %bnd0"); 32188c2ecf20Sopenharmony_ci 32198c2ecf20Sopenharmony_ci /* bndmov m64, bnd */ 32208c2ecf20Sopenharmony_ci 
32218c2ecf20Sopenharmony_ci asm volatile("bndmov (%eax), %bnd0"); 32228c2ecf20Sopenharmony_ci asm volatile("bndmov (0x12345678), %bnd0"); 32238c2ecf20Sopenharmony_ci asm volatile("bndmov (%eax), %bnd3"); 32248c2ecf20Sopenharmony_ci asm volatile("bndmov (%ecx,%eax,1), %bnd0"); 32258c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(,%eax,1), %bnd0"); 32268c2ecf20Sopenharmony_ci asm volatile("bndmov (%eax,%ecx,1), %bnd0"); 32278c2ecf20Sopenharmony_ci asm volatile("bndmov (%eax,%ecx,8), %bnd0"); 32288c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%eax), %bnd0"); 32298c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%ebp), %bnd0"); 32308c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%ecx,%eax,1), %bnd0"); 32318c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%ebp,%eax,1), %bnd0"); 32328c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%eax,%ecx,1), %bnd0"); 32338c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12(%eax,%ecx,8), %bnd0"); 32348c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%eax), %bnd0"); 32358c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%ebp), %bnd0"); 32368c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%ecx,%eax,1), %bnd0"); 32378c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%ebp,%eax,1), %bnd0"); 32388c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%eax,%ecx,1), %bnd0"); 32398c2ecf20Sopenharmony_ci asm volatile("bndmov 0x12345678(%eax,%ecx,8), %bnd0"); 32408c2ecf20Sopenharmony_ci 32418c2ecf20Sopenharmony_ci /* bndmov bnd, m64 */ 32428c2ecf20Sopenharmony_ci 32438c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%eax)"); 32448c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (0x12345678)"); 32458c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd3, (%eax)"); 32468c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%ecx,%eax,1)"); 32478c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(,%eax,1)"); 32488c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, (%eax,%ecx,1)"); 32498c2ecf20Sopenharmony_ci 
asm volatile("bndmov %bnd0, (%eax,%ecx,8)"); 32508c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%eax)"); 32518c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%ebp)"); 32528c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%ecx,%eax,1)"); 32538c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%ebp,%eax,1)"); 32548c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,1)"); 32558c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12(%eax,%ecx,8)"); 32568c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%eax)"); 32578c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%ebp)"); 32588c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%ecx,%eax,1)"); 32598c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%ebp,%eax,1)"); 32608c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,1)"); 32618c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, 0x12345678(%eax,%ecx,8)"); 32628c2ecf20Sopenharmony_ci 32638c2ecf20Sopenharmony_ci /* bndmov bnd2, bnd1 */ 32648c2ecf20Sopenharmony_ci 32658c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd0, %bnd1"); 32668c2ecf20Sopenharmony_ci asm volatile("bndmov %bnd1, %bnd0"); 32678c2ecf20Sopenharmony_ci 32688c2ecf20Sopenharmony_ci /* bndldx mib, bnd */ 32698c2ecf20Sopenharmony_ci 32708c2ecf20Sopenharmony_ci asm volatile("bndldx (%eax), %bnd0"); 32718c2ecf20Sopenharmony_ci asm volatile("bndldx (0x12345678), %bnd0"); 32728c2ecf20Sopenharmony_ci asm volatile("bndldx (%eax), %bnd3"); 32738c2ecf20Sopenharmony_ci asm volatile("bndldx (%ecx,%eax,1), %bnd0"); 32748c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(,%eax,1), %bnd0"); 32758c2ecf20Sopenharmony_ci asm volatile("bndldx (%eax,%ecx,1), %bnd0"); 32768c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%eax), %bnd0"); 32778c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%ebp), %bnd0"); 32788c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%ecx,%eax,1), %bnd0"); 32798c2ecf20Sopenharmony_ci asm 
volatile("bndldx 0x12(%ebp,%eax,1), %bnd0"); 32808c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12(%eax,%ecx,1), %bnd0"); 32818c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%eax), %bnd0"); 32828c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%ebp), %bnd0"); 32838c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%ecx,%eax,1), %bnd0"); 32848c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%ebp,%eax,1), %bnd0"); 32858c2ecf20Sopenharmony_ci asm volatile("bndldx 0x12345678(%eax,%ecx,1), %bnd0"); 32868c2ecf20Sopenharmony_ci 32878c2ecf20Sopenharmony_ci /* bndstx bnd, mib */ 32888c2ecf20Sopenharmony_ci 32898c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%eax)"); 32908c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (0x12345678)"); 32918c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd3, (%eax)"); 32928c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%ecx,%eax,1)"); 32938c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(,%eax,1)"); 32948c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, (%eax,%ecx,1)"); 32958c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%eax)"); 32968c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%ebp)"); 32978c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%ecx,%eax,1)"); 32988c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%ebp,%eax,1)"); 32998c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12(%eax,%ecx,1)"); 33008c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%eax)"); 33018c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%ebp)"); 33028c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%ecx,%eax,1)"); 33038c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%ebp,%eax,1)"); 33048c2ecf20Sopenharmony_ci asm volatile("bndstx %bnd0, 0x12345678(%eax,%ecx,1)"); 33058c2ecf20Sopenharmony_ci 33068c2ecf20Sopenharmony_ci /* bnd prefix on call, ret, jmp and all jcc */ 33078c2ecf20Sopenharmony_ci 33088c2ecf20Sopenharmony_ci asm 
volatile("bnd call label1"); /* Expecting: call unconditional 0xfffffffc */ 33098c2ecf20Sopenharmony_ci asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 33108c2ecf20Sopenharmony_ci asm volatile("bnd ret"); /* Expecting: ret indirect 0 */ 33118c2ecf20Sopenharmony_ci asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 33128c2ecf20Sopenharmony_ci asm volatile("bnd jmp label1"); /* Expecting: jmp unconditional 0xfffffffc */ 33138c2ecf20Sopenharmony_ci asm volatile("bnd jmp *(%ecx)"); /* Expecting: jmp indirect 0 */ 33148c2ecf20Sopenharmony_ci asm volatile("bnd jne label1"); /* Expecting: jcc conditional 0xfffffffc */ 33158c2ecf20Sopenharmony_ci 33168c2ecf20Sopenharmony_ci /* sha1rnds4 imm8, xmm2/m128, xmm1 */ 33178c2ecf20Sopenharmony_ci 33188c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x0, %xmm1, %xmm0"); 33198c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, %xmm7, %xmm2"); 33208c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%eax), %xmm0"); 33218c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (0x12345678), %xmm0"); 33228c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%eax), %xmm3"); 33238c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%ecx,%eax,1), %xmm0"); 33248c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(,%eax,1), %xmm0"); 33258c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%eax,%ecx,1), %xmm0"); 33268c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, (%eax,%ecx,8), %xmm0"); 33278c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%eax), %xmm0"); 33288c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%ebp), %xmm0"); 33298c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%ecx,%eax,1), %xmm0"); 33308c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%ebp,%eax,1), %xmm0"); 33318c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12(%eax,%ecx,1), %xmm0"); 33328c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 
0x12(%eax,%ecx,8), %xmm0"); 33338c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%eax), %xmm0"); 33348c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp), %xmm0"); 33358c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%ecx,%eax,1), %xmm0"); 33368c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%ebp,%eax,1), %xmm0"); 33378c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,1), %xmm0"); 33388c2ecf20Sopenharmony_ci asm volatile("sha1rnds4 $0x91, 0x12345678(%eax,%ecx,8), %xmm0"); 33398c2ecf20Sopenharmony_ci 33408c2ecf20Sopenharmony_ci /* sha1nexte xmm2/m128, xmm1 */ 33418c2ecf20Sopenharmony_ci 33428c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm1, %xmm0"); 33438c2ecf20Sopenharmony_ci asm volatile("sha1nexte %xmm7, %xmm2"); 33448c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%eax), %xmm0"); 33458c2ecf20Sopenharmony_ci asm volatile("sha1nexte (0x12345678), %xmm0"); 33468c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%eax), %xmm3"); 33478c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%ecx,%eax,1), %xmm0"); 33488c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(,%eax,1), %xmm0"); 33498c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%eax,%ecx,1), %xmm0"); 33508c2ecf20Sopenharmony_ci asm volatile("sha1nexte (%eax,%ecx,8), %xmm0"); 33518c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%eax), %xmm0"); 33528c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%ebp), %xmm0"); 33538c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%ecx,%eax,1), %xmm0"); 33548c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%ebp,%eax,1), %xmm0"); 33558c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%eax,%ecx,1), %xmm0"); 33568c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12(%eax,%ecx,8), %xmm0"); 33578c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%eax), %xmm0"); 33588c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%ebp), %xmm0"); 33598c2ecf20Sopenharmony_ci 
asm volatile("sha1nexte 0x12345678(%ecx,%eax,1), %xmm0"); 33608c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%ebp,%eax,1), %xmm0"); 33618c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%eax,%ecx,1), %xmm0"); 33628c2ecf20Sopenharmony_ci asm volatile("sha1nexte 0x12345678(%eax,%ecx,8), %xmm0"); 33638c2ecf20Sopenharmony_ci 33648c2ecf20Sopenharmony_ci /* sha1msg1 xmm2/m128, xmm1 */ 33658c2ecf20Sopenharmony_ci 33668c2ecf20Sopenharmony_ci asm volatile("sha1msg1 %xmm1, %xmm0"); 33678c2ecf20Sopenharmony_ci asm volatile("sha1msg1 %xmm7, %xmm2"); 33688c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%eax), %xmm0"); 33698c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (0x12345678), %xmm0"); 33708c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%eax), %xmm3"); 33718c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%ecx,%eax,1), %xmm0"); 33728c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(,%eax,1), %xmm0"); 33738c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%eax,%ecx,1), %xmm0"); 33748c2ecf20Sopenharmony_ci asm volatile("sha1msg1 (%eax,%ecx,8), %xmm0"); 33758c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%eax), %xmm0"); 33768c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%ebp), %xmm0"); 33778c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%ecx,%eax,1), %xmm0"); 33788c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%ebp,%eax,1), %xmm0"); 33798c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%eax,%ecx,1), %xmm0"); 33808c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12(%eax,%ecx,8), %xmm0"); 33818c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%eax), %xmm0"); 33828c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%ebp), %xmm0"); 33838c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%ecx,%eax,1), %xmm0"); 33848c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%ebp,%eax,1), %xmm0"); 33858c2ecf20Sopenharmony_ci asm volatile("sha1msg1 0x12345678(%eax,%ecx,1), %xmm0"); 33868c2ecf20Sopenharmony_ci asm 
volatile("sha1msg1 0x12345678(%eax,%ecx,8), %xmm0"); 33878c2ecf20Sopenharmony_ci 33888c2ecf20Sopenharmony_ci /* sha1msg2 xmm2/m128, xmm1 */ 33898c2ecf20Sopenharmony_ci 33908c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm1, %xmm0"); 33918c2ecf20Sopenharmony_ci asm volatile("sha1msg2 %xmm7, %xmm2"); 33928c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%eax), %xmm0"); 33938c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (0x12345678), %xmm0"); 33948c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%eax), %xmm3"); 33958c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%ecx,%eax,1), %xmm0"); 33968c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(,%eax,1), %xmm0"); 33978c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%eax,%ecx,1), %xmm0"); 33988c2ecf20Sopenharmony_ci asm volatile("sha1msg2 (%eax,%ecx,8), %xmm0"); 33998c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%eax), %xmm0"); 34008c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%ebp), %xmm0"); 34018c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%ecx,%eax,1), %xmm0"); 34028c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%ebp,%eax,1), %xmm0"); 34038c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%eax,%ecx,1), %xmm0"); 34048c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12(%eax,%ecx,8), %xmm0"); 34058c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%eax), %xmm0"); 34068c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%ebp), %xmm0"); 34078c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%ecx,%eax,1), %xmm0"); 34088c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%ebp,%eax,1), %xmm0"); 34098c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%eax,%ecx,1), %xmm0"); 34108c2ecf20Sopenharmony_ci asm volatile("sha1msg2 0x12345678(%eax,%ecx,8), %xmm0"); 34118c2ecf20Sopenharmony_ci 34128c2ecf20Sopenharmony_ci /* sha256rnds2 <XMM0>, xmm2/m128, xmm1 */ 34138c2ecf20Sopenharmony_ci /* Note sha256rnds2 has an implicit operand 'xmm0' */ 34148c2ecf20Sopenharmony_ci 
34158c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm4, %xmm1"); 34168c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 %xmm7, %xmm2"); 34178c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%eax), %xmm1"); 34188c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (0x12345678), %xmm1"); 34198c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%eax), %xmm3"); 34208c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%ecx,%eax,1), %xmm1"); 34218c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(,%eax,1), %xmm1"); 34228c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%eax,%ecx,1), %xmm1"); 34238c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 (%eax,%ecx,8), %xmm1"); 34248c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%eax), %xmm1"); 34258c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%ebp), %xmm1"); 34268c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%ecx,%eax,1), %xmm1"); 34278c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%ebp,%eax,1), %xmm1"); 34288c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%eax,%ecx,1), %xmm1"); 34298c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12(%eax,%ecx,8), %xmm1"); 34308c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%eax), %xmm1"); 34318c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%ebp), %xmm1"); 34328c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%ecx,%eax,1), %xmm1"); 34338c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%ebp,%eax,1), %xmm1"); 34348c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%eax,%ecx,1), %xmm1"); 34358c2ecf20Sopenharmony_ci asm volatile("sha256rnds2 0x12345678(%eax,%ecx,8), %xmm1"); 34368c2ecf20Sopenharmony_ci 34378c2ecf20Sopenharmony_ci /* sha256msg1 xmm2/m128, xmm1 */ 34388c2ecf20Sopenharmony_ci 34398c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm1, %xmm0"); 34408c2ecf20Sopenharmony_ci asm volatile("sha256msg1 %xmm7, %xmm2"); 34418c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%eax), %xmm0"); 
34428c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (0x12345678), %xmm0"); 34438c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%eax), %xmm3"); 34448c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%ecx,%eax,1), %xmm0"); 34458c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(,%eax,1), %xmm0"); 34468c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%eax,%ecx,1), %xmm0"); 34478c2ecf20Sopenharmony_ci asm volatile("sha256msg1 (%eax,%ecx,8), %xmm0"); 34488c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%eax), %xmm0"); 34498c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%ebp), %xmm0"); 34508c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%ecx,%eax,1), %xmm0"); 34518c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%ebp,%eax,1), %xmm0"); 34528c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%eax,%ecx,1), %xmm0"); 34538c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12(%eax,%ecx,8), %xmm0"); 34548c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%eax), %xmm0"); 34558c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%ebp), %xmm0"); 34568c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%ecx,%eax,1), %xmm0"); 34578c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%ebp,%eax,1), %xmm0"); 34588c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%eax,%ecx,1), %xmm0"); 34598c2ecf20Sopenharmony_ci asm volatile("sha256msg1 0x12345678(%eax,%ecx,8), %xmm0"); 34608c2ecf20Sopenharmony_ci 34618c2ecf20Sopenharmony_ci /* sha256msg2 xmm2/m128, xmm1 */ 34628c2ecf20Sopenharmony_ci 34638c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm1, %xmm0"); 34648c2ecf20Sopenharmony_ci asm volatile("sha256msg2 %xmm7, %xmm2"); 34658c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%eax), %xmm0"); 34668c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (0x12345678), %xmm0"); 34678c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%eax), %xmm3"); 34688c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%ecx,%eax,1), %xmm0"); 
34698c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(,%eax,1), %xmm0"); 34708c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%eax,%ecx,1), %xmm0"); 34718c2ecf20Sopenharmony_ci asm volatile("sha256msg2 (%eax,%ecx,8), %xmm0"); 34728c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%eax), %xmm0"); 34738c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%ebp), %xmm0"); 34748c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%ecx,%eax,1), %xmm0"); 34758c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%ebp,%eax,1), %xmm0"); 34768c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%eax,%ecx,1), %xmm0"); 34778c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12(%eax,%ecx,8), %xmm0"); 34788c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%eax), %xmm0"); 34798c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%ebp), %xmm0"); 34808c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%ecx,%eax,1), %xmm0"); 34818c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%ebp,%eax,1), %xmm0"); 34828c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%eax,%ecx,1), %xmm0"); 34838c2ecf20Sopenharmony_ci asm volatile("sha256msg2 0x12345678(%eax,%ecx,8), %xmm0"); 34848c2ecf20Sopenharmony_ci 34858c2ecf20Sopenharmony_ci /* clflushopt m8 */ 34868c2ecf20Sopenharmony_ci 34878c2ecf20Sopenharmony_ci asm volatile("clflushopt (%eax)"); 34888c2ecf20Sopenharmony_ci asm volatile("clflushopt (0x12345678)"); 34898c2ecf20Sopenharmony_ci asm volatile("clflushopt 0x12345678(%eax,%ecx,8)"); 34908c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as clflushopt */ 34918c2ecf20Sopenharmony_ci asm volatile("clflush (%eax)"); 34928c2ecf20Sopenharmony_ci asm volatile("sfence"); 34938c2ecf20Sopenharmony_ci 34948c2ecf20Sopenharmony_ci /* clwb m8 */ 34958c2ecf20Sopenharmony_ci 34968c2ecf20Sopenharmony_ci asm volatile("clwb (%eax)"); 34978c2ecf20Sopenharmony_ci asm volatile("clwb (0x12345678)"); 34988c2ecf20Sopenharmony_ci asm 
volatile("clwb 0x12345678(%eax,%ecx,8)"); 34998c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as clwb */ 35008c2ecf20Sopenharmony_ci asm volatile("xsaveopt (%eax)"); 35018c2ecf20Sopenharmony_ci asm volatile("mfence"); 35028c2ecf20Sopenharmony_ci 35038c2ecf20Sopenharmony_ci /* cldemote m8 */ 35048c2ecf20Sopenharmony_ci 35058c2ecf20Sopenharmony_ci asm volatile("cldemote (%eax)"); 35068c2ecf20Sopenharmony_ci asm volatile("cldemote (0x12345678)"); 35078c2ecf20Sopenharmony_ci asm volatile("cldemote 0x12345678(%eax,%ecx,8)"); 35088c2ecf20Sopenharmony_ci 35098c2ecf20Sopenharmony_ci /* xsavec mem */ 35108c2ecf20Sopenharmony_ci 35118c2ecf20Sopenharmony_ci asm volatile("xsavec (%eax)"); 35128c2ecf20Sopenharmony_ci asm volatile("xsavec (0x12345678)"); 35138c2ecf20Sopenharmony_ci asm volatile("xsavec 0x12345678(%eax,%ecx,8)"); 35148c2ecf20Sopenharmony_ci 35158c2ecf20Sopenharmony_ci /* xsaves mem */ 35168c2ecf20Sopenharmony_ci 35178c2ecf20Sopenharmony_ci asm volatile("xsaves (%eax)"); 35188c2ecf20Sopenharmony_ci asm volatile("xsaves (0x12345678)"); 35198c2ecf20Sopenharmony_ci asm volatile("xsaves 0x12345678(%eax,%ecx,8)"); 35208c2ecf20Sopenharmony_ci 35218c2ecf20Sopenharmony_ci /* xrstors mem */ 35228c2ecf20Sopenharmony_ci 35238c2ecf20Sopenharmony_ci asm volatile("xrstors (%eax)"); 35248c2ecf20Sopenharmony_ci asm volatile("xrstors (0x12345678)"); 35258c2ecf20Sopenharmony_ci asm volatile("xrstors 0x12345678(%eax,%ecx,8)"); 35268c2ecf20Sopenharmony_ci 35278c2ecf20Sopenharmony_ci /* ptwrite */ 35288c2ecf20Sopenharmony_ci 35298c2ecf20Sopenharmony_ci asm volatile("ptwrite (%eax)"); 35308c2ecf20Sopenharmony_ci asm volatile("ptwrite (0x12345678)"); 35318c2ecf20Sopenharmony_ci asm volatile("ptwrite 0x12345678(%eax,%ecx,8)"); 35328c2ecf20Sopenharmony_ci 35338c2ecf20Sopenharmony_ci asm volatile("ptwritel (%eax)"); 35348c2ecf20Sopenharmony_ci asm volatile("ptwritel (0x12345678)"); 35358c2ecf20Sopenharmony_ci asm volatile("ptwritel 0x12345678(%eax,%ecx,8)"); 
35368c2ecf20Sopenharmony_ci 35378c2ecf20Sopenharmony_ci /* tpause */ 35388c2ecf20Sopenharmony_ci 35398c2ecf20Sopenharmony_ci asm volatile("tpause %ebx"); 35408c2ecf20Sopenharmony_ci 35418c2ecf20Sopenharmony_ci /* umonitor */ 35428c2ecf20Sopenharmony_ci 35438c2ecf20Sopenharmony_ci asm volatile("umonitor %ax"); 35448c2ecf20Sopenharmony_ci asm volatile("umonitor %eax"); 35458c2ecf20Sopenharmony_ci 35468c2ecf20Sopenharmony_ci /* umwait */ 35478c2ecf20Sopenharmony_ci 35488c2ecf20Sopenharmony_ci asm volatile("umwait %eax"); 35498c2ecf20Sopenharmony_ci 35508c2ecf20Sopenharmony_ci /* movdiri */ 35518c2ecf20Sopenharmony_ci 35528c2ecf20Sopenharmony_ci asm volatile("movdiri %eax,(%ebx)"); 35538c2ecf20Sopenharmony_ci asm volatile("movdiri %ecx,0x12345678(%eax)"); 35548c2ecf20Sopenharmony_ci 35558c2ecf20Sopenharmony_ci /* movdir64b */ 35568c2ecf20Sopenharmony_ci 35578c2ecf20Sopenharmony_ci asm volatile("movdir64b (%eax),%ebx"); 35588c2ecf20Sopenharmony_ci asm volatile("movdir64b 0x12345678(%eax),%ecx"); 35598c2ecf20Sopenharmony_ci asm volatile("movdir64b (%si),%bx"); 35608c2ecf20Sopenharmony_ci asm volatile("movdir64b 0x1234(%si),%cx"); 35618c2ecf20Sopenharmony_ci 35628c2ecf20Sopenharmony_ci /* enqcmd */ 35638c2ecf20Sopenharmony_ci 35648c2ecf20Sopenharmony_ci asm volatile("enqcmd (%eax),%ebx"); 35658c2ecf20Sopenharmony_ci asm volatile("enqcmd 0x12345678(%eax),%ecx"); 35668c2ecf20Sopenharmony_ci asm volatile("enqcmd (%si),%bx"); 35678c2ecf20Sopenharmony_ci asm volatile("enqcmd 0x1234(%si),%cx"); 35688c2ecf20Sopenharmony_ci 35698c2ecf20Sopenharmony_ci /* enqcmds */ 35708c2ecf20Sopenharmony_ci 35718c2ecf20Sopenharmony_ci asm volatile("enqcmds (%eax),%ebx"); 35728c2ecf20Sopenharmony_ci asm volatile("enqcmds 0x12345678(%eax),%ecx"); 35738c2ecf20Sopenharmony_ci asm volatile("enqcmds (%si),%bx"); 35748c2ecf20Sopenharmony_ci asm volatile("enqcmds 0x1234(%si),%cx"); 35758c2ecf20Sopenharmony_ci 35768c2ecf20Sopenharmony_ci /* incsspd */ 35778c2ecf20Sopenharmony_ci 
35788c2ecf20Sopenharmony_ci asm volatile("incsspd %eax"); 35798c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as incsspd */ 35808c2ecf20Sopenharmony_ci asm volatile("xrstor (%eax)"); 35818c2ecf20Sopenharmony_ci asm volatile("xrstor (0x12345678)"); 35828c2ecf20Sopenharmony_ci asm volatile("xrstor 0x12345678(%eax,%ecx,8)"); 35838c2ecf20Sopenharmony_ci asm volatile("lfence"); 35848c2ecf20Sopenharmony_ci 35858c2ecf20Sopenharmony_ci /* rdsspd */ 35868c2ecf20Sopenharmony_ci 35878c2ecf20Sopenharmony_ci asm volatile("rdsspd %eax"); 35888c2ecf20Sopenharmony_ci 35898c2ecf20Sopenharmony_ci /* saveprevssp */ 35908c2ecf20Sopenharmony_ci 35918c2ecf20Sopenharmony_ci asm volatile("saveprevssp"); 35928c2ecf20Sopenharmony_ci 35938c2ecf20Sopenharmony_ci /* rstorssp */ 35948c2ecf20Sopenharmony_ci 35958c2ecf20Sopenharmony_ci asm volatile("rstorssp (%eax)"); 35968c2ecf20Sopenharmony_ci asm volatile("rstorssp (0x12345678)"); 35978c2ecf20Sopenharmony_ci asm volatile("rstorssp 0x12345678(%eax,%ecx,8)"); 35988c2ecf20Sopenharmony_ci 35998c2ecf20Sopenharmony_ci /* wrssd */ 36008c2ecf20Sopenharmony_ci 36018c2ecf20Sopenharmony_ci asm volatile("wrssd %ecx,(%eax)"); 36028c2ecf20Sopenharmony_ci asm volatile("wrssd %edx,(0x12345678)"); 36038c2ecf20Sopenharmony_ci asm volatile("wrssd %edx,0x12345678(%eax,%ecx,8)"); 36048c2ecf20Sopenharmony_ci 36058c2ecf20Sopenharmony_ci /* wrussd */ 36068c2ecf20Sopenharmony_ci 36078c2ecf20Sopenharmony_ci asm volatile("wrussd %ecx,(%eax)"); 36088c2ecf20Sopenharmony_ci asm volatile("wrussd %edx,(0x12345678)"); 36098c2ecf20Sopenharmony_ci asm volatile("wrussd %edx,0x12345678(%eax,%ecx,8)"); 36108c2ecf20Sopenharmony_ci 36118c2ecf20Sopenharmony_ci /* setssbsy */ 36128c2ecf20Sopenharmony_ci 36138c2ecf20Sopenharmony_ci asm volatile("setssbsy"); 36148c2ecf20Sopenharmony_ci /* Also check instructions in the same group encoding as setssbsy */ 36158c2ecf20Sopenharmony_ci asm volatile("rdpkru"); 36168c2ecf20Sopenharmony_ci asm volatile("wrpkru"); 
36178c2ecf20Sopenharmony_ci 36188c2ecf20Sopenharmony_ci /* clrssbsy */ 36198c2ecf20Sopenharmony_ci 36208c2ecf20Sopenharmony_ci asm volatile("clrssbsy (%eax)"); 36218c2ecf20Sopenharmony_ci asm volatile("clrssbsy (0x12345678)"); 36228c2ecf20Sopenharmony_ci asm volatile("clrssbsy 0x12345678(%eax,%ecx,8)"); 36238c2ecf20Sopenharmony_ci 36248c2ecf20Sopenharmony_ci /* endbr32/64 */ 36258c2ecf20Sopenharmony_ci 36268c2ecf20Sopenharmony_ci asm volatile("endbr32"); 36278c2ecf20Sopenharmony_ci asm volatile("endbr64"); 36288c2ecf20Sopenharmony_ci 36298c2ecf20Sopenharmony_ci /* call with/without notrack prefix */ 36308c2ecf20Sopenharmony_ci 36318c2ecf20Sopenharmony_ci asm volatile("call *%eax"); /* Expecting: call indirect 0 */ 36328c2ecf20Sopenharmony_ci asm volatile("call *(%eax)"); /* Expecting: call indirect 0 */ 36338c2ecf20Sopenharmony_ci asm volatile("call *(0x12345678)"); /* Expecting: call indirect 0 */ 36348c2ecf20Sopenharmony_ci asm volatile("call *0x12345678(%eax,%ecx,8)"); /* Expecting: call indirect 0 */ 36358c2ecf20Sopenharmony_ci 36368c2ecf20Sopenharmony_ci asm volatile("bnd call *%eax"); /* Expecting: call indirect 0 */ 36378c2ecf20Sopenharmony_ci asm volatile("bnd call *(%eax)"); /* Expecting: call indirect 0 */ 36388c2ecf20Sopenharmony_ci asm volatile("bnd call *(0x12345678)"); /* Expecting: call indirect 0 */ 36398c2ecf20Sopenharmony_ci asm volatile("bnd call *0x12345678(%eax,%ecx,8)"); /* Expecting: call indirect 0 */ 36408c2ecf20Sopenharmony_ci 36418c2ecf20Sopenharmony_ci asm volatile("notrack call *%eax"); /* Expecting: call indirect 0 */ 36428c2ecf20Sopenharmony_ci asm volatile("notrack call *(%eax)"); /* Expecting: call indirect 0 */ 36438c2ecf20Sopenharmony_ci asm volatile("notrack call *(0x12345678)"); /* Expecting: call indirect 0 */ 36448c2ecf20Sopenharmony_ci asm volatile("notrack call *0x12345678(%eax,%ecx,8)"); /* Expecting: call indirect 0 */ 36458c2ecf20Sopenharmony_ci 36468c2ecf20Sopenharmony_ci asm volatile("notrack bnd call *%eax"); /* 
Expecting: call indirect 0 */ 36478c2ecf20Sopenharmony_ci asm volatile("notrack bnd call *(%eax)"); /* Expecting: call indirect 0 */ 36488c2ecf20Sopenharmony_ci asm volatile("notrack bnd call *(0x12345678)"); /* Expecting: call indirect 0 */ 36498c2ecf20Sopenharmony_ci asm volatile("notrack bnd call *0x12345678(%eax,%ecx,8)"); /* Expecting: call indirect 0 */ 36508c2ecf20Sopenharmony_ci 36518c2ecf20Sopenharmony_ci /* jmp with/without notrack prefix */ 36528c2ecf20Sopenharmony_ci 36538c2ecf20Sopenharmony_ci asm volatile("jmp *%eax"); /* Expecting: jmp indirect 0 */ 36548c2ecf20Sopenharmony_ci asm volatile("jmp *(%eax)"); /* Expecting: jmp indirect 0 */ 36558c2ecf20Sopenharmony_ci asm volatile("jmp *(0x12345678)"); /* Expecting: jmp indirect 0 */ 36568c2ecf20Sopenharmony_ci asm volatile("jmp *0x12345678(%eax,%ecx,8)"); /* Expecting: jmp indirect 0 */ 36578c2ecf20Sopenharmony_ci 36588c2ecf20Sopenharmony_ci asm volatile("bnd jmp *%eax"); /* Expecting: jmp indirect 0 */ 36598c2ecf20Sopenharmony_ci asm volatile("bnd jmp *(%eax)"); /* Expecting: jmp indirect 0 */ 36608c2ecf20Sopenharmony_ci asm volatile("bnd jmp *(0x12345678)"); /* Expecting: jmp indirect 0 */ 36618c2ecf20Sopenharmony_ci asm volatile("bnd jmp *0x12345678(%eax,%ecx,8)"); /* Expecting: jmp indirect 0 */ 36628c2ecf20Sopenharmony_ci 36638c2ecf20Sopenharmony_ci asm volatile("notrack jmp *%eax"); /* Expecting: jmp indirect 0 */ 36648c2ecf20Sopenharmony_ci asm volatile("notrack jmp *(%eax)"); /* Expecting: jmp indirect 0 */ 36658c2ecf20Sopenharmony_ci asm volatile("notrack jmp *(0x12345678)"); /* Expecting: jmp indirect 0 */ 36668c2ecf20Sopenharmony_ci asm volatile("notrack jmp *0x12345678(%eax,%ecx,8)"); /* Expecting: jmp indirect 0 */ 36678c2ecf20Sopenharmony_ci 36688c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmp *%eax"); /* Expecting: jmp indirect 0 */ 36698c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmp *(%eax)"); /* Expecting: jmp indirect 0 */ 36708c2ecf20Sopenharmony_ci asm volatile("notrack 
bnd jmp *(0x12345678)"); /* Expecting: jmp indirect 0 */ 36718c2ecf20Sopenharmony_ci asm volatile("notrack bnd jmp *0x12345678(%eax,%ecx,8)"); /* Expecting: jmp indirect 0 */ 36728c2ecf20Sopenharmony_ci 36738c2ecf20Sopenharmony_ci#endif /* #ifndef __x86_64__ */ 36748c2ecf20Sopenharmony_ci 36758c2ecf20Sopenharmony_ci /* SGX */ 36768c2ecf20Sopenharmony_ci 36778c2ecf20Sopenharmony_ci asm volatile("encls"); 36788c2ecf20Sopenharmony_ci asm volatile("enclu"); 36798c2ecf20Sopenharmony_ci asm volatile("enclv"); 36808c2ecf20Sopenharmony_ci 36818c2ecf20Sopenharmony_ci /* pconfig */ 36828c2ecf20Sopenharmony_ci 36838c2ecf20Sopenharmony_ci asm volatile("pconfig"); 36848c2ecf20Sopenharmony_ci 36858c2ecf20Sopenharmony_ci /* wbnoinvd */ 36868c2ecf20Sopenharmony_ci 36878c2ecf20Sopenharmony_ci asm volatile("wbnoinvd"); 36888c2ecf20Sopenharmony_ci 36898c2ecf20Sopenharmony_ci /* Following line is a marker for the awk script - do not change */ 36908c2ecf20Sopenharmony_ci asm volatile("rdtsc"); /* Stop here */ 36918c2ecf20Sopenharmony_ci 36928c2ecf20Sopenharmony_ci return 0; 36938c2ecf20Sopenharmony_ci} 3694