Lines Matching refs:m4
480 mova m4, [aq]
484 psubw m4, m0
491 paddw m0, m4
492 paddw m1, m4
493 paddw m2, m4
494 paddw m3, m4
495 pxor m4, m4
496 pmaxsw m0, m4
497 pmaxsw m1, m4
498 pmaxsw m2, m4
499 pmaxsw m3, m4
516 mova m4, [pw_1023]
542 pminsw m0, m4
543 pminsw m1, m4
544 pminsw m2, m4
545 pminsw m3, m4
556 mova m4, [pw_4095]
564 mova m4, [aq]
569 psubw m4, m0
578 paddw m0, m2, m4
580 paddw m1, m3, m4
620 mova m4, [aq+mmsize*0]
627 psubw m4, m0
637 paddw m0, m3, m4
723 mova m4, [pb_2to15_14_15]
725 SHIFT_RIGHTx2 m1, m2, m0, m4 ; bcdefghh/cdefghhh
734 SHIFT_RIGHT m0, m0, m4 ; CDEFGHhh
752 PALIGNR m1, m3, m0, 2, m4 ; bcdefghi
753 PALIGNR m2, m3, m0, 4, m4 ; cdefghij
756 mova m4, [pb_2to15_14_15]
758 SHIFT_RIGHTx2 m2, m1, m3, m4 ; jklmnopp/klmnoppp
773 PALIGNR m3, m1, m0, 2, m4
776 SHIFT_RIGHT m1, m1, m4
787 PALIGNR m4, m1, m0, 2, m6
790 PALIGNR m4, m2, m1, 2, m6
793 PALIGNR m4, m3, m2, 2, m6
799 SHIFT_RIGHTx2 m4, m5, m3, m6
801 pshufd m4, m4, q3333 ; 55555555
815 mova [dstq+stride8q*1+48], m4
818 mova [dstq+stride8q*2+32], m4
819 mova [dstq+stride8q*2+48], m4
821 mova [dstq+stride24q +16], m4
822 mova [dstq+stride24q +32], m4
823 mova [dstq+stride24q +48], m4
858 vpalignr m4, m2, m0, 4 ; cdefghijklmnoppp
868 vpalignr m4, m2, m0, 4
870 mova [dstq+strideq*2], m4
872 vpalignr m4, m2, m0, 8
875 mova [dstq+strideq*0], m4
877 vpalignr m4, m2, m0, 12
879 mova [dstq+strideq*2], m4
898 vperm2i128 m5, m1, m4, q0201 ; yz01234555555555
902 vperm2i128 m2, m1, m4, q0201 ; Z......555555555
912 vpalignr m4, m2, m1, 2
914 mova [dstq+strideq*1 +32], m4
916 vpalignr m4, m2, m1, 4
918 mova [dstq+strideq*2 +32], m4
920 vpalignr m4, m2, m1, 6
922 mova [dstq+stride3q*1+32], m4
925 vpalignr m4, m2, m1, 8
927 mova [dstq+strideq*0 +32], m4
929 vpalignr m4, m2, m1, 10
931 mova [dstq+strideq*1 +32], m4
933 vpalignr m4, m2, m1, 12
935 mova [dstq+strideq*2+32], m4
937 vpalignr m4, m2, m1, 14
939 mova [dstq+stride3q+ 32], m4
941 vpalignr m4, m2, m1, 16
942 vperm2i128 m5, m3, m4, q0201
943 vperm2i128 m2, m4, m4, q0101
945 mova m1, m4
978 PALIGNR m1, m0, 2, m4 ; tuvwxyz*
979 PALIGNR m2, m1, 2, m4 ; uvwxyz*a
1010 mova m4, [aq] ; abcdefgh
1014 PALIGNR m5, m4, 2, m3 ; bcdefghi
1017 PALIGNR m4, m2, 2, m3 ; uvwxyz*a
1028 mova [dst8q+strideq*0+ 0], m4
1031 mova [dst8q+strideq*8+16], m4
1033 vpalignr m2, m4, m2, 2
1034 vpalignr m4, m5, m4, 2
1037 PALIGNR m0, m4, m2, 2, m1
1039 PALIGNR m0, m5, m4, 2, m1
1040 mova m4, m0
1057 PALIGNR m0, m1, 2, m4 ; a[17-24]
1060 movu m4, [aq+mmsize*1-2] ; a[7-14]
1063 mova m4, [aq+mmsize*0] ; a[0-7]
1065 PALIGNR m3, m4, 2, m6 ; a[1-8]
1074 PALIGNR m4, m5, 2, m0 ; l[26-31]*a
1110 mova [dst8q+stride8q*0+ 0], m4
1115 mova [dst8q+stride8q*1+16], m4
1120 mova [dst8q+stride8q*2+32], m4
1125 mova [dst8q+stride24q +48], m4
1129 vpalignr m5, m4, m5, 2
1130 vpalignr m4, m3, m4, 2
1143 PALIGNR m2, m4, m5, 2, m0
1145 PALIGNR m2, m3, m4, 2, m0
1146 mova m4, m2
1179 vperm2i128 m4, m2, m2, q2001 ; ijklmnop........
1180 vpalignr m5, m4, m2, 2 ; bcdefghijklmnop.
1183 vpalignr m4, m3, m0, 2 ; lmnopqrstuvwxyz*
1193 vpalignr m4, m1, m5, 2
1195 mova [ dstq+stride3q*2], m4 ; 6
1197 vpalignr m4, m1, m5, 4
1200 mova [dst3q+strideq*2 ], m4 ; 5
1203 vpalignr m4, m1, m5, 6
1205 mova [dst3q+strideq*1], m4 ; 4
1207 vpalignr m4, m1, m5, 8
1209 mova [dst3q+strideq*0], m4 ; 3
1211 vpalignr m4, m1, m5, 10
1213 mova [dstq+strideq*2 ], m4 ; 2
1215 vpalignr m4, m1, m5, 12
1217 mova [dstq+strideq*1 ], m4 ; 1
1219 vpalignr m4, m1, m5, 14
1221 mova [dstq+strideq*0], m4 ; 0
1231 vperm2i128 m4, m3, m1, q0201 ; jklmnopppppppppp
1237 pavgw m4, m2 ; ijklmnoppppppppp
1245 vpalignr m0, m4, m3, 2
1249 vpalignr m0, m4, m3, 4
1253 vpalignr m0, m4, m3, 6
1257 vpalignr m0, m4, m3, 8
1261 vpalignr m0, m4, m3, 10
1263 vpalignr m0, m4, m3, 12
1265 vpalignr m0, m4, m3, 14
1281 vpalignr m4, m2, m1, 4 ; mnopqrstuvwxyz*a
1287 vpunpcklwd m0, m3, m4 ; kLlMmNnOsTtUuVvW
1288 vpunpckhwd m1, m3, m4 ; oPpQqRrSwXxYyZz#
1290 vperm2i128 m4, m0, m1, q0301 ; sTtUuVvWwXxYyZz#
1291 vperm2i128 m0, m4, m2, q0201 ; wXxYyZz#ABCDEFGH
1292 vperm2i128 m1, m3, m4, q0201 ; oPpQqRrSsTtUuVvW
1300 mova [dst5q+strideq*2], m4 ; 7 sTtUuVvWwXxYyZz#
1302 vpalignr m5, m4, m1, 4
1304 vpalignr m5, m0, m4, 4
1308 vpalignr m5, m4, m1, 8
1310 vpalignr m5, m0, m4, 8
1315 vpalignr m6, m4, m1, 12
1318 vpalignr m5, m0, m4, 12
1336 mova m4, [aq+mmsize*1+0] ; qrstuvwxyz012345
1345 vperm2i128 m5, m3, m4, q0201 ; ijklmnopqrstuvwx
1349 vperm2i128 m6, m4, m4, q2001 ; yz012345........
1350 vpalignr m7, m6, m4, 2 ; rstuvwxyz012345.
1352 vperm2i128 m4, m1, m2, q0201 ; TUVWXYZ#ABCDEFGH
1368 vpalignr m6, m4, m1, 2
1375 vpalignr m6, m4, m1, 4
1382 vpalignr m6, m4, m1, 6
1389 vpalignr m6, m4, m1, 8
1396 vpalignr m6, m4, m1, 10
1403 vpalignr m6, m4, m1, 12
1410 vpalignr m6, m4, m1, 14
1419 mova m1, m4
1420 mova m4, m2
1486 PALIGNR m3, m1, m0, 4, m4
1490 mova m4, [pb_2to15_14_15]
1492 SHIFT_RIGHTx2 m5, m0, m1, m4
1508 PALIGNR m5, m1, m2, 2, m4
1510 PALIGNR m5, m0, m3, 2, m4
1513 SHIFT_RIGHT m1, m1, m4
1514 SHIFT_RIGHT m0, m0, m4
1529 PALIGNR m4, m2, m1, 2, m0
1532 pavgw m4, m1
1562 mova [dstq+strideq*0+16], m4
1569 mova [dstq+stride16q+ 0], m4
1583 vpalignr m6, m4, m6, 2
1584 vpalignr m4, m2, m4, 2
1594 PALIGNR m3, m4, m6, 2, m1
1596 PALIGNR m3, m2, m4, 2, m1
1597 mova m4, m3
1676 PALIGNR m3, m1, m2, 14, m4 ; z*abcdef
1679 PALIGNR m1, m2, 2, m4 ; tuvwxyz*
1680 pslldq m4, m2, 2 ; .stuvwxy
1687 PALIGNR m0, m4, 14, m1
1688 pslldq m4, 2
1689 PALIGNR m3, m4, 14, m1
1690 pslldq m4, 2
1694 PALIGNR m0, m4, 14, m1
1695 pslldq m4, 2
1696 PALIGNR m3, m4, 14, m1
1697 pslldq m4, 2
1700 PALIGNR m0, m4, 14, m1
1701 pslldq m4, 2
1702 PALIGNR m3, m4, 14, m4
1711 mova m4, [aq+mmsize] ; ijklmnop
1716 pavgw m2, m4
1723 pslldq m4, m5, 2 ; .lmnopqr
1726 psrld m4, m1, 16
1730 packssdw m7, m4
1741 PALIGNR m2, m3, 14, m4
1742 PALIGNR m3, m7, 14, m4
1744 PALIGNR m6, m0, 14, m4
1745 PALIGNR m0, m5, 14, m4
1756 mova m4, [aq+mmsize*3+0] ; a[24-31]
1760 pavgw m3, m4
1761 mova m4, [aq+mmsize*2+0] ; a[16-23]
1765 pavgw m2, m4
1766 mova m4, [aq+mmsize*1+0] ; a[8-15]
1770 pavgw m1, m4
1771 mova m4, [aq+mmsize*0+0] ; a[0-7]
1776 pavgw m4, m0
1816 mova [dstq+strideq*0+ 0], m4
1827 mova [dstq+stride16q+16], m4
1839 PALIGNR m1, m4, 14, m5
1840 PALIGNR m4, m6, 14, m5
1864 mova [dstq+strideq*0+ 0], m4
1869 mova [dstq+stride16q+16], m4
1875 PALIGNR m3, m4, 14, m6
1876 PALIGNR m4, m5, 14, m6
1961 SHIFT_RIGHTx2 m0, m4, m3, m5
1976 mova [dstq+strideq *8+16], m4
1977 mova [dstq+stride3q*4+ 0], m4
1983 vpalignr m3, m4, m3, 4
1984 vpalignr m4, m0, m4, 4
1990 PALIGNR m5, m4, m3, 4, m6
1992 PALIGNR m5, m0, m4, 4, m6
1993 mova m4, m5
2008 mova m4, [lq+mmsize*1+0]
2012 pavgw m3, m4
2016 movu m4, [lq+mmsize*2+4]
2057 mova [dstq+stride4q*2+48], m4
2088 mova [dstq+stride3q*4+32], m4
2091 mova [dstq+stride4q*4+16], m4
2094 mova [dstq+stride20q + 0], m4
2108 vpalignr m5, m4, m5, 4
2109 vpalignr m4, m7, m4, 4
2115 PALIGNR m0, m4, m5, 4, m3
2117 PALIGNR m0, m7, m4, 4, m3
2118 mova m4, m0
2165 PALIGNR m3, m1, m0, 4, m4
2170 psrldq m4, m1, 4
2185 PALIGNR m0, m3, m2, 4, m4
2187 PALIGNR m0, m1, m3, 4, m4
2201 mova m4, [lq+mmsize]
2203 PALIGNR m3, m5, m4, 2, m6
2204 PALIGNR m2, m5, m4, 4, m6
2206 pavgw m3, m4
2210 movu m4, [aq+2]
2226 mova [dstq+mstride3q*4+16], m4
2237 vpalignr m2, m4, m2, 4
2238 vpalignr m4, m5, m4, 4
2246 PALIGNR m6, m4, m2, 4, m7
2248 PALIGNR m6, m5, m4, 4, m7
2249 mova m4, m6
2264 mova m4, [lq+mmsize*1+0]
2268 pavgw m3, m4
2276 movu m4, [lq+mmsize*2+4]
2307 mova [rsp+4*mmsize], m4
2338 mova [dstq+stride20q +48], m4
2341 mova [dstq+stride4q*4+32], m4
2345 mova [dstq+stride3q*4+16], m4
2348 mova [dstq+strideq* 8+ 0], m4
2368 vpalignr m5, m4, m5, 4
2369 vpalignr m4, m7, m4, 4
2390 PALIGNR m3, m4, m5, 4, m2
2392 PALIGNR m3, m7, m4, 4, m2
2393 mova m4, m3
2422 mova m4, [rsp+4*mmsize]
2443 mova [dstq+strideq* 4+48], m4
2446 mova [dstq+strideq* 0+32], m4
2454 vpalignr m5, m4, m5, 4
2455 vpalignr m4, m7, m4, 4
2470 PALIGNR m6, m4, m5, 4, m7
2476 PALIGNR m6, m7, m4, 4, m5
2477 mova m4, m6