Lines Matching refs:T2

344 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
815 vpsrldq \$6,$T0,$T2 # splat input
819 vpunpcklqdq $T3,$T2,$T3 # 2:3
824 vpsrlq \$4,$T3,$T2
827 vpand $MASK,$T2,$T2 # 2
907 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
919 vpmuludq $T2,$H2,$H0 # h2*r1
926 vpmuludq $T2,$H3,$H0 # h2*r2
952 vpmuludq $T2,$H3,$H3 # h2*s3
953 vpmuludq $T2,$H4,$T2 # h2*s4
957 vpaddq $T2,$D1,$D1 # d1 += h2*s4
1010 vmovdqa -0x80(%r11),$T2 # r1^4
1020 vpmuludq $H2,$T2,$T1 # h2*r1
1021 vpmuludq $H3,$T2,$T0 # h3*r1
1025 vpmuludq $H1,$T2,$T1 # h1*r1
1026 vpmuludq $H0,$T2,$T2 # h0*r1
1028 vpaddq $T2,$D1,$D1 # d1 += h0*r1
1035 vmovdqa -0x40(%r11),$T2 # r3^4
1042 vpmuludq $H1,$T2,$T1 # h1*r3
1047 vpmuludq $H0,$T2,$T2 # h0*r3
1049 vpaddq $T2,$D3,$D3 # d3 += h0*r3
1052 vpmuludq $H3,$T3,$T2 # h3*s3
1054 vpaddq $T2,$D1,$D1 # d1 += h3*s3
1060 vpsrldq \$6,$T0,$T2 # splat input
1073 vpunpcklqdq $T3,$T2,$T3 # 2:3
1080 vpsrlq \$4,$T3,$T2
1084 vpand $MASK,$T2,$T2 # 2
1133 vpaddq $H2,$T2,$T2
1152 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
1162 vpmuludq $T2,$H2,$H1 # h2*r1
1173 vpmuludq $T2,$H4,$H1 # h2*r2
1196 vpmuludq $T2,$H4,$H4 # h2*s3
1205 vpmuludq $T2,$H3,$H1 # h2*s4
1247 vpshufd \$0x32,`16*1-64`($ctx),$T2 # r1^n
1253 vpmuludq $H3,$T2,$T0 # h3*r1
1256 vpmuludq $H2,$T2,$T1 # h2*r1
1259 vpmuludq $H1,$T2,$T0 # h1*r1
1261 vpmuludq $H0,$T2,$T2 # h0*r1
1262 vpaddq $T2,$D1,$D1 # d1 += h0*r1
1266 vpshufd \$0x32,`16*4-64`($ctx),$T2 # s2
1274 vpmuludq $H4,$T2,$T1 # h4*s2
1277 vpmuludq $H3,$T2,$T2 # h3*s2
1278 vpaddq $T2,$D0,$D0 # d0 += h3*s2
1284 vpshufd \$0x32,`16*7-64`($ctx),$T2 # r4
1293 vpmuludq $H0,$T2,$T2 # h0*r4
1294 vpaddq $T2,$D4,$D4 # d4 += h0*r4
1312 vpsrldq \$8,$D2,$T2
1317 vpaddq $T2,$D2,$D2
1442 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1752 vmovdqu `16*0-64`($ctx),%x#$T2
1761 vpermd $T2,$T0,$T2 # 00003412 -> 14243444
1766 vmovdqa $T2,0x00(%rsp)
1791 vpsrldq \$6,$T0,$T2 # splat input
1794 vpunpcklqdq $T3,$T2,$T2 # 2:3
1797 vpsrlq \$30,$T2,$T3
1798 vpsrlq \$4,$T2,$T2
1801 vpand $MASK,$T2,$T2 # 2
1807 vpaddq $H2,$T2,$H2 # accumulate input
1821 #vpaddq $H2,$T2,$H2 # accumulate input
1827 vmovdqa `32*3`(%rsp),$T2 # r2^4
1849 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1880 vpmuludq $H1,$T2,$T4 # h1*r2
1881 vpmuludq $H0,$T2,$T2 # h0*r2
1883 vpaddq $T2,$D2,$D2 # d2 += h0*r2
1889 vpsrldq \$6,$T0,$T2 # splat input
1904 vpunpcklqdq $T3,$T2,$T3 # 2:3
1925 vpsrlq \$4,$T3,$T2
1935 vpand $MASK,$T2,$T2 # 2
1942 vpaddq $T2,$H2,$H2 # modulo-scheduled
1971 #vpaddq $H2,$T2,$H2 # accumulate input
1977 vmovdqu `32*3+4`(%rsp),$T2 # r2^4
1984 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
2012 vpmuludq $H1,$T2,$T4 # h1*r2
2013 vpmuludq $H0,$T2,$T2 # h0*r2
2015 vpaddq $T2,$D2,$D2 # d2 += h0*r2
2040 vpsrldq \$8,$H2,$T2
2045 vpaddq $T2,$H2,$H2
2054 vpermq \$0x2,$H2,$T2
2059 vpaddq $T2,$H2,$H2
2137 map(s/%y/%z/,($T4,$T0,$T1,$T2,$T3)); # switch to %zmm domain
2174 vmovdqa 96(%rcx),%y#$T2 # .Lpermd_avx2
2188 vpermd $D0,$T2,$R0 # 00003412 -> 14243444
2190 vpermd $D1,$T2,$R1
2191 vpermd $T0,$T2,$S1
2192 vpermd $D2,$T2,$R2
2195 vpermd $T1,$T2,$S2
2198 vpermd $D3,$T2,$R3
2200 vpermd $T3,$T2,$S3
2201 vpermd $D4,$T2,$R4
2203 vpermd $T4,$T2,$S4
2224 vpsrlq \$32,$R2,$T2
2238 vpmuludq $T2,$S3,$M0
2239 vpmuludq $T2,$S4,$M1
2240 vpmuludq $T2,$R1,$M3
2241 vpmuludq $T2,$R2,$M4
2242 vpmuludq $T2,$R0,$M2
2351 vpsrlq \$52,$T0,$T2 # splat input
2353 vporq $T3,$T2,$T2
2357 vpandq $MASK,$T2,$T2 # 2
2363 vpaddq $H2,$T2,$H2 # accumulate input
2381 #vpaddq $H2,$T2,$H2 # accumulate input
2465 vpsrlq \$52,$T0,$T2 # splat input
2472 vporq $T3,$T2,$T2
2478 vpandq $MASK,$T2,$T2 # 2
2491 vpaddq $T2,$H2,$H2 # modulo-scheduled
2538 #vpaddq $H2,$T2,$H2 # accumulate input
2640 map(s/%z/%y/,($T0,$T1,$T2,$T3,$T4, $PADBIT));
2648 vpsrldq \$6,$T0,$T2 # splat input
2655 vpunpcklqdq $T3,$T2,$T2 # 2:3
2664 vpsrlq \$30,$T2,$T3
2665 vpsrlq \$4,$T2,$T2
2676 vpand $MASK,$T2,$T2 # 2
2682 vpaddq $H2,$T2,$H2 # accumulate input for .Ltail_avx2
2696 vpsubq $T2,$H2,$H2 # undo input accumulation
2930 my ($T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD) = map("%ymm$_",(24..31));
2975 vmovdqu64 16*0($inp),$T2 # load data
2979 vpunpcklqdq $T3,$T2,$T1 # transpose data
2980 vpunpckhqdq $T3,$T2,$T3
2984 vpsrlq \$24,$T3,$T2 # splat the data
2985 vporq $PAD,$T2,$T2
2986 vpaddq $T2,$H2,$H2 # accumulate input
3145 vmovdqu64 16*0($inp),$T2 # load data
3149 vpunpcklqdq $T3,$T2,$T1 # transpose data
3150 vpunpckhqdq $T3,$T2,$T3
3154 vpsrlq \$24,$T3,$T2 # splat the data
3155 vporq $PAD,$T2,$T2
3156 vpaddq $T2,$H2,$H2 # accumulate input
3168 #vpaddq $T2,$H2,$H2 # accumulate input
3185 vmovdqu64 16*0($inp),$T2 # load data
3195 vpunpcklqdq $T3,$T2,$T1 # transpose data
3196 vpunpckhqdq $T3,$T2,$T3
3211 vpsrlq \$24,$T3,$T2
3212 vporq $PAD,$T2,$T2
3230 vpaddq $T2,$H2,$H2 # accumulate input
3257 #vpaddq $T2,$H2,$H2 # accumulate input
3299 vpsrldq \$8,$D2lo,$T2
3305 vpaddq $T2,$D2lo,$D2lo
3312 vpermq \$0x2,$D2lo,$T2
3316 vpaddq $T2,$D2lo,${D2lo}{%k1}{z}
3373 my ($T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD) = map("%ymm$_",(24..31));
3476 vpunpcklqdq $R2,$RR2,$T2 # 3748
3486 map(s/%y/%z/, $T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD);
3490 vshufi64x2 \$0x44,$R2,$T2,$RR2 # 15263748
3494 vmovdqu64 16*0($inp),$T2 # load data
3515 vpunpcklqdq $T3,$T2,$T1 # transpose data
3516 vpunpckhqdq $T3,$T2,$T3
3520 vpsrlq \$24,$T3,$T2 # splat the data
3521 vporq $PAD,$T2,$T2
3522 vpaddq $T2,$H2,$H2 # accumulate input
3535 #vpaddq $T2,$H2,$H2 # accumulate input
3552 vmovdqu64 16*0($inp),$T2 # load data
3562 vpunpcklqdq $T3,$T2,$T1 # transpose data
3563 vpunpckhqdq $T3,$T2,$T3
3578 vpsrlq \$24,$T3,$T2
3579 vporq $PAD,$T2,$T2
3597 vpaddq $T2,$H2,$H2 # accumulate input
3614 #vpaddq $T2,$H2,$H2 # accumulate input
3656 vpsrldq \$8,$D2lo,$T2
3662 vpaddq $T2,$D2lo,$D2lo
3669 vpermq \$0x2,$D2lo,$T2
3675 vpaddq $T2,$D2lo,$D2lo
3680 vextracti64x4 \$1,$D2lo,%y#$T2
3686 map(s/%z/%y/, $T0,$T1,$T2,$T3,$mask44,$mask42,$tmp,$PAD);
3693 vpaddq $T2,$D2lo,${D2lo}{%k1}{z}