Lines Matching refs:T4

344 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
817 vpunpckhqdq $T1,$T0,$T4 # 4
821 vpsrlq \$40,$T4,$T4 # 4
829 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
910 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
913 vpmuludq 0x20(%rsp),$T4,$H0 # h4*s1
936 vpmuludq $T4,$H4,$H0 # h4*s2
947 vpmuludq $T4,$H3,$H0 # h4*s3
959 vpmuludq $T4,$H4,$T4 # h4*s4
962 vpaddq $T4,$D3,$D3 # d3 += h4*s4
964 vpmuludq 0x70(%rsp),$T0,$T4 # h0*r4
967 vpaddq $T4,$D4,$D4 # d4 += h0*r4
968 vmovdqa -0x90(%r11),$T4 # r0^4
1006 vpmuludq $H0,$T4,$T0 # h0*r0
1007 vpmuludq $H1,$T4,$T1 # h1*r0
1011 vpmuludq $H2,$T4,$T0 # h2*r0
1012 vpmuludq $H3,$T4,$T1 # h3*r0
1015 vpmuludq $H4,$T4,$T4 # h4*r0
1017 vpaddq $T4,$D4,$D4
1030 vmovdqa -0x50(%r11),$T4 # s2^4
1037 vpmuludq $H4,$T4,$T0 # h4*s2
1041 vpmuludq $H3,$T4,$T4 # h3*s2
1043 vpaddq $T4,$D0,$D0 # d0 += h3*s2
1045 vmovdqa -0x10(%r11),$T4 # s4^4
1058 vpmuludq $H2,$T4,$H2 # h2*s4
1059 vpmuludq $H3,$T4,$H3 # h3*s4
1062 vpmuludq $H4,$T4,$H4 # h4*s4
1067 vpmuludq $H1,$T4,$H0
1068 vpunpckhqdq $T1,$T0,$T4 # 4
1075 #vpsrlq \$40,$T4,$T4 # 4
1076 vpsrldq \$`40/8`,$T4,$T4 # 4
1082 vpand 0(%rcx),$T4,$T4 # .Lmask24
1086 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
1137 vpaddq $H4,$T4,$T4
1157 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
1169 vpmuludq $T4,$H3,$H3 # h4*s1
1180 vpmuludq $T4,$H2,$H1 # h4*s2
1191 vpmuludq $T4,$H4,$H1 # h4*s3
1201 vpmuludq $T4,$H3,$H1 # h4*s4
1231 vpshufd \$0x32,`16*0-64`($ctx),$T4 # r0^n, 34xx -> x3x4
1241 vpmuludq $H0,$T4,$T0 # h0*r0
1243 vpmuludq $H1,$T4,$T1 # h1*r0
1245 vpmuludq $H2,$T4,$T0 # h2*r0
1248 vpmuludq $H3,$T4,$T1 # h3*r0
1250 vpmuludq $H4,$T4,$T4 # h4*r0
1251 vpaddq $T4,$D4,$D4 # d4 += h4*r0
1258 vpshufd \$0x32,`16*3-64`($ctx),$T4 # r2
1267 vpmuludq $H2,$T4,$T1 # h2*r2
1269 vpmuludq $H1,$T4,$T0 # h1*r2
1272 vpmuludq $H0,$T4,$T4 # h0*r2
1273 vpaddq $T4,$D2,$D2 # d2 += h0*r2
1276 vpshufd \$0x32,`16*6-64`($ctx),$T4 # s3
1285 vpmuludq $H4,$T4,$T1 # h4*s3
1288 vpmuludq $H3,$T4,$T0 # h3*s3
1290 vpmuludq $H2,$T4,$T4 # h2*s3
1291 vpaddq $T4,$D0,$D0 # d0 += h2*s3
1308 vpsrldq \$8,$D4,$T4
1314 vpaddq $T4,$D4,$D4
1442 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1755 vmovdqu `16*2-64`($ctx),%x#$T4
1765 vpermd $T4,$T0,$T4
1770 vmovdqa $T4,0x40-0x90(%rax)
1793 vpunpckhqdq $T1,$T0,$T4 # 4
1800 vpsrlq \$40,$T4,$T4 # 4
1805 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
1828 vpaddq $H4,$T4,$H4
1853 vpmuludq $H0,$T1,$T4 # h0*r1
1855 vpaddq $T4,$D1,$D1 # d1 += h0*r1
1857 vpmuludq $H3,$T1,$T4 # h3*r1
1859 vpaddq $T4,$D4,$D4 # d4 += h3*r1
1863 vpmuludq $H0,$T0,$T4 # h0*r0
1865 vpaddq $T4,$D0,$D0 # d0 += h0*r0
1867 vpmuludq $H3,$T0,$T4 # h3*r0
1870 vpaddq $T4,$D3,$D3 # d3 += h3*r0
1874 vpmuludq $H3,$T1,$T4 # h3*s2
1877 vpaddq $T4,$D0,$D0 # d0 += h3*s2
1880 vpmuludq $H1,$T2,$T4 # h1*r2
1882 vpaddq $T4,$D3,$D3 # d3 += h1*r2
1887 vpmuludq $H1,$H2,$T4 # h1*r3
1890 vpaddq $T4,$D4,$D4 # d4 += h1*r3
1892 vpmuludq $H3,$T3,$T4 # h3*s3
1895 vpaddq $T4,$D1,$D1 # d1 += h3*s3
1897 vpunpckhqdq $T1,$T0,$T4 # 4
1949 vpsrlq \$40,$T4,$T4 # 4
1958 vpor 32(%rcx),$T4,$T4 # padbit, yes, always
1978 vpaddq $H4,$T4,$H4
1988 vpmuludq $H0,$T1,$T4 # h0*r1
1990 vpaddq $T4,$D1,$D1 # d1 += h0*r1
1992 vpmuludq $H3,$T1,$T4 # h3*r1
1994 vpaddq $T4,$D4,$D4 # d4 += h3*r1
1997 vpmuludq $H0,$T0,$T4 # h0*r0
1999 vpaddq $T4,$D0,$D0 # d0 += h0*r0
2002 vpmuludq $H3,$T0,$T4 # h3*r0
2004 vpaddq $T4,$D3,$D3 # d3 += h3*r0
2007 vpmuludq $H3,$T1,$T4 # h3*s2
2009 vpaddq $T4,$D0,$D0 # d0 += h3*s2
2012 vpmuludq $H1,$T2,$T4 # h1*r2
2014 vpaddq $T4,$D3,$D3 # d3 += h1*r2
2017 vpmuludq $H1,$H2,$T4 # h1*r3
2019 vpaddq $T4,$D4,$D4 # d4 += h1*r3
2021 vpmuludq $H3,$T3,$T4 # h3*s3
2023 vpaddq $T4,$D1,$D1 # d1 += h3*s3
2042 vpsrldq \$8,$H4,$T4
2047 vpaddq $T4,$H4,$H4
2051 vpermq \$0x2,$H4,$T4
2056 vpaddq $T4,$H4,$H4
2137 map(s/%y/%z/,($T4,$T0,$T1,$T2,$T3)); # switch to %zmm domain
2187 vmovdqu `16*8-64`($ctx),%x#$T4 # ... ${S4}
2203 vpermd $T4,$T2,$S4
2243 vpsrlq \$32,$R4,$T4
2261 vpmuludq $T4,$S4,$M3
2262 vpmuludq $T4,$R0,$M4
2263 vpmuludq $T4,$S1,$M0
2264 vpmuludq $T4,$S2,$M1
2265 vpmuludq $T4,$S3,$M2
2275 vmovdqu64 16*4($inp),%z#$T4
2316 vpunpcklqdq $T4,$T3,$T0 # transpose input
2317 vpunpckhqdq $T4,$T3,$T4
2352 vpsllq \$12,$T4,$T3
2355 vpsrlq \$14,$T4,$T3
2356 vpsrlq \$40,$T4,$T4 # 4
2361 #vporq $PADBIT,$T4,$T4 # padbit, yes, always
2405 vporq $PADBIT,$T4,$T4 # padbit, yes, always
2409 vpaddq $H4,$T4,$H4
2412 vmovdqu64 16*4($inp),$T4
2432 vpunpcklqdq $T4,$T3,$T0 # transpose input
2433 vpunpckhqdq $T4,$T3,$T4
2466 vpsllq \$12,$T4,$T3
2498 vpsrlq \$14,$T4,$T3
2504 vpsrlq \$40,$T4,$T4 # 4
2513 #vporq $PADBIT,$T4,$T4 # padbit, yes, always
2548 vporq $PADBIT,$T4,$T4 # padbit, yes, always
2551 vpaddq $H4,$T4,$H4
2640 map(s/%z/%y/,($T0,$T1,$T2,$T3,$T4, $PADBIT));
2650 vpunpckhqdq $T1,$T0,$T4 # 4
2671 vpsrlq \$40,$T4,$T4 # 4
2689 vpor 32(%rcx),$T4,$T4 # padbit, yes, always