Lines Matching refs:D4
344 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
805 vmovdqu `16*3`($ctx),$D4 # preload r0^2
836 vpshufd \$0xEE,$D4,$D3 # 34xx -> 3434
837 vpshufd \$0x44,$D4,$D0 # xx12 -> 1212
840 vpshufd \$0xEE,$D1,$D4
843 vmovdqa $D4,-0x80(%r11)
850 vpshufd \$0xEE,$D0,$D4
853 vmovdqa $D4,-0x60(%r11)
860 vpshufd \$0xEE,$D2,$D4
863 vmovdqa $D4,-0x40(%r11)
870 vpshufd \$0xEE,$D1,$D4
872 vmovdqa $D4,-0x20(%r11)
875 vmovdqa 0x00(%rsp),$D4 # preload r0^2
902 # and $D4 is preloaded with r0^2...
904 vpmuludq $T0,$D4,$D0 # d0 = h0*r0
905 vpmuludq $T1,$D4,$D1 # d1 = h1*r0
907 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
909 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
910 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
917 vpaddq $H1,$D4,$D4 # d4 += h3*r1
930 vpaddq $H0,$D4,$D4 # d4 += h2*r2
945 vpaddq $H1,$D4,$D4 # d4 += h1*r3
967 vpaddq $T4,$D4,$D4 # d4 += h0*r4
1017 vpaddq $T4,$D4,$D4
1024 vpaddq $T0,$D4,$D4 # d4 += h3*r1
1033 vpaddq $T0,$D4,$D4 # d4 += h2*r2
1046 vpaddq $T1,$D4,$D4 # d4 += h1*r3
1069 vpaddq $H4,$D4,$H4 # h4 = d4 + h0*r4
1078 vmovdqa 0x00(%rsp),$D4 # preload r0^2
1129 vpshufd \$0x10,$D4,$D4 # r0^n, xx12 -> x1x2
1152 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
1153 vpmuludq $T0,$D4,$D0 # d0 = h0*r0
1155 vpmuludq $T1,$D4,$D1 # d1 = h1*r0
1156 vpmuludq $T3,$D4,$D3 # d3 = h3*r0
1157 vpmuludq $T4,$D4,$D4 # d4 = h4*r0
1160 vpaddq $H0,$D4,$D4 # d4 += h3*r1
1174 vpaddq $H1,$D4,$D4 # d4 += h2*r2
1187 vpaddq $H0,$D4,$D4 # d4 += h1*r3
1200 vpaddq $H2,$D4,$D4 # d4 += h0*r4
1251 vpaddq $T4,$D4,$D4 # d4 += h4*r0
1254 vpaddq $T0,$D4,$D4 # d4 += h3*r1
1268 vpaddq $T1,$D4,$D4 # d4 += h2*r2
1281 vpaddq $T0,$D4,$D4 # d4 += h1*r3
1294 vpaddq $T2,$D4,$D4 # d4 += h0*r4
1308 vpsrldq \$8,$D4,$T4
1314 vpaddq $T4,$D4,$D4
1324 vpaddq $H3,$D4,$D4 # h3 -> h4
1330 vpsrlq \$26,$D4,$H4
1331 vpand $MASK,$D4,$D4
1351 vpaddq $H3,$D4,$D4 # h3 -> h4
1357 vmovd $D4,`4*4-48-64`($ctx)
1442 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1762 vmovdqu `16*7-64`($ctx),%x#$D4
1775 vpermd $D4,$T0,$D4
1779 vmovdqa $D4,0xe0-0x90(%rax)
1849 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1859 vpaddq $T4,$D4,$D4 # d4 += h3*r1
1871 vpaddq $H2,$D4,$D4 # d4 += h4*r0
1890 vpaddq $T4,$D4,$D4 # d4 += h1*r3
1908 vpaddq $H4,$D4,$H4 # h4 = d4 + h0*r4
1922 vpsrlq \$26,$H4,$D4
1931 vpaddq $D4,$H0,$H0
1932 vpsllq \$2,$D4,$D4
1933 vpaddq $D4,$H0,$H0 # h4 -> h0
1984 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1994 vpaddq $T4,$D4,$D4 # d4 += h3*r1
2005 vpaddq $H2,$D4,$D4 # d4 += h4*r0
2019 vpaddq $T4,$D4,$D4 # d4 += h1*r3
2033 vpaddq $H4,$D4,$H4 # h4 = d4 + h0*r4
2072 vpsrlq \$26,$H4,$D4
2079 vpaddq $D4,$H0,$H0
2080 vpsllq \$2,$D4,$D4
2081 vpaddq $D4,$H0,$H0 # h4 -> h0
2138 map(s/%y/%z/,($D0,$D1,$D2,$D3,$D4));
2186 vmovdqu `16*7-64`($ctx),%x#$D4 # ... ${R4}
2201 vpermd $D4,$T2,$R4
2223 vpmuludq $T0,$R4,$D4 # d4 = r0'*r4
2236 vpaddq $M4,$D4,$D4 # d4 += r1'*r3
2247 vpaddq $M4,$D4,$D4 # d4 += r2'*r2
2257 vpaddq $M4,$D4,$D4 # d4 += r3'*r1
2267 vpaddq $M4,$D4,$D4 # d4 += r4'*r0
2283 vpaddq $M3,$D4,$D4 # d3 -> d4
2289 vpsrlq \$26,$D4,$M4
2290 vpandq $MASK,$D4,$D4
2310 vpaddq $M3,$D4,$D4 # d3 -> d4
2314 # $D0-$D4, ...
2338 vpermd $D4,$M0,${R4}{%k1}
2400 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2419 vpaddq $M4,$D4,$D4 # d4 += h0*r4
2428 vpaddq $M4,$D4,$D4 # d4 += h1*r3
2440 vpaddq $M4,$D4,$D4 # d4 += h3*r1
2450 vpaddq $M4,$D4,$D4 # d4 += h4*r0
2470 vpaddq $H3,$D4,$H4 # h3 -> h4
2480 vpsrlq \$26,$H4,$D4
2487 vpaddq $D4,$H0,$H0
2488 vpsllq \$2,$D4,$D4
2489 vpaddq $D4,$H0,$H0 # h4 -> h0
2542 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2559 vpaddq $M4,$D4,$D4 # d4 += h0*r4
2569 vpaddq $M4,$D4,$D4 # d4 += h1*r3
2579 vpaddq $M4,$D4,$D4 # d4 += h3*r1
2590 vpaddq $M4,$D4,$D4 # d4 += h4*r0
2607 vpermq \$0xb1,$D4,$H4
2612 vpaddq $D4,$H4,$H4
2619 vpermq \$0x2,$H4,$D4
2624 vpaddq $D4,$H4,$H4
2630 vextracti64x4 \$0x1,$H4,%y#$D4
2635 vpaddq $D4,$H4,${H4}{%k3}{z} # it's passed to .Ltail_avx2
2641 map(s/%z/%y/,($H0,$H1,$H2,$H3,$H4, $D0,$D1,$D2,$D3,$D4, $MASK));
2659 vpsrlq \$26,$H4,$D4
2668 vpaddq $D4,$H0,$H0
2669 vpsllq \$2,$D4,$D4
2672 vpaddq $D4,$H0,$H0 # h4 -> h0