Lines Matching refs:H2

344 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
637 vmovd $h0#d,$H2
740 vmovd $h0#d,$H2
774 vmovd 4*2($ctx),$H2
906 vmovdqa $H2,0x20(%r11) # offload hash
908 vmovdqa 0x10(%rsp),$H2 # r1^2
915 vpmuludq $T3,$H2,$H1 # h3*r1
919 vpmuludq $T2,$H2,$H0 # h2*r1
920 vpmuludq $T1,$H2,$H1 # h1*r1
925 vpmuludq $T0,$H2,$H2 # h0*r1
927 vpaddq $H2,$D1,$D1 # d1 += h0*r1
934 vmovdqa 0x50(%rsp),$H2 # r3^2
943 vpmuludq $T1,$H2,$H1 # h1*r3
944 vpmuludq $T0,$H2,$H2 # h0*r3
946 vpaddq $H2,$D3,$D3 # d3 += h0*r3
960 vpsrldq \$6,$H0,$H2 # splat input
972 vpunpcklqdq $H3,$H2,$H3 # 2:3
978 vpsrlq \$4,$H3,$H2
982 vpand $MASK,$H2,$H2 # 2
988 vpaddq 0x20(%r11),$H2,$H2
1011 vpmuludq $H2,$T4,$T0 # h2*r0
1020 vpmuludq $H2,$T2,$T1 # h2*r1
1031 vpmuludq $H2,$T3,$T0 # h2*r2
1053 vpmuludq $H2,$T3,$T3 # h2*s3
1058 vpmuludq $H2,$T4,$H2 # h2*s4
1061 vpaddq $H2,$D1,$D1 # d1 += h2*s4
1064 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
1105 vpaddq $D1,$H2,$H2 # h1 -> h2
1111 vpsrlq \$26,$H2,$D2
1112 vpand $MASK,$H2,$H2
1133 vpaddq $H2,$T2,$T2
1140 vmovdqa $H2,0x20(%r11)
1154 vpshufd \$0x10,`16*1-64`($ctx),$H2 # r1^n
1159 vpmuludq $T3,$H2,$H0 # h3*r1
1162 vpmuludq $T2,$H2,$H1 # h2*r1
1165 vpmuludq $T1,$H2,$H0 # h1*r1
1167 vpmuludq $T0,$H2,$H2 # h0*r1
1168 vpaddq $H2,$D1,$D1 # d1 += h0*r1
1172 vpshufd \$0x10,`16*4-64`($ctx),$H2 # s2^n
1180 vpmuludq $T4,$H2,$H1 # h4*s2
1183 vpmuludq $T3,$H2,$H2 # h3*s2
1184 vpaddq $H2,$D0,$D0 # d0 += h3*s2
1190 vpshufd \$0x10,`16*7-64`($ctx),$H2 # r4^n
1199 vpmuludq $T0,$H2,$H2 # h0*r4
1200 vpaddq $H2,$D4,$D4 # h4 = d4 + h0*r4
1215 vpsrldq \$6,$H0,$H2 # splat input
1219 vpunpcklqdq $H3,$H2,$H3 # 2:3
1224 vpsrlq \$4,$H3,$H2
1227 vpand $MASK,$H2,$H2 # 2
1234 vpaddq 0x20(%r11),$H2,$H2
1245 vpmuludq $H2,$T4,$T0 # h2*r0
1256 vpmuludq $H2,$T2,$T1 # h2*r1
1267 vpmuludq $H2,$T4,$T1 # h2*r2
1290 vpmuludq $H2,$T4,$T4 # h2*s3
1299 vpmuludq $H2,$T3,$T1 # h2*s4
1341 vpsrlq \$26,$D2,$H2
1343 vpaddq $H2,$D3,$D3 # h2 -> h3
1442 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1567 vmovd $h0#d,%x#$H2
1675 vmovd $h0#d,%x#$H2
1712 vmovd 4*2($ctx),%x#$H2
1807 vpaddq $H2,$T2,$H2 # accumulate input
1821 #vpaddq $H2,$T2,$H2 # accumulate input
1847 vpmuludq $H2,$T0,$D2 # d2 = h2*r0
1848 vpmuludq $H2,$T1,$D3 # d3 = h2*r1
1849 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1850 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
1851 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
1854 vpmuludq $H1,$T1,$H2 # h1*r1, borrow $H2 as temp
1856 vpaddq $H2,$D2,$D2 # d2 += h1*r1
1858 vpmuludq `32*2`(%rsp),$H4,$H2 # h4*s1
1860 vpaddq $H2,$D0,$D0 # d0 += h4*s1
1864 vpmuludq $H1,$T0,$H2 # h1*r0
1866 vpaddq $H2,$D1,$D1 # d1 += h1*r0
1868 vpmuludq $H4,$T0,$H2 # h4*r0
1871 vpaddq $H2,$D4,$D4 # d4 += h4*r0
1875 vpmuludq $H4,$T1,$H2 # h4*s2
1878 vpaddq $H2,$D1,$D1 # d1 += h4*s2
1879 vmovdqa `32*5-0x90`(%rax),$H2 # r3
1887 vpmuludq $H1,$H2,$T4 # h1*r3
1888 vpmuludq $H0,$H2,$H2 # h0*r3
1891 vpaddq $H2,$D3,$D3 # d3 += h0*r3
1893 vpmuludq $H4,$T3,$H2 # h4*s3
1896 vpaddq $H2,$D2,$D2 # d2 += h4*s3
1902 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*r4
1929 vpaddq $D1,$H2,$H2 # h1 -> h2
1938 vpsrlq \$26,$H2,$D2
1939 vpand $MASK,$H2,$H2
1942 vpaddq $T2,$H2,$H2 # modulo-scheduled
1971 #vpaddq $H2,$T2,$H2 # accumulate input
1982 vpmuludq $H2,$T0,$D2 # d2 = h2*r0
1983 vpmuludq $H2,$T1,$D3 # d3 = h2*r1
1984 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1985 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
1986 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
1989 vpmuludq $H1,$T1,$H2 # h1*r1
1991 vpaddq $H2,$D2,$D2 # d2 += h1*r1
1993 vpmuludq `32*2+4`(%rsp),$H4,$H2 # h4*s1
1995 vpaddq $H2,$D0,$D0 # d0 += h4*s1
1998 vpmuludq $H1,$T0,$H2 # h1*r0
2001 vpaddq $H2,$D1,$D1 # d1 += h1*r0
2003 vpmuludq $H4,$T0,$H2 # h4*r0
2005 vpaddq $H2,$D4,$D4 # d4 += h4*r0
2008 vpmuludq $H4,$T1,$H2 # h4*s2
2010 vpaddq $H2,$D1,$D1 # d1 += h4*s2
2011 vmovdqu `32*5+4-0x90`(%rax),$H2 # r3
2017 vpmuludq $H1,$H2,$T4 # h1*r3
2018 vpmuludq $H0,$H2,$H2 # h0*r3
2020 vpaddq $H2,$D3,$D3 # d3 += h0*r3
2022 vpmuludq $H4,$T3,$H2 # h4*s3
2024 vpaddq $H2,$D2,$D2 # d2 += h4*s3
2028 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*r4
2040 vpsrldq \$8,$H2,$T2
2045 vpaddq $T2,$H2,$H2
2054 vpermq \$0x2,$H2,$T2
2059 vpaddq $T2,$H2,$H2
2077 vpaddq $D1,$H2,$H2 # h1 -> h2
2083 vpsrlq \$26,$H2,$D2
2084 vpand $MASK,$H2,$H2
2097 vmovd %x#$H2,`4*2-48-64`($ctx)
2139 map(s/%y/%z/,($H0,$H1,$H2,$H3,$H4));
2363 vpaddq $H2,$T2,$H2 # accumulate input
2381 #vpaddq $H2,$T2,$H2 # accumulate input
2398 vpmuludq $H2,$R1,$D3 # d3 = h2*r1
2400 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2402 vpmuludq $H2,$S3,$D0 # d0 = h2*s3
2404 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2406 vpmuludq $H2,$R0,$D2 # d2 = h2*r0
2460 vpaddq $M2,$D2,$H2 # h2 = d3 + h4*s3
2485 vpaddq $D1,$H2,$H2 # h1 -> h2
2491 vpaddq $T2,$H2,$H2 # modulo-scheduled
2494 vpsrlq \$26,$H2,$D2
2495 vpandq $MASK,$H2,$H2
2538 #vpaddq $H2,$T2,$H2 # accumulate input
2541 vpmuludq $H2,$R1,$D3 # d3 = h2*r1
2542 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2543 vpmuludq $H2,$S3,$D0 # d0 = h2*s3
2545 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2547 vpmuludq $H2,$R0,$D2 # d2 = h2*r0
2600 vpaddq $M2,$D2,$H2 # h2 = d3 + h4*s3
2610 vpermq \$0xb1,$H2,$D2
2615 vpaddq $D2,$H2,$H2
2622 vpermq \$0x2,$H2,$D2
2627 vpaddq $D2,$H2,$H2
2633 vextracti64x4 \$0x1,$H2,%y#$D2
2638 vpaddq $D2,$H2,${H2}{%k3}{z}
2641 map(s/%z/%y/,($H0,$H1,$H2,$H3,$H4, $D0,$D1,$D2,$D3,$D4, $MASK));
2666 vpaddq $D1,$H2,$H2 # h1 -> h2
2674 vpsrlq \$26,$H2,$D2
2675 vpand $MASK,$H2,$H2
2682 vpaddq $H2,$T2,$H2 # accumulate input for .Ltail_avx2
2696 vpsubq $T2,$H2,$H2 # undo input accumulation
2699 vmovd %x#$H2,`4*2-48-64`($ctx)
2802 my ($H0,$H1,$H2,$r2r1r0,$r1r0s2,$r0s2s1,$Dlo,$Dhi) = map("%ymm$_",(0..5,16,17));
2870 vpermq \$0b10101010,$Dlo,${H2}{%k7}{z}
2881 vpmadd52luq $r0s2s1,$H2,$Dlo
2882 vpmadd52huq $r0s2s1,$H2,$Dhi
2928 my ($H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2) = map("%ymm$_",(0..5,16,17));
2956 vmovq 16($ctx),%x#$H2
2986 vpaddq $T2,$H2,$H2 # accumulate input
3001 vmovq 56($ctx),%x#$H2
3008 vmovdqa $H2,$R2
3014 vpmadd52luq $H2,$S1,$D0lo
3016 vpmadd52huq $H2,$S1,$D0hi
3018 vpmadd52luq $H2,$S2,$D1lo
3020 vpmadd52huq $H2,$S2,$D1hi
3022 vpmadd52luq $H2,$R0,$D2lo
3024 vpmadd52huq $H2,$R0,$D2hi
3058 vpandq $mask42,$D2lo,$H2
3076 vpunpcklqdq $R2,$H2,$R2
3077 vpbroadcastq %x#$H2,%x#$H2
3094 vinserti128 \$1,%x#$R2,$H2,$R2
3107 vmovq 16($ctx),%x#$H2
3156 vpaddq $T2,$H2,$H2 # accumulate input
3168 #vpaddq $T2,$H2,$H2 # accumulate input
3173 vpmadd52luq $H2,$S1,$D0lo
3175 vpmadd52huq $H2,$S1,$D0hi
3177 vpmadd52luq $H2,$S2,$D1lo
3179 vpmadd52huq $H2,$S2,$D1hi
3181 vpmadd52luq $H2,$R0,$D2lo
3183 vpmadd52huq $H2,$R0,$D2hi
3227 vpandq $mask42,$D2lo,$H2
3230 vpaddq $T2,$H2,$H2 # accumulate input
3257 #vpaddq $T2,$H2,$H2 # accumulate input
3262 vpmadd52luq $H2,$S1,$D0lo
3264 vpmadd52huq $H2,$S1,$D0hi
3266 vpmadd52luq $H2,$S2,$D1lo
3268 vpmadd52huq $H2,$S2,$D1hi
3270 vpmadd52luq $H2,$R0,$D2lo
3272 vpmadd52huq $H2,$R0,$D2hi
3300 vpsrldq \$8,$D2hi,$H2
3306 vpaddq $H2,$D2hi,$D2hi
3313 vpermq \$0x2,$D2hi,$H2
3317 vpaddq $H2,$D2hi,${D2hi}{%k1}{z}
3337 vpandq $mask42,$D2lo,$H2
3356 vmovq %x#$H2,16($ctx)
3371 my ($H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2) = map("%ymm$_",(0..5,16,17));
3395 vmovq 16($ctx),%x#$H2
3484 map(s/%y/%z/, $H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2);
3522 vpaddq $T2,$H2,$H2 # accumulate input
3535 #vpaddq $T2,$H2,$H2 # accumulate input
3540 vpmadd52luq $H2,$S1,$D0lo
3542 vpmadd52huq $H2,$S1,$D0hi
3544 vpmadd52luq $H2,$S2,$D1lo
3546 vpmadd52huq $H2,$S2,$D1hi
3548 vpmadd52luq $H2,$R0,$D2lo
3550 vpmadd52huq $H2,$R0,$D2hi
3594 vpandq $mask42,$D2lo,$H2
3597 vpaddq $T2,$H2,$H2 # accumulate input
3614 #vpaddq $T2,$H2,$H2 # accumulate input
3619 vpmadd52luq $H2,$SS1,$D0lo
3621 vpmadd52huq $H2,$SS1,$D0hi
3623 vpmadd52luq $H2,$SS2,$D1lo
3625 vpmadd52huq $H2,$SS2,$D1hi
3627 vpmadd52luq $H2,$RR0,$D2lo
3629 vpmadd52huq $H2,$RR0,$D2hi
3657 vpsrldq \$8,$D2hi,$H2
3663 vpaddq $H2,$D2hi,$D2hi
3670 vpermq \$0x2,$D2hi,$H2
3676 vpaddq $H2,$D2hi,$D2hi
3681 vextracti64x4 \$1,$D2hi,%y#$H2
3684 map(s/%z/%y/, $H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2);
3694 vpaddq $H2,$D2hi,${D2hi}{%k1}{z}
3714 vpandq $mask42,$D2lo,$H2
3731 vmovq %x#$H2,16($ctx)