Lines Matching refs:H2

420 my ($H0,$H1,$H2,$H3,$H4, $T0,$T1,$T2,$T3,$T4, $D0,$D1,$D2,$D3,$D4, $MASK) =
715 vmovd $h0#d,$H2
817 vmovd $h0#d,$H2
847 vmovd 4*2($ctx),$H2
982 vmovdqa $H2,0x20(%r11) # offload hash
984 vmovdqa 0x10(%rsp),$H2 # r1^2
991 vpmuludq $T3,$H2,$H1 # h3*r1
995 vpmuludq $T2,$H2,$H0 # h2*r1
996 vpmuludq $T1,$H2,$H1 # h1*r1
1001 vpmuludq $T0,$H2,$H2 # h0*r1
1003 vpaddq $H2,$D1,$D1 # d1 += h0*r1
1010 vmovdqa 0x50(%rsp),$H2 # r3^2
1019 vpmuludq $T1,$H2,$H1 # h1*r3
1020 vpmuludq $T0,$H2,$H2 # h0*r3
1022 vpaddq $H2,$D3,$D3 # d3 += h0*r3
1036 vpsrldq \$6,$H0,$H2 # splat input
1048 vpunpcklqdq $H3,$H2,$H3 # 2:3
1054 vpsrlq \$4,$H3,$H2
1058 vpand $MASK,$H2,$H2 # 2
1064 vpaddq 0x20(%r11),$H2,$H2
1087 vpmuludq $H2,$T4,$T0 # h2*r0
1096 vpmuludq $H2,$T2,$T1 # h2*r1
1107 vpmuludq $H2,$T3,$T0 # h2*r2
1129 vpmuludq $H2,$T3,$T3 # h2*s3
1134 vpmuludq $H2,$T4,$H2 # h2*s4
1137 vpaddq $H2,$D1,$D1 # d1 += h2*s4
1140 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
1181 vpaddq $D1,$H2,$H2 # h1 -> h2
1187 vpsrlq \$26,$H2,$D2
1188 vpand $MASK,$H2,$H2
1209 vpaddq $H2,$T2,$T2
1216 vmovdqa $H2,0x20(%r11)
1230 vpshufd \$0x10,`16*1-64`($ctx),$H2 # r1^n
1235 vpmuludq $T3,$H2,$H0 # h3*r1
1238 vpmuludq $T2,$H2,$H1 # h2*r1
1241 vpmuludq $T1,$H2,$H0 # h1*r1
1243 vpmuludq $T0,$H2,$H2 # h0*r1
1244 vpaddq $H2,$D1,$D1 # d1 += h0*r1
1248 vpshufd \$0x10,`16*4-64`($ctx),$H2 # s2^n
1256 vpmuludq $T4,$H2,$H1 # h4*s2
1259 vpmuludq $T3,$H2,$H2 # h3*s2
1260 vpaddq $H2,$D0,$D0 # d0 += h3*s2
1266 vpshufd \$0x10,`16*7-64`($ctx),$H2 # r4^n
1275 vpmuludq $T0,$H2,$H2 # h0*r4
1276 vpaddq $H2,$D4,$D4 # h4 = d4 + h0*r4
1291 vpsrldq \$6,$H0,$H2 # splat input
1295 vpunpcklqdq $H3,$H2,$H3 # 2:3
1300 vpsrlq \$4,$H3,$H2
1303 vpand $MASK,$H2,$H2 # 2
1310 vpaddq 0x20(%r11),$H2,$H2
1321 vpmuludq $H2,$T4,$T0 # h2*r0
1332 vpmuludq $H2,$T2,$T1 # h2*r1
1343 vpmuludq $H2,$T4,$T1 # h2*r2
1366 vpmuludq $H2,$T4,$T4 # h2*s3
1375 vpmuludq $H2,$T3,$T1 # h2*s4
1417 vpsrlq \$26,$D2,$H2
1419 vpaddq $H2,$D3,$D3 # h2 -> h3
1517 my ($H0,$H1,$H2,$H3,$H4, $MASK, $T4,$T0,$T1,$T2,$T3, $D0,$D1,$D2,$D3,$D4) =
1643 vmovd $h0#d,%x#$H2
1750 vmovd $h0#d,%x#$H2
1791 vmovd 4*2($ctx),%x#$H2
1890 vpaddq $H2,$T2,$H2 # accumulate input
1904 #vpaddq $H2,$T2,$H2 # accumulate input
1930 vpmuludq $H2,$T0,$D2 # d2 = h2*r0
1931 vpmuludq $H2,$T1,$D3 # d3 = h2*r1
1932 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1933 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
1934 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
1937 vpmuludq $H1,$T1,$H2 # h1*r1, borrow $H2 as temp
1939 vpaddq $H2,$D2,$D2 # d2 += h1*r1
1941 vpmuludq `32*2`(%rsp),$H4,$H2 # h4*s1
1943 vpaddq $H2,$D0,$D0 # d0 += h4*s1
1947 vpmuludq $H1,$T0,$H2 # h1*r0
1949 vpaddq $H2,$D1,$D1 # d1 += h1*r0
1951 vpmuludq $H4,$T0,$H2 # h4*r0
1954 vpaddq $H2,$D4,$D4 # d4 += h4*r0
1958 vpmuludq $H4,$T1,$H2 # h4*s2
1961 vpaddq $H2,$D1,$D1 # d1 += h4*s2
1962 vmovdqa `32*5-0x90`(%rax),$H2 # r3
1970 vpmuludq $H1,$H2,$T4 # h1*r3
1971 vpmuludq $H0,$H2,$H2 # h0*r3
1974 vpaddq $H2,$D3,$D3 # d3 += h0*r3
1976 vpmuludq $H4,$T3,$H2 # h4*s3
1979 vpaddq $H2,$D2,$D2 # d2 += h4*s3
1985 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*r4
2012 vpaddq $D1,$H2,$H2 # h1 -> h2
2021 vpsrlq \$26,$H2,$D2
2022 vpand $MASK,$H2,$H2
2025 vpaddq $T2,$H2,$H2 # modulo-scheduled
2054 #vpaddq $H2,$T2,$H2 # accumulate input
2065 vpmuludq $H2,$T0,$D2 # d2 = h2*r0
2066 vpmuludq $H2,$T1,$D3 # d3 = h2*r1
2067 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
2068 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
2069 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2072 vpmuludq $H1,$T1,$H2 # h1*r1
2074 vpaddq $H2,$D2,$D2 # d2 += h1*r1
2076 vpmuludq `32*2+4`(%rsp),$H4,$H2 # h4*s1
2078 vpaddq $H2,$D0,$D0 # d0 += h4*s1
2081 vpmuludq $H1,$T0,$H2 # h1*r0
2084 vpaddq $H2,$D1,$D1 # d1 += h1*r0
2086 vpmuludq $H4,$T0,$H2 # h4*r0
2088 vpaddq $H2,$D4,$D4 # d4 += h4*r0
2091 vpmuludq $H4,$T1,$H2 # h4*s2
2093 vpaddq $H2,$D1,$D1 # d1 += h4*s2
2094 vmovdqu `32*5+4-0x90`(%rax),$H2 # r3
2100 vpmuludq $H1,$H2,$T4 # h1*r3
2101 vpmuludq $H0,$H2,$H2 # h0*r3
2103 vpaddq $H2,$D3,$D3 # d3 += h0*r3
2105 vpmuludq $H4,$T3,$H2 # h4*s3
2107 vpaddq $H2,$D2,$D2 # d2 += h4*s3
2111 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*r4
2123 vpsrldq \$8,$H2,$T2
2128 vpaddq $T2,$H2,$H2
2137 vpermq \$0x2,$H2,$T2
2142 vpaddq $T2,$H2,$H2
2160 vpaddq $D1,$H2,$H2 # h1 -> h2
2166 vpsrlq \$26,$H2,$D2
2167 vpand $MASK,$H2,$H2
2180 vmovd %x#$H2,`4*2-48-64`($ctx)
2214 map(s/%y/%z/,($H0,$H1,$H2,$H3,$H4));
2435 vpaddq $H2,$T2,$H2 # accumulate input
2453 #vpaddq $H2,$T2,$H2 # accumulate input
2470 vpmuludq $H2,$R1,$D3 # d3 = h2*r1
2472 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2474 vpmuludq $H2,$S3,$D0 # d0 = h2*s3
2476 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2478 vpmuludq $H2,$R0,$D2 # d2 = h2*r0
2532 vpaddq $M2,$D2,$H2 # h2 = d3 + h4*s3
2557 vpaddq $D1,$H2,$H2 # h1 -> h2
2563 vpaddq $T2,$H2,$H2 # modulo-scheduled
2566 vpsrlq \$26,$H2,$D2
2567 vpandq $MASK,$H2,$H2
2610 #vpaddq $H2,$T2,$H2 # accumulate input
2613 vpmuludq $H2,$R1,$D3 # d3 = h2*r1
2614 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2615 vpmuludq $H2,$S3,$D0 # d0 = h2*s3
2617 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2619 vpmuludq $H2,$R0,$D2 # d2 = h2*r0
2672 vpaddq $M2,$D2,$H2 # h2 = d3 + h4*s3
2682 vpermq \$0xb1,$H2,$D2
2687 vpaddq $D2,$H2,$H2
2694 vpermq \$0x2,$H2,$D2
2699 vpaddq $D2,$H2,$H2
2705 vextracti64x4 \$0x1,$H2,%y#$D2
2710 vpaddq $D2,$H2,${H2}{%k3}{z}
2713 map(s/%z/%y/,($H0,$H1,$H2,$H3,$H4, $D0,$D1,$D2,$D3,$D4, $MASK));
2738 vpaddq $D1,$H2,$H2 # h1 -> h2
2746 vpsrlq \$26,$H2,$D2
2747 vpand $MASK,$H2,$H2
2754 vpaddq $H2,$T2,$H2 # accumulate input for .Ltail_avx2
2768 vpsubq $T2,$H2,$H2 # undo input accumulation
2771 vmovd %x#$H2,`4*2-48-64`($ctx)
2900 my ($H0,$H1,$H2,$r2r1r0,$r1r0s2,$r0s2s1,$Dlo,$Dhi) = map("%ymm$_",(0..5,16,17));
2966 vpermq \$0b10101010,$Dlo,${H2}{%k7}{z}
2977 vpmadd52luq $r0s2s1,$H2,$Dlo
2978 vpmadd52huq $r0s2s1,$H2,$Dhi
3023 my ($H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2) = map("%ymm$_",(0..5,16,17));
3050 vmovq 16($ctx),%x#$H2
3080 vpaddq $T2,$H2,$H2 # accumulate input
3095 vmovq 56($ctx),%x#$H2
3102 vmovdqa $H2,$R2
3108 vpmadd52luq $H2,$S1,$D0lo
3110 vpmadd52huq $H2,$S1,$D0hi
3112 vpmadd52luq $H2,$S2,$D1lo
3114 vpmadd52huq $H2,$S2,$D1hi
3116 vpmadd52luq $H2,$R0,$D2lo
3118 vpmadd52huq $H2,$R0,$D2hi
3152 vpandq $mask42,$D2lo,$H2
3170 vpunpcklqdq $R2,$H2,$R2
3171 vpbroadcastq %x#$H2,%x#$H2
3188 vinserti128 \$1,%x#$R2,$H2,$R2
3201 vmovq 16($ctx),%x#$H2
3250 vpaddq $T2,$H2,$H2 # accumulate input
3262 #vpaddq $T2,$H2,$H2 # accumulate input
3267 vpmadd52luq $H2,$S1,$D0lo
3269 vpmadd52huq $H2,$S1,$D0hi
3271 vpmadd52luq $H2,$S2,$D1lo
3273 vpmadd52huq $H2,$S2,$D1hi
3275 vpmadd52luq $H2,$R0,$D2lo
3277 vpmadd52huq $H2,$R0,$D2hi
3321 vpandq $mask42,$D2lo,$H2
3324 vpaddq $T2,$H2,$H2 # accumulate input
3351 #vpaddq $T2,$H2,$H2 # accumulate input
3356 vpmadd52luq $H2,$S1,$D0lo
3358 vpmadd52huq $H2,$S1,$D0hi
3360 vpmadd52luq $H2,$S2,$D1lo
3362 vpmadd52huq $H2,$S2,$D1hi
3364 vpmadd52luq $H2,$R0,$D2lo
3366 vpmadd52huq $H2,$R0,$D2hi
3394 vpsrldq \$8,$D2hi,$H2
3400 vpaddq $H2,$D2hi,$D2hi
3407 vpermq \$0x2,$D2hi,$H2
3411 vpaddq $H2,$D2hi,${D2hi}{%k1}{z}
3431 vpandq $mask42,$D2lo,$H2
3450 vmovq %x#$H2,16($ctx)
3464 my ($H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2) = map("%ymm$_",(0..5,16,17));
3487 vmovq 16($ctx),%x#$H2
3576 map(s/%y/%z/, $H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2);
3614 vpaddq $T2,$H2,$H2 # accumulate input
3627 #vpaddq $T2,$H2,$H2 # accumulate input
3632 vpmadd52luq $H2,$S1,$D0lo
3634 vpmadd52huq $H2,$S1,$D0hi
3636 vpmadd52luq $H2,$S2,$D1lo
3638 vpmadd52huq $H2,$S2,$D1hi
3640 vpmadd52luq $H2,$R0,$D2lo
3642 vpmadd52huq $H2,$R0,$D2hi
3686 vpandq $mask42,$D2lo,$H2
3689 vpaddq $T2,$H2,$H2 # accumulate input
3706 #vpaddq $T2,$H2,$H2 # accumulate input
3711 vpmadd52luq $H2,$SS1,$D0lo
3713 vpmadd52huq $H2,$SS1,$D0hi
3715 vpmadd52luq $H2,$SS2,$D1lo
3717 vpmadd52huq $H2,$SS2,$D1hi
3719 vpmadd52luq $H2,$RR0,$D2lo
3721 vpmadd52huq $H2,$RR0,$D2hi
3749 vpsrldq \$8,$D2hi,$H2
3755 vpaddq $H2,$D2hi,$D2hi
3762 vpermq \$0x2,$D2hi,$H2
3768 vpaddq $H2,$D2hi,$D2hi
3773 vextracti64x4 \$1,$D2hi,%y#$H2
3776 map(s/%z/%y/, $H0,$H1,$H2,$R0,$R1,$R2,$S1,$S2);
3786 vpaddq $H2,$D2hi,${D2hi}{%k1}{z}
3806 vpandq $mask42,$D2lo,$H2
3823 vmovq %x#$H2,16($ctx)