Lines Matching refs:h2

180 my ($h0,$h1,$h2)=("%r14","%rbx","%r10");
183 # input: copy of $r1 in %rax, $h0-$h2, $r0-$r1
184 # output: $h0-$h2 *= $r0-$r1
202 mov $h2,$h1 # borrow $h1
206 imulq $s1,$h1 # h2*s1
211 imulq $r0,$h2 # h2*r0
214 adc $h2,$d3
217 mov $d3,$h2
219 and \$3,$h2
223 adc \$0,$h2
331 mov 16($ctx),$h2
344 adc $padbit,$h2
359 mov $h2,16($ctx)
441 xor $h2,$h2
504 mov $h2,%rax
547 mov $h2,%rax
587 mov $h2,%rax
640 mov 16($ctx),$h2#d
660 mov $h2,$d1
662 shr \$24,$h2
664 adc \$0,$h2 # can be partially reduced...
667 mov $h2,$d1
668 and $h2,$d2
670 and \$3,$h2
674 adc \$0,$h2
684 adc $padbit,$h2
703 shl \$24,$h2
707 or $r1,$h2 # h[4]
716 vmovd $h2#d,$H4
723 mov $h2,16($ctx) # note that is_base2_26 is zeroed
732 mov $h2#d,16($ctx)
777 mov 16($ctx),$h2#d
790 adc $padbit,$h2
808 shl \$24,$h2
812 or $d2,$h2 # h[4]
818 vmovd $h2#d,$H4
970 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
971 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
972 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
973 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
974 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
982 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
994 vpmuludq $T2,$H2,$H0 # h2*r1
996 vpaddq $H0,$D3,$D3 # d3 += h2*r1
1001 vpmuludq $T2,$H3,$H0 # h2*r2
1005 vpaddq $H0,$D4,$D4 # d4 += h2*r2
1027 vpmuludq $T2,$H3,$H3 # h2*s3
1028 vpmuludq $T2,$H4,$T2 # h2*s4
1029 vpaddq $H3,$D0,$D0 # d0 += h2*s3
1032 vpaddq $T2,$D1,$D1 # d1 += h2*s4
1075 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
1076 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
1077 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1078 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
1079 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
1086 vpmuludq $H2,$T4,$T0 # h2*r0
1095 vpmuludq $H2,$T2,$T1 # h2*r1
1097 vpaddq $T1,$D3,$D3 # d3 += h2*r1
1106 vpmuludq $H2,$T3,$T0 # h2*r2
1108 vpaddq $T0,$D4,$D4 # d4 += h2*r2
1128 vpmuludq $H2,$T3,$T3 # h2*s3
1131 vpaddq $T3,$D0,$D0 # d0 += h2*s3
1133 vpmuludq $H2,$T4,$H2 # h2*s4
1136 vpaddq $H2,$D1,$D1 # d1 += h2*s4
1139 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
1180 vpaddq $D1,$H2,$H2 # h1 -> h2
1188 vpaddq $D2,$H3,$H3 # h2 -> h3
1221 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
1222 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
1223 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1224 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
1225 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
1227 vpmuludq $T2,$D4,$D2 # d2 = h2*r0
1237 vpmuludq $T2,$H2,$H1 # h2*r1
1238 vpaddq $H1,$D3,$D3 # d3 += h2*r1
1248 vpmuludq $T2,$H4,$H1 # h2*r2
1249 vpaddq $H1,$D4,$D4 # d4 += h2*r2
1271 vpmuludq $T2,$H4,$H4 # h2*s3
1272 vpaddq $H4,$D0,$D0 # d0 += h2*s3
1279 vpaddq $H0,$D2,$D2 # h2 = d2 + h3*s4
1280 vpmuludq $T2,$H3,$H1 # h2*s4
1281 vpaddq $H1,$D1,$D1 # h1 = d1 + h2*s4
1320 vpmuludq $H2,$T4,$T0 # h2*r0
1321 vpaddq $T0,$D2,$D2 # d2 += h2*r0
1331 vpmuludq $H2,$T2,$T1 # h2*r1
1332 vpaddq $T1,$D3,$D3 # d3 += h2*r1
1342 vpmuludq $H2,$T4,$T1 # h2*r2
1343 vpaddq $T1,$D4,$D4 # d4 += h2*r2
1365 vpmuludq $H2,$T4,$T4 # h2*s3
1366 vpaddq $T4,$D0,$D0 # d0 += h2*s3
1374 vpmuludq $H2,$T3,$T1 # h2*s4
1375 vpaddq $T1,$D1,$D1 # d1 += h2*s4
1410 vpaddq $H1,$D2,$D2 # h1 -> h2
1418 vpaddq $H2,$D3,$D3 # h2 -> h3
1484 adc \$0,%r10 # h2
1562 mov 16($ctx),$h2#d
1582 mov $h2,$d1
1584 shr \$24,$h2
1586 adc \$0,$h2 # can be partially reduced...
1589 mov $h2,$d1
1590 and $h2,$d2
1592 and \$3,$h2
1596 adc \$0,$h2
1607 adc $padbit,$h2
1631 shl \$24,$h2
1635 or $r1,$h2 # h[4]
1644 vmovd $h2#d,%x#$H4
1651 mov $h2,16($ctx) # note that is_base2_26 is zeroed
1660 mov $h2#d,16($ctx)
1705 mov 16($ctx),$h2#d
1719 adc $padbit,$h2
1741 shl \$24,$h2
1745 or $d2,$h2 # h[4]
1751 vmovd $h2#d,%x#$H4
1914 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
1915 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
1916 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1917 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
1918 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
1920 # however, as h2 is "chronologically" first one available pull
1923 # d4 = h2*r2 + h4*r0 + h3*r1 + h1*r3 + h0*r4
1924 # d3 = h2*r1 + h3*r0 + h1*r2 + h0*r3 + h4*5*r4
1925 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
1926 # d1 = h2*5*r4 + h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3
1927 # d0 = h2*5*r3 + h0*r0 + h4*5*r1 + h3*5*r2 + h1*5*r4
1929 vpmuludq $H2,$T0,$D2 # d2 = h2*r0
1930 vpmuludq $H2,$T1,$D3 # d3 = h2*r1
1931 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
1932 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
1933 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
1984 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
2011 vpaddq $D1,$H2,$H2 # h1 -> h2
2022 vpaddq $D2,$H3,$H3 # h2 -> h3
2064 vpmuludq $H2,$T0,$D2 # d2 = h2*r0
2065 vpmuludq $H2,$T1,$D3 # d3 = h2*r1
2066 vpmuludq $H2,$T2,$D4 # d4 = h2*r2
2067 vpmuludq $H2,$T3,$D0 # d0 = h2*s3
2068 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2110 vpaddq $H3,$D2,$H2 # h2 = d2 + h3*s4
2159 vpaddq $D1,$H2,$H2 # h1 -> h2
2167 vpaddq $D2,$H3,$H3 # h2 -> h3
2454 # d4 = h4*r0 + h3*r1 + h2*r2 + h1*r3 + h0*r4
2455 # d3 = h3*r0 + h2*r1 + h1*r2 + h0*r3 + h4*5*r4
2456 # d2 = h2*r0 + h1*r1 + h0*r2 + h4*5*r3 + h3*5*r4
2457 # d1 = h1*r0 + h0*r1 + h4*5*r2 + h3*5*r3 + h2*5*r4
2458 # d0 = h0*r0 + h4*5*r1 + h3*5*r2 + h2*5*r3 + h1*5*r4
2460 # however, as h2 is "chronologically" first one available pull
2463 # d3 = h2*r1 + h0*r3 + h1*r2 + h3*r0 + h4*5*r4
2464 # d4 = h2*r2 + h0*r4 + h1*r3 + h3*r1 + h4*r0
2465 # d0 = h2*5*r3 + h0*r0 + h1*5*r4 + h3*5*r2 + h4*5*r1
2466 # d1 = h2*5*r4 + h0*r1 + h1*r0 + h3*5*r3 + h4*5*r2
2467 # d2 = h2*r0 + h0*r2 + h1*r1 + h3*5*r4 + h4*5*r3
2469 vpmuludq $H2,$R1,$D3 # d3 = h2*r1
2471 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2473 vpmuludq $H2,$S3,$D0 # d0 = h2*s3
2475 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2477 vpmuludq $H2,$R0,$D2 # d2 = h2*r0
2531 vpaddq $M2,$D2,$H2 # h2 = d2 + h4*s3
2556 vpaddq $D1,$H2,$H2 # h1 -> h2
2567 vpaddq $D2,$D3,$H3 # h2 -> h3
2612 vpmuludq $H2,$R1,$D3 # d3 = h2*r1
2613 vpmuludq $H2,$R2,$D4 # d4 = h2*r2
2614 vpmuludq $H2,$S3,$D0 # d0 = h2*s3
2616 vpmuludq $H2,$S4,$D1 # d1 = h2*s4
2618 vpmuludq $H2,$R0,$D2 # d2 = h2*r0
2671 vpaddq $M2,$D2,$H2 # h2 = d2 + h4*s3
2737 vpaddq $D1,$H2,$H2 # h1 -> h2
2749 vpaddq $D2,$H3,$H3 # h2 -> h3