1#!/usr/local/bin/perl 2# alpha assember 3 4sub mul_add_c 5 { 6 local($a,$b,$c0,$c1,$c2)=@_; 7 local($l1,$h1,$t1,$t2); 8 9print STDERR "count=$cnt\n"; $cnt++; 10 &mul($a,$b,($l1)=&NR(1)); 11 &muh($a,$b,($h1)=&NR(1)); 12 &add($c0,$l1,$c0); 13 &cmpult($c0,$l1,($t1)=&NR(1)); &FR($l1); 14 &add($t1,$h1,$h1); &FR($t1); 15 &add($c1,$h1,$c1); 16 &cmpult($c1,$h1,($t2)=&NR(1)); &FR($h1); 17 &add($c2,$t2,$c2); &FR($t2); 18 } 19 20sub bn_mul_comba4 21 { 22 local($name)=@_; 23 local(@a,@b,$r,$c0,$c1,$c2); 24 25 $cnt=1; 26 &init_pool(3); 27 28 $rp=&wparam(0); 29 $ap=&wparam(1); 30 $bp=&wparam(2); 31 32 &function_begin($name,""); 33 34 &comment(""); 35 36 &ld(($a[0])=&NR(1),&QWPw(0,$ap)); 37 &ld(($b[0])=&NR(1),&QWPw(0,$bp)); 38 &ld(($a[1])=&NR(1),&QWPw(1,$ap)); 39 &ld(($b[1])=&NR(1),&QWPw(1,$bp)); 40 &ld(($a[2])=&NR(1),&QWPw(2,$ap)); 41 &ld(($b[2])=&NR(1),&QWPw(2,$bp)); 42 &ld(($a[3])=&NR(1),&QWPw(3,$ap)); &FR($ap); 43 &ld(($b[3])=&NR(1),&QWPw(3,$bp)); &FR($bp); 44 45 ($c0,$c1,$c2)=&NR(3); 46 &mov("zero",$c2); 47 &mul($a[0],$b[0],$c0); 48 &muh($a[0],$b[0],$c1); 49 &st($c0,&QWPw(0,$rp)); &FR($c0); ($c0)=&NR($c0); 50 ($c0,$c1,$c2)=($c1,$c2,$c0); 51 &mov("zero",$c2); 52 53 &mul_add_c($a[0],$b[1],$c0,$c1,$c2); 54 &mul_add_c($a[1],$b[0],$c0,$c1,$c2); 55 &st($c0,&QWPw(1,$rp)); &FR($c0); ($c0)=&NR($c0); 56 ($c0,$c1,$c2)=($c1,$c2,$c0); 57 &mov("zero",$c2); 58 59 &mul_add_c($a[1],$b[1],$c0,$c1,$c2); 60 &mul_add_c($a[0],$b[2],$c0,$c1,$c2); 61 &mul_add_c($a[2],$b[0],$c0,$c1,$c2); 62 &st($c0,&QWPw(2,$rp)); &FR($c0); ($c0)=&NR($c0); 63 ($c0,$c1,$c2)=($c1,$c2,$c0); 64 &mov("zero",$c2); 65 66 &mul_add_c($a[0],$b[3],$c0,$c1,$c2); &FR($a[0]); 67 &mul_add_c($a[1],$b[2],$c0,$c1,$c2); 68 &mul_add_c($a[2],$b[1],$c0,$c1,$c2); 69 &mul_add_c($a[3],$b[0],$c0,$c1,$c2); &FR($b[0]); 70 &st($c0,&QWPw(3,$rp)); &FR($c0); ($c0)=&NR($c0); 71 ($c0,$c1,$c2)=($c1,$c2,$c0); 72 &mov("zero",$c2); 73 74 &mul_add_c($a[1],$b[3],$c0,$c1,$c2); &FR($a[1]); 75 &mul_add_c($a[2],$b[2],$c0,$c1,$c2); 76 &mul_add_c($a[3],$b[1],$c0,$c1,$c2); &FR($b[1]); 77 &st($c0,&QWPw(4,$rp)); &FR($c0); ($c0)=&NR($c0); 78 ($c0,$c1,$c2)=($c1,$c2,$c0); 79 &mov("zero",$c2); 80 81 &mul_add_c($a[2],$b[3],$c0,$c1,$c2); &FR($a[2]); 82 &mul_add_c($a[3],$b[2],$c0,$c1,$c2); &FR($b[2]); 83 &st($c0,&QWPw(5,$rp)); &FR($c0); ($c0)=&NR($c0); 84 ($c0,$c1,$c2)=($c1,$c2,$c0); 85 &mov("zero",$c2); 86 87 &mul_add_c($a[3],$b[3],$c0,$c1,$c2); &FR($a[3],$b[3]); 88 &st($c0,&QWPw(6,$rp)); 89 &st($c1,&QWPw(7,$rp)); 90 91 &FR($c0,$c1,$c2); 92 93 &function_end($name); 94 95 &fin_pool; 96 } 97 981; 99