98 lines
2.3 KiB
Raku
98 lines
2.3 KiB
Raku
#!/usr/local/bin/perl
|
|
# alpha assember
|
|
|
|
sub mul_add_c
|
|
{
|
|
local($a,$b,$c0,$c1,$c2)=@_;
|
|
local($l1,$h1,$t1,$t2);
|
|
|
|
print STDERR "count=$cnt\n"; $cnt++;
|
|
&mul($a,$b,($l1)=&NR(1));
|
|
&muh($a,$b,($h1)=&NR(1));
|
|
&add($c0,$l1,$c0);
|
|
&cmpult($c0,$l1,($t1)=&NR(1)); &FR($l1);
|
|
&add($t1,$h1,$h1); &FR($t1);
|
|
&add($c1,$h1,$c1);
|
|
&cmpult($c1,$h1,($t2)=&NR(1)); &FR($h1);
|
|
&add($c2,$t2,$c2); &FR($t2);
|
|
}
|
|
|
|
sub bn_mul_comba4
|
|
{
|
|
local($name)=@_;
|
|
local(@a,@b,$r,$c0,$c1,$c2);
|
|
|
|
$cnt=1;
|
|
&init_pool(3);
|
|
|
|
$rp=&wparam(0);
|
|
$ap=&wparam(1);
|
|
$bp=&wparam(2);
|
|
|
|
&function_begin($name,"");
|
|
|
|
&comment("");
|
|
|
|
&ld(($a[0])=&NR(1),&QWPw(0,$ap));
|
|
&ld(($b[0])=&NR(1),&QWPw(0,$bp));
|
|
&ld(($a[1])=&NR(1),&QWPw(1,$ap));
|
|
&ld(($b[1])=&NR(1),&QWPw(1,$bp));
|
|
&ld(($a[2])=&NR(1),&QWPw(2,$ap));
|
|
&ld(($b[2])=&NR(1),&QWPw(2,$bp));
|
|
&ld(($a[3])=&NR(1),&QWPw(3,$ap)); &FR($ap);
|
|
&ld(($b[3])=&NR(1),&QWPw(3,$bp)); &FR($bp);
|
|
|
|
($c0,$c1,$c2)=&NR(3);
|
|
&mov("zero",$c2);
|
|
&mul($a[0],$b[0],$c0);
|
|
&muh($a[0],$b[0],$c1);
|
|
&st($c0,&QWPw(0,$rp)); &FR($c0); ($c0)=&NR($c0);
|
|
($c0,$c1,$c2)=($c1,$c2,$c0);
|
|
&mov("zero",$c2);
|
|
|
|
&mul_add_c($a[0],$b[1],$c0,$c1,$c2);
|
|
&mul_add_c($a[1],$b[0],$c0,$c1,$c2);
|
|
&st($c0,&QWPw(1,$rp)); &FR($c0); ($c0)=&NR($c0);
|
|
($c0,$c1,$c2)=($c1,$c2,$c0);
|
|
&mov("zero",$c2);
|
|
|
|
&mul_add_c($a[1],$b[1],$c0,$c1,$c2);
|
|
&mul_add_c($a[0],$b[2],$c0,$c1,$c2);
|
|
&mul_add_c($a[2],$b[0],$c0,$c1,$c2);
|
|
&st($c0,&QWPw(2,$rp)); &FR($c0); ($c0)=&NR($c0);
|
|
($c0,$c1,$c2)=($c1,$c2,$c0);
|
|
&mov("zero",$c2);
|
|
|
|
&mul_add_c($a[0],$b[3],$c0,$c1,$c2); &FR($a[0]);
|
|
&mul_add_c($a[1],$b[2],$c0,$c1,$c2);
|
|
&mul_add_c($a[2],$b[1],$c0,$c1,$c2);
|
|
&mul_add_c($a[3],$b[0],$c0,$c1,$c2); &FR($b[0]);
|
|
&st($c0,&QWPw(3,$rp)); &FR($c0); ($c0)=&NR($c0);
|
|
($c0,$c1,$c2)=($c1,$c2,$c0);
|
|
&mov("zero",$c2);
|
|
|
|
&mul_add_c($a[1],$b[3],$c0,$c1,$c2); &FR($a[1]);
|
|
&mul_add_c($a[2],$b[2],$c0,$c1,$c2);
|
|
&mul_add_c($a[3],$b[1],$c0,$c1,$c2); &FR($b[1]);
|
|
&st($c0,&QWPw(4,$rp)); &FR($c0); ($c0)=&NR($c0);
|
|
($c0,$c1,$c2)=($c1,$c2,$c0);
|
|
&mov("zero",$c2);
|
|
|
|
&mul_add_c($a[2],$b[3],$c0,$c1,$c2); &FR($a[2]);
|
|
&mul_add_c($a[3],$b[2],$c0,$c1,$c2); &FR($b[2]);
|
|
&st($c0,&QWPw(5,$rp)); &FR($c0); ($c0)=&NR($c0);
|
|
($c0,$c1,$c2)=($c1,$c2,$c0);
|
|
&mov("zero",$c2);
|
|
|
|
&mul_add_c($a[3],$b[3],$c0,$c1,$c2); &FR($a[3],$b[3]);
|
|
&st($c0,&QWPw(6,$rp));
|
|
&st($c1,&QWPw(7,$rp));
|
|
|
|
&FR($c0,$c1,$c2);
|
|
|
|
&function_end($name);
|
|
|
|
&fin_pool;
|
|
}
|
|
|
|
1;
|