and added files
[bcm963xx.git] / userapps / opensource / openssl / crypto / bn / asm / alpha / mul_add.pl
diff --git a/userapps/opensource/openssl/crypto/bn/asm/alpha/mul_add.pl b/userapps/opensource/openssl/crypto/bn/asm/alpha/mul_add.pl
new file mode 100755 (executable)
index 0000000..0d6df69
--- /dev/null
@@ -0,0 +1,123 @@
+#!/usr/local/bin/perl
+# alpha assembler
+# bn_mul_add_words($name): generate the Alpha routine $name.  Judging by the loads, stores and carry chain below, it does rp[i] += ap[i]*word over count words, with the running carry kept in $cc.
+sub bn_mul_add_words
+       {       # $name is handed to function_begin/function_end; the emitter helpers (&ld, &mul, &NR, &FR, ...) are defined outside this file
+       local($name)=@_;
+       local($cc,$a,$b,$r,$couny);     # NOTE(review): $couny looks like a typo for $count; $count/$rp/$ap/$word are not localized by this statement
+       # init_pool/GR are defined elsewhere; $cc presumably names register r0 and serves as the running carry below -- confirm.
+       &init_pool(4);
+       ($cc)=GR("r0");
+       # Routine arguments in wparam() order: result pointer, source pointer, word count, multiplier word.
+       $rp=&wparam(0);
+       $ap=&wparam(1);
+       $count=&wparam(2);
+       $word=&wparam(3);
+
+       &function_begin($name,"");
+       # Bias count by -4 and clear the carry (operands presumably read "src, src, dest"); a negative result means fewer than 4 words, so go to "finish".
+       &comment("");
+       &sub($count,4,$count);
+        &mov("zero",$cc);
+       ###
+        &blt($count,&label("finish"));
+       # Preload ap[0] for the unrolled loop.  NOTE(review): last_loop assigns $a0 a fresh NR(1), so this register is never FR()'d in the visible code.
+       &ld(($a0)=&NR(1),&QWPw(0,$ap));
+       # The 4-way unrolled loop below is only stored as a string in $a; nothing in this sub evaluates it, so as written none of it is emitted.
+$a=<<'EOF';
+##########################################################
+       &set_label("loop");
+
+       &ld(($r0)=&NR(1),&QWPw(0,$rp));
+        &ld(($a1)=&NR(1),&QWPw(1,$ap));
+       &muh($a0,$word,($h0)=&NR(1));
+        &ld(($r1)=&NR(1),&QWPw(1,$rp));
+       &ld(($a2)=&NR(1),&QWPw(2,$ap));
+        ###
+       &mul($a0,$word,($l0)=&NR(1));   &FR($a0);
+        &ld(($r2)=&NR(1),&QWPw(2,$rp));
+       &muh($a1,$word,($h1)=&NR(1));
+        &ld(($a3)=&NR(1),&QWPw(3,$ap));
+       &mul($a1,$word,($l1)=&NR(1));   &FR($a1);
+        &ld(($r3)=&NR(1),&QWPw(3,$rp));
+       &add($r0,$l0,$r0);
+        &add($r1,$l1,$r1);
+       &cmpult($r0,$l0,($t0)=&NR(1));  &FR($l0);
+        &cmpult($r1,$l1,($t1)=&NR(1)); &FR($l1);
+       &muh($a2,$word,($h2)=&NR(1));
+        &add($r0,$cc,$r0);
+       &add($h0,$t0,$h0);              &FR($t0);
+        &cmpult($r0,$cc,$cc);
+       &add($h1,$t1,$h1);              &FR($t1);
+        &add($h0,$cc,$cc);             &FR($h0);
+       &mul($a2,$word,($l2)=&NR(1));   &FR($a2);
+        &add($r1,$cc,$r1);
+       &cmpult($r1,$cc,$cc);
+        &add($r2,$l2,$r2);
+       &add($h1,$cc,$cc);              &FR($h1);
+        &cmpult($r2,$l2,($t2)=&NR(1)); &FR($l2);
+       &muh($a3,$word,($h3)=&NR(1));
+        &add($r2,$cc,$r2);
+       &st($r0,&QWPw(0,$rp)); &FR($r0);
+        &add($h2,$t2,$h2);             &FR($t2);
+       &st($r1,&QWPw(1,$rp)); &FR($r1);
+        &cmpult($r2,$cc,$cc);
+       &mul($a3,$word,($l3)=&NR(1));   &FR($a3);
+        &add($h2,$cc,$cc);             &FR($h2);
+       &st($r2,&QWPw(2,$rp)); &FR($r2);
+        &sub($count,4,$count); # count-=4
+        &add($rp,4*$QWS,$rp);  # count+=4
+       &add($r3,$l3,$r3);
+        &add($ap,4*$QWS,$ap);  # count+=4
+       &cmpult($r3,$l3,($t3)=&NR(1));  &FR($l3);
+        &add($r3,$cc,$r3);
+       &add($h3,$t3,$h3);              &FR($t3);
+        &cmpult($r3,$cc,$cc);
+       &st($r3,&QWPw(-1,$rp)); &FR($r3);
+        &add($h3,$cc,$cc);             &FR($h3);
+
+       ###
+        &blt($count,&label("finish"));
+       &ld(($a0)=&NR(1),&QWPw(0,$ap));
+        &br(&label("loop"));
+EOF
+##################################################
+       # Do the last 0..3 words, one per pass.  NOTE(review): since the unrolled loop above is not emitted, a count >= 4 also lands here with count already reduced by 4 -- confirm intent.
+
+       &set_label("last_loop");
+       # One word per pass: h0/l0 are presumably the high/low halves of ap[0]*word (muh/mul are defined elsewhere).
+       &ld(($a0)=&NR(1),&QWPw(0,$ap)); # get a
+        &ld(($r0)=&NR(1),&QWPw(0,$rp));        # get r (the word at rp[0])
+       ###
+        ###
+       &muh($a0,$word,($h0)=&NR(1));   &FR($a0);       # NOTE(review): $a0 is FR()'d here and again after &mul below -- confirm the double release is harmless
+        ### wait 8
+       &mul($a0,$word,($l0)=&NR(1));   &FR($a0);
+        &add($rp,$QWS,$rp);    # step rp by $QWS (presumably one word)
+       &add($ap,$QWS,$ap);     # step ap by $QWS
+        &sub($count,1,$count); # count--
+       ### wait 3 until l0 is available
+       &add($r0,$l0,$r0);      # r0 += l0
+        ###
+       &cmpult($r0,$l0,($t0)=&NR(1));  &FR($l0);       # t0 = carry out of r0 += l0 (presumably unsigned r0 < l0)
+        &add($r0,$cc,$r0);     # r0 += incoming carry
+       &add($h0,$t0,$h0);              &FR($t0);       # h0 += t0
+        &cmpult($r0,$cc,$cc);  # cc = carry out of r0 += cc
+       &add($h0,$cc,$cc);              &FR($h0);       # cc = h0 + cc: carry into the next word
+       # rp has already been advanced above, hence index -1 for the store.
+       &st($r0,&QWPw(-1,$rp));         &FR($r0);
+        &bgt($count,&label("last_loop"));      # more words left
+       &function_end_A($name); # NOTE(review): presumably the return path for this exit; helper not visible here
+
+######################################################
+       &set_label("finish");
+       &add($count,4,$count);  # undo the -4 bias: count = words still to do
+        &bgt($count,&label("last_loop"));      # any left -> last_loop, otherwise fall through to "end"
+
+       &set_label("end");
+       &function_end($name);
+
+       &fin_pool;
+       }
+
+1;     # true value, so that loading this file with require reports success