# Driver section: extends the module search path, initialises the
# assembler back end, then calls one generator per routine, passing the
# symbol name to emit.
6 push(@INC,"perlasm","../../perlasm"); # add both candidate perlasm directories to the search path
9 &asm_init($ARGV[0],"bn-586.pl"); # first command-line argument, plus (presumably) this script name
11 &bn_mul_add_words("bn_mul_add_words");
12 &bn_mul_words("bn_mul_words");
13 &bn_sqr_words("bn_sqr_words");
14 &bn_div64("bn_div64");
15 &bn_add_words("bn_add_words");
# Body of the multiply-add generator (labels prefixed maw_): an unrolled
# loop of 8 rounds per pass, then a tail of at most 7 single rounds.
# Each round adds the carry word c and the old *r into eax (with carries
# propagated into edx), stores eax back to *r and keeps edx as the next c.
# NOTE(review): the embedded line numbers are not contiguous, so some
# statements (whatever sets edx, advances the pointers and sets the flags
# tested by jnz/jz) are not visible here - confirm against the full file.
23 &function_begin($name,"");
33 &xor($c,$c); # c = 0: clear carry
34 &mov($r,&wparam(0)); # r = wparam(0)
36 &mov("ecx",&wparam(2)); # ecx = wparam(2), i.e. num
37 &mov($a,&wparam(1)); # a = wparam(1)
39 &and("ecx",0xfffffff8); # clear the low 3 bits: num rounded down to a multiple of 8
40 &mov($w,&wparam(3)); # w = wparam(3)
42 &push("ecx"); # Push a stack slot to use as a tmp variable
44 &jz(&label("maw_finish")); # masked count is zero: skip the unrolled loop
46 &set_label("maw_loop",0);
48 &mov(&swtmp(0),"ecx"); # save the count in the tmp variable
50 for ($i=0; $i<32; $i+=4) # 8 rounds, byte offsets 0,4,...,28
54 &mov("eax",&DWP($i,$a,"",0)); # load *a
56 &add("eax",$c); # L(t)+=c
57 &mov($c,&DWP($i,$r,"",0)); # load *r into c (the old c was consumed just above)
58 &adc("edx",0); # H(t)+=carry
59 &add("eax",$c); # L(t)+= *r
60 &adc("edx",0); # H(t)+=carry
61 &mov(&DWP($i,$r,"",0),"eax"); # *r= L(t);
62 &mov($c,"edx"); # c= H(t);
66 &mov("ecx",&swtmp(0)); # reload the count from the tmp variable
70 &jnz(&label("maw_loop")); # go round again while the result is non-zero
72 &set_label("maw_finish",0);
73 &mov("ecx",&wparam(2)); # get num
75 &jnz(&label("maw_finish2")); # helps branch prediction
76 &jmp(&label("maw_end"));
78 &set_label("maw_finish2",1);
79 for ($i=0; $i<7; $i++) # at most 7 leftover rounds
81 &comment("Tail Round $i");
82 &mov("eax",&DWP($i*4,$a,"",0));# load *a
84 &add("eax",$c); # L(t)+=c
85 &mov($c,&DWP($i*4,$r,"",0)); # load *r into c
86 &adc("edx",0); # H(t)+=carry
88 &adc("edx",0); # H(t)+=carry
89 &dec("ecx") if ($i != 7-1); # count down the leftovers; omitted in the last round
90 &mov(&DWP($i*4,$r,"",0),"eax"); # *r= L(t);
91 &mov($c,"edx"); # c= H(t);
92 &jz(&label("maw_end")) if ($i != 7-1); # leftover count reached zero: finished
94 &set_label("maw_end",0);
97 &pop("ecx"); # remove the tmp variable from the stack (pairs with the push above)
# Body of the multiply generator (labels prefixed mw_): an unrolled loop
# of 8 rounds per pass, then a tail of at most 7 single rounds. Each
# round adds the carry word c into eax (carry propagated into edx),
# stores eax to *r and keeps edx as the next c.
# NOTE(review): the embedded line numbers are not contiguous, so some
# statements (whatever sets edx, advances the pointers and sets the flags
# tested by the jumps) are not visible here - confirm against the full file.
106 &function_begin($name,"");
117 &xor($c,$c); # c = 0: clear carry
118 &mov($r,&wparam(0)); # r = wparam(0)
119 &mov($a,&wparam(1)); # a = wparam(1)
120 &mov($num,&wparam(2)); # num = wparam(2)
121 &mov($w,&wparam(3)); # w = wparam(3)
123 &and($num,0xfffffff8); # clear the low 3 bits: num rounded down to a multiple of 8
124 &jz(&label("mw_finish")); # masked count is zero: skip the unrolled loop
126 &set_label("mw_loop",0);
127 for ($i=0; $i<32; $i+=4) # 8 rounds, byte offsets 0,4,...,28
129 &comment("Round $i");
131 &mov("eax",&DWP($i,$a,"",0)); # load *a
133 &add("eax",$c); # L(t)+=c
136 &adc("edx",0); # H(t)+=carry
137 &mov(&DWP($i,$r,"",0),"eax"); # *r= L(t);
139 &mov($c,"edx"); # c= H(t);
146 &jz(&label("mw_finish")); # leave the unrolled loop on zero
147 &jmp(&label("mw_loop")); # otherwise go round again
149 &set_label("mw_finish",0);
150 &mov($num,&wparam(2)); # get num
152 &jnz(&label("mw_finish2")); # non-zero: run the tail rounds
153 &jmp(&label("mw_end"));
155 &set_label("mw_finish2",1);
156 for ($i=0; $i<7; $i++) # at most 7 leftover rounds
158 &comment("Tail Round $i");
159 &mov("eax",&DWP($i*4,$a,"",0));# load *a
161 &add("eax",$c); # L(t)+=c
163 &adc("edx",0); # H(t)+=carry
164 &mov(&DWP($i*4,$r,"",0),"eax");# *r= L(t);
165 &mov($c,"edx"); # c= H(t);
166 &dec($num) if ($i != 7-1); # count down the leftovers; omitted in the last round
167 &jz(&label("mw_end")) if ($i != 7-1); # leftover count reached zero: finished
169 &set_label("mw_end",0);
172 &function_end($name);
# Body of the squaring generator (labels prefixed sw_): an unrolled loop
# of 8 rounds per pass, then a tail of at most 7 single rounds. Each
# round loads one word of a, multiplies eax by itself and stores eax and
# edx as two consecutive words of r, so r is written at twice the byte
# offset used for a.
# NOTE(review): the embedded line numbers are not contiguous, so the
# statements that advance the pointers and set the flags tested by the
# jumps are not visible here - confirm against the full file.
179 &function_begin($name,"");
186 &mov($r,&wparam(0)); # r = wparam(0)
187 &mov($a,&wparam(1)); # a = wparam(1)
188 &mov($num,&wparam(2)); # num = wparam(2)
190 &and($num,0xfffffff8); # clear the low 3 bits: num rounded down to a multiple of 8
191 &jz(&label("sw_finish")); # masked count is zero: skip the unrolled loop
193 &set_label("sw_loop",0);
194 for ($i=0; $i<32; $i+=4) # 8 rounds, byte offsets 0,4,...,28 into a
196 &comment("Round $i");
197 &mov("eax",&DWP($i,$a,"",0)); # load *a
199 &mul("eax"); # *a * *a
200 &mov(&DWP($i*2,$r,"",0),"eax"); # store eax at byte offset 2*$i of r
201 &mov(&DWP($i*2+4,$r,"",0),"edx");# store edx in the next word of r
208 &jnz(&label("sw_loop")); # go round again while the result is non-zero
210 &set_label("sw_finish",0);
211 &mov($num,&wparam(2)); # get num
213 &jz(&label("sw_end")); # zero: no tail rounds needed
215 for ($i=0; $i<7; $i++) # at most 7 leftover rounds
217 &comment("Tail Round $i");
218 &mov("eax",&DWP($i*4,$a,"",0)); # load *a
220 &mul("eax"); # *a * *a
221 &mov(&DWP($i*8,$r,"",0),"eax"); # store eax at byte offset 8*$i of r
222 &dec($num) if ($i != 7-1); # count down the leftovers; omitted in the last round
223 &mov(&DWP($i*8+4,$r,"",0),"edx"); # store edx in the next word of r
224 &jz(&label("sw_end")) if ($i != 7-1); # leftover count reached zero: finished
226 &set_label("sw_end",0);
228 &function_end($name);
# Body of the bn_div64 generator: loads the first three parameters into
# edx, eax and ebx between function_begin and function_end.
# NOTE(review): the embedded line numbers skip 239, so the instruction
# that consumes these registers is not visible here - confirm against
# the full file.
235 &function_begin($name,"");
236 &mov("edx",&wparam(0)); # edx = wparam(0)
237 &mov("eax",&wparam(1)); # eax = wparam(1)
238 &mov("ebx",&wparam(2)); # ebx = wparam(2)
240 &function_end($name);
# Body of the add generator (labels prefixed aw_): an unrolled loop of 8
# rounds per pass, then a tail of at most 7 single rounds. Each visible
# round loads one word of a into tmp1 and one word of b into tmp2, then
# stores tmp1 to the matching word of r.
# NOTE(review): the embedded line numbers are not contiguous, so the
# arithmetic between the loads and the store, the pointer updates and
# the flag-setting statements are not visible here - confirm against
# the full file.
247 &function_begin($name,"");
258 &mov($r,&wparam(0)); # get r
259 &mov($a,&wparam(1)); # get a
260 &mov($b,&wparam(2)); # get b
261 &mov($num,&wparam(3)); # get num
262 &xor($c,$c); # clear carry
263 &and($num,0xfffffff8); # clear the low 3 bits: num rounded down to a multiple of 8
265 &jz(&label("aw_finish")); # masked count is zero: skip the unrolled loop
267 &set_label("aw_loop",0);
268 for ($i=0; $i<8; $i++) # 8 rounds, byte offsets 0,4,...,28
270 &comment("Round $i");
272 &mov($tmp1,&DWP($i*4,$a,"",0)); # load *a
273 &mov($tmp2,&DWP($i*4,$b,"",0)); # load *b
279 &mov(&DWP($i*4,$r,"",0),$tmp1); # store to *r
287 &jnz(&label("aw_loop")); # go round again while the result is non-zero
289 &set_label("aw_finish",0);
290 &mov($num,&wparam(3)); # get num
292 &jz(&label("aw_end")); # zero: no tail rounds needed
294 for ($i=0; $i<7; $i++) # at most 7 leftover rounds
296 &comment("Tail Round $i");
297 &mov($tmp1,&DWP($i*4,$a,"",0)); # load *a
298 &mov($tmp2,&DWP($i*4,$b,"",0));# load *b
304 &dec($num) if ($i != 6); # count down the leftovers; omitted in the last round
305 &mov(&DWP($i*4,$r,"",0),$tmp1); # store to *r
306 &jz(&label("aw_end")) if ($i != 6); # leftover count reached zero: finished
308 &set_label("aw_end",0);
312 &function_end($name);