diff options
Diffstat (limited to 'src/lib/libcrypto/bn/asm/bn-586.pl')
-rw-r--r-- | src/lib/libcrypto/bn/asm/bn-586.pl | 295 |
1 files changed, 287 insertions, 8 deletions
diff --git a/src/lib/libcrypto/bn/asm/bn-586.pl b/src/lib/libcrypto/bn/asm/bn-586.pl index 19d425ee96..33f6125920 100644 --- a/src/lib/libcrypto/bn/asm/bn-586.pl +++ b/src/lib/libcrypto/bn/asm/bn-586.pl | |||
@@ -1,18 +1,17 @@ | |||
1 | #!/usr/bin/perl | ||
2 | # | ||
3 | |||
4 | #!/usr/local/bin/perl | 1 | #!/usr/local/bin/perl |
5 | 2 | ||
6 | push(@INC,"perlasm","../../perlasm"); | 3 | push(@INC,"perlasm","../../perlasm"); |
7 | require "x86asm.pl"; | 4 | require "x86asm.pl"; |
8 | 5 | ||
9 | &asm_init($ARGV[0],"bn-586.pl"); | 6 | &asm_init($ARGV[0],$0); |
10 | 7 | ||
11 | &bn_mul_add_words("bn_mul_add_words"); | 8 | &bn_mul_add_words("bn_mul_add_words"); |
12 | &bn_mul_words("bn_mul_words"); | 9 | &bn_mul_words("bn_mul_words"); |
13 | &bn_sqr_words("bn_sqr_words"); | 10 | &bn_sqr_words("bn_sqr_words"); |
14 | &bn_div64("bn_div64"); | 11 | &bn_div_words("bn_div_words"); |
15 | &bn_add_words("bn_add_words"); | 12 | &bn_add_words("bn_add_words"); |
13 | &bn_sub_words("bn_sub_words"); | ||
14 | &bn_sub_part_words("bn_sub_part_words"); | ||
16 | 15 | ||
17 | &asm_finish(); | 16 | &asm_finish(); |
18 | 17 | ||
@@ -228,7 +227,7 @@ sub bn_sqr_words | |||
228 | &function_end($name); | 227 | &function_end($name); |
229 | } | 228 | } |
230 | 229 | ||
231 | sub bn_div64 | 230 | sub bn_div_words |
232 | { | 231 | { |
233 | local($name)=@_; | 232 | local($name)=@_; |
234 | 233 | ||
@@ -302,12 +301,292 @@ sub bn_add_words | |||
302 | &add($tmp1,$tmp2); | 301 | &add($tmp1,$tmp2); |
303 | &adc($c,0); | 302 | &adc($c,0); |
304 | &dec($num) if ($i != 6); | 303 | &dec($num) if ($i != 6); |
305 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *a | 304 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r |
306 | &jz(&label("aw_end")) if ($i != 6); | 305 | &jz(&label("aw_end")) if ($i != 6); |
307 | } | 306 | } |
308 | &set_label("aw_end",0); | 307 | &set_label("aw_end",0); |
309 | 308 | ||
310 | &mov("eax",$c); | 309 | # &mov("eax",$c); # $c is "eax" |
310 | |||
311 | &function_end($name); | ||
312 | } | ||
313 | |||
314 | sub bn_sub_words | ||
315 | { | ||
316 | local($name)=@_; | ||
317 | |||
318 | &function_begin($name,""); | ||
319 | |||
320 | &comment(""); | ||
321 | $a="esi"; | ||
322 | $b="edi"; | ||
323 | $c="eax"; | ||
324 | $r="ebx"; | ||
325 | $tmp1="ecx"; | ||
326 | $tmp2="edx"; | ||
327 | $num="ebp"; | ||
328 | |||
329 | &mov($r,&wparam(0)); # get r | ||
330 | &mov($a,&wparam(1)); # get a | ||
331 | &mov($b,&wparam(2)); # get b | ||
332 | &mov($num,&wparam(3)); # get num | ||
333 | &xor($c,$c); # clear carry | ||
334 | &and($num,0xfffffff8); # num / 8 | ||
335 | |||
336 | &jz(&label("aw_finish")); | ||
337 | |||
338 | &set_label("aw_loop",0); | ||
339 | for ($i=0; $i<8; $i++) | ||
340 | { | ||
341 | &comment("Round $i"); | ||
342 | |||
343 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
344 | &mov($tmp2,&DWP($i*4,$b,"",0)); # *b | ||
345 | &sub($tmp1,$c); | ||
346 | &mov($c,0); | ||
347 | &adc($c,$c); | ||
348 | &sub($tmp1,$tmp2); | ||
349 | &adc($c,0); | ||
350 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
351 | } | ||
352 | |||
353 | &comment(""); | ||
354 | &add($a,32); | ||
355 | &add($b,32); | ||
356 | &add($r,32); | ||
357 | &sub($num,8); | ||
358 | &jnz(&label("aw_loop")); | ||
359 | |||
360 | &set_label("aw_finish",0); | ||
361 | &mov($num,&wparam(3)); # get num | ||
362 | &and($num,7); | ||
363 | &jz(&label("aw_end")); | ||
364 | |||
365 | for ($i=0; $i<7; $i++) | ||
366 | { | ||
367 | &comment("Tail Round $i"); | ||
368 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
369 | &mov($tmp2,&DWP($i*4,$b,"",0));# *b | ||
370 | &sub($tmp1,$c); | ||
371 | &mov($c,0); | ||
372 | &adc($c,$c); | ||
373 | &sub($tmp1,$tmp2); | ||
374 | &adc($c,0); | ||
375 | &dec($num) if ($i != 6); | ||
376 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
377 | &jz(&label("aw_end")) if ($i != 6); | ||
378 | } | ||
379 | &set_label("aw_end",0); | ||
380 | |||
381 | # &mov("eax",$c); # $c is "eax" | ||
382 | |||
383 | &function_end($name); | ||
384 | } | ||
385 | |||
386 | sub bn_sub_part_words | ||
387 | { | ||
388 | local($name)=@_; | ||
389 | |||
390 | &function_begin($name,""); | ||
391 | |||
392 | &comment(""); | ||
393 | $a="esi"; | ||
394 | $b="edi"; | ||
395 | $c="eax"; | ||
396 | $r="ebx"; | ||
397 | $tmp1="ecx"; | ||
398 | $tmp2="edx"; | ||
399 | $num="ebp"; | ||
400 | |||
401 | &mov($r,&wparam(0)); # get r | ||
402 | &mov($a,&wparam(1)); # get a | ||
403 | &mov($b,&wparam(2)); # get b | ||
404 | &mov($num,&wparam(3)); # get num | ||
405 | &xor($c,$c); # clear carry | ||
406 | &and($num,0xfffffff8); # num / 8 | ||
407 | |||
408 | &jz(&label("aw_finish")); | ||
409 | |||
410 | &set_label("aw_loop",0); | ||
411 | for ($i=0; $i<8; $i++) | ||
412 | { | ||
413 | &comment("Round $i"); | ||
414 | |||
415 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
416 | &mov($tmp2,&DWP($i*4,$b,"",0)); # *b | ||
417 | &sub($tmp1,$c); | ||
418 | &mov($c,0); | ||
419 | &adc($c,$c); | ||
420 | &sub($tmp1,$tmp2); | ||
421 | &adc($c,0); | ||
422 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
423 | } | ||
424 | |||
425 | &comment(""); | ||
426 | &add($a,32); | ||
427 | &add($b,32); | ||
428 | &add($r,32); | ||
429 | &sub($num,8); | ||
430 | &jnz(&label("aw_loop")); | ||
431 | |||
432 | &set_label("aw_finish",0); | ||
433 | &mov($num,&wparam(3)); # get num | ||
434 | &and($num,7); | ||
435 | &jz(&label("aw_end")); | ||
436 | |||
437 | for ($i=0; $i<7; $i++) | ||
438 | { | ||
439 | &comment("Tail Round $i"); | ||
440 | &mov($tmp1,&DWP(0,$a,"",0)); # *a | ||
441 | &mov($tmp2,&DWP(0,$b,"",0));# *b | ||
442 | &sub($tmp1,$c); | ||
443 | &mov($c,0); | ||
444 | &adc($c,$c); | ||
445 | &sub($tmp1,$tmp2); | ||
446 | &adc($c,0); | ||
447 | &mov(&DWP(0,$r,"",0),$tmp1); # *r | ||
448 | &add($a, 4); | ||
449 | &add($b, 4); | ||
450 | &add($r, 4); | ||
451 | &dec($num) if ($i != 6); | ||
452 | &jz(&label("aw_end")) if ($i != 6); | ||
453 | } | ||
454 | &set_label("aw_end",0); | ||
455 | |||
456 | &cmp(&wparam(4),0); | ||
457 | &je(&label("pw_end")); | ||
458 | |||
459 | &mov($num,&wparam(4)); # get dl | ||
460 | &cmp($num,0); | ||
461 | &je(&label("pw_end")); | ||
462 | &jge(&label("pw_pos")); | ||
463 | |||
464 | &comment("pw_neg"); | ||
465 | &mov($tmp2,0); | ||
466 | &sub($tmp2,$num); | ||
467 | &mov($num,$tmp2); | ||
468 | &and($num,0xfffffff8); # num / 8 | ||
469 | &jz(&label("pw_neg_finish")); | ||
470 | |||
471 | &set_label("pw_neg_loop",0); | ||
472 | for ($i=0; $i<8; $i++) | ||
473 | { | ||
474 | &comment("dl<0 Round $i"); | ||
475 | |||
476 | &mov($tmp1,0); | ||
477 | &mov($tmp2,&DWP($i*4,$b,"",0)); # *b | ||
478 | &sub($tmp1,$c); | ||
479 | &mov($c,0); | ||
480 | &adc($c,$c); | ||
481 | &sub($tmp1,$tmp2); | ||
482 | &adc($c,0); | ||
483 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
484 | } | ||
485 | |||
486 | &comment(""); | ||
487 | &add($b,32); | ||
488 | &add($r,32); | ||
489 | &sub($num,8); | ||
490 | &jnz(&label("pw_neg_loop")); | ||
491 | |||
492 | &set_label("pw_neg_finish",0); | ||
493 | &mov($tmp2,&wparam(4)); # get dl | ||
494 | &mov($num,0); | ||
495 | &sub($num,$tmp2); | ||
496 | &and($num,7); | ||
497 | &jz(&label("pw_end")); | ||
498 | |||
499 | for ($i=0; $i<7; $i++) | ||
500 | { | ||
501 | &comment("dl<0 Tail Round $i"); | ||
502 | &mov($tmp1,0); | ||
503 | &mov($tmp2,&DWP($i*4,$b,"",0));# *b | ||
504 | &sub($tmp1,$c); | ||
505 | &mov($c,0); | ||
506 | &adc($c,$c); | ||
507 | &sub($tmp1,$tmp2); | ||
508 | &adc($c,0); | ||
509 | &dec($num) if ($i != 6); | ||
510 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
511 | &jz(&label("pw_end")) if ($i != 6); | ||
512 | } | ||
513 | |||
514 | &jmp(&label("pw_end")); | ||
515 | |||
516 | &set_label("pw_pos",0); | ||
517 | |||
518 | &and($num,0xfffffff8); # num / 8 | ||
519 | &jz(&label("pw_pos_finish")); | ||
520 | |||
521 | &set_label("pw_pos_loop",0); | ||
522 | |||
523 | for ($i=0; $i<8; $i++) | ||
524 | { | ||
525 | &comment("dl>0 Round $i"); | ||
526 | |||
527 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
528 | &sub($tmp1,$c); | ||
529 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
530 | &jnc(&label("pw_nc".$i)); | ||
531 | } | ||
532 | |||
533 | &comment(""); | ||
534 | &add($a,32); | ||
535 | &add($r,32); | ||
536 | &sub($num,8); | ||
537 | &jnz(&label("pw_pos_loop")); | ||
538 | |||
539 | &set_label("pw_pos_finish",0); | ||
540 | &mov($num,&wparam(4)); # get dl | ||
541 | &and($num,7); | ||
542 | &jz(&label("pw_end")); | ||
543 | |||
544 | for ($i=0; $i<7; $i++) | ||
545 | { | ||
546 | &comment("dl>0 Tail Round $i"); | ||
547 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
548 | &sub($tmp1,$c); | ||
549 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
550 | &jnc(&label("pw_tail_nc".$i)); | ||
551 | &dec($num) if ($i != 6); | ||
552 | &jz(&label("pw_end")) if ($i != 6); | ||
553 | } | ||
554 | &mov($c,1); | ||
555 | &jmp(&label("pw_end")); | ||
556 | |||
557 | &set_label("pw_nc_loop",0); | ||
558 | for ($i=0; $i<8; $i++) | ||
559 | { | ||
560 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
561 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
562 | &set_label("pw_nc".$i,0); | ||
563 | } | ||
564 | |||
565 | &comment(""); | ||
566 | &add($a,32); | ||
567 | &add($r,32); | ||
568 | &sub($num,8); | ||
569 | &jnz(&label("pw_nc_loop")); | ||
570 | |||
571 | &mov($num,&wparam(4)); # get dl | ||
572 | &and($num,7); | ||
573 | &jz(&label("pw_nc_end")); | ||
574 | |||
575 | for ($i=0; $i<7; $i++) | ||
576 | { | ||
577 | &mov($tmp1,&DWP($i*4,$a,"",0)); # *a | ||
578 | &mov(&DWP($i*4,$r,"",0),$tmp1); # *r | ||
579 | &set_label("pw_tail_nc".$i,0); | ||
580 | &dec($num) if ($i != 6); | ||
581 | &jz(&label("pw_nc_end")) if ($i != 6); | ||
582 | } | ||
583 | |||
584 | &set_label("pw_nc_end",0); | ||
585 | &mov($c,0); | ||
586 | |||
587 | &set_label("pw_end",0); | ||
588 | |||
589 | # &mov("eax",$c); # $c is "eax" | ||
311 | 590 | ||
312 | &function_end($name); | 591 | &function_end($name); |
313 | } | 592 | } |