summaryrefslogtreecommitdiff
path: root/src/lib/libcrypto/bn/asm
diff options
context:
space:
mode:
authorderaadt <>2023-04-25 04:42:26 +0000
committerderaadt <>2023-04-25 04:42:26 +0000
commite2118101444d3cf3cab87297b363cecd5357ae89 (patch)
treeb4ae043f669d9d718f1fecb4ca705a0cf2d2ddc7 /src/lib/libcrypto/bn/asm
parentc6490b97c04798e5cd36a489e3ba5ffc4a66550b (diff)
downloadopenbsd-e2118101444d3cf3cab87297b363cecd5357ae89.tar.gz
openbsd-e2118101444d3cf3cab87297b363cecd5357ae89.tar.bz2
openbsd-e2118101444d3cf3cab87297b363cecd5357ae89.zip
Add endbr64 where needed by inspection. Passes regresson tests.
ok jsing, and kind of tb an earlier version
Diffstat (limited to 'src/lib/libcrypto/bn/asm')
-rw-r--r--src/lib/libcrypto/bn/asm/modexp512-x86_64.pl5
-rwxr-xr-xsrc/lib/libcrypto/bn/asm/x86_64-mont.pl3
-rwxr-xr-xsrc/lib/libcrypto/bn/asm/x86_64-mont5.pl5
3 files changed, 13 insertions, 0 deletions
diff --git a/src/lib/libcrypto/bn/asm/modexp512-x86_64.pl b/src/lib/libcrypto/bn/asm/modexp512-x86_64.pl
index 2e71a7f03d..af78fff541 100644
--- a/src/lib/libcrypto/bn/asm/modexp512-x86_64.pl
+++ b/src/lib/libcrypto/bn/asm/modexp512-x86_64.pl
@@ -347,6 +347,7 @@ $code.=<<___;
347.type MULADD_128x512,\@abi-omnipotent 347.type MULADD_128x512,\@abi-omnipotent
348.align 16 348.align 16
349MULADD_128x512: 349MULADD_128x512:
350 endbr64
350___ 351___
351 &MULSTEP_512([map("%r$_",(8..15))], "(+8*0)(%rcx)", "%rsi", "%rbp", "%rbx"); 352 &MULSTEP_512([map("%r$_",(8..15))], "(+8*0)(%rcx)", "%rsi", "%rbp", "%rbx");
352$code.=<<___; 353$code.=<<___;
@@ -414,6 +415,7 @@ $code.=<<___;
414.type mont_reduce,\@abi-omnipotent 415.type mont_reduce,\@abi-omnipotent
415.align 16 416.align 16
416mont_reduce: 417mont_reduce:
418 endbr64
417___ 419___
418 420
419my $STACK_DEPTH = 8; 421my $STACK_DEPTH = 8;
@@ -676,6 +678,7 @@ $code.=<<___;
676.type mont_mul_a3b,\@abi-omnipotent 678.type mont_mul_a3b,\@abi-omnipotent
677.align 16 679.align 16
678mont_mul_a3b: 680mont_mul_a3b:
681 endbr64
679 # 682 #
680 # multiply tmp = src1 * src2 683 # multiply tmp = src1 * src2
681 # For multiply: dst = rcx, src1 = rdi, src2 = rsi 684 # For multiply: dst = rcx, src1 = rdi, src2 = rsi
@@ -1077,6 +1080,7 @@ $code.=<<___;
1077.type sqr_reduce,\@abi-omnipotent 1080.type sqr_reduce,\@abi-omnipotent
1078.align 16 1081.align 16
1079sqr_reduce: 1082sqr_reduce:
1083 endbr64
1080 mov (+$pResult_offset+8)(%rsp), %rcx 1084 mov (+$pResult_offset+8)(%rsp), %rcx
1081___ 1085___
1082 &SQR_512("%rsp+$tmp16_offset+8", "%rcx", [map("%r$_",(10..15,8..9))], "%rbx", "%rbp", "%rsi", "%rdi"); 1086 &SQR_512("%rsp+$tmp16_offset+8", "%rcx", [map("%r$_",(10..15,8..9))], "%rbx", "%rbp", "%rsi", "%rdi");
@@ -1106,6 +1110,7 @@ $code.=<<___;
1106.globl mod_exp_512 1110.globl mod_exp_512
1107.type mod_exp_512,\@function,4 1111.type mod_exp_512,\@function,4
1108mod_exp_512: 1112mod_exp_512:
1113 endbr64
1109 push %rbp 1114 push %rbp
1110 push %rbx 1115 push %rbx
1111 push %r12 1116 push %r12
diff --git a/src/lib/libcrypto/bn/asm/x86_64-mont.pl b/src/lib/libcrypto/bn/asm/x86_64-mont.pl
index cae7309d5b..6f5ab331e2 100755
--- a/src/lib/libcrypto/bn/asm/x86_64-mont.pl
+++ b/src/lib/libcrypto/bn/asm/x86_64-mont.pl
@@ -63,6 +63,7 @@ $code=<<___;
63.type bn_mul_mont,\@function,6 63.type bn_mul_mont,\@function,6
64.align 16 64.align 16
65bn_mul_mont: 65bn_mul_mont:
66 endbr64
66 test \$3,${num}d 67 test \$3,${num}d
67 jnz .Lmul_enter 68 jnz .Lmul_enter
68 cmp \$8,${num}d 69 cmp \$8,${num}d
@@ -278,6 +279,7 @@ $code.=<<___;
278.align 16 279.align 16
279bn_mul4x_mont: 280bn_mul4x_mont:
280.Lmul4x_enter: 281.Lmul4x_enter:
282 endbr64
281 push %rbx 283 push %rbx
282 push %rbp 284 push %rbp
283 push %r12 285 push %r12
@@ -705,6 +707,7 @@ $code.=<<___;
705.align 16 707.align 16
706bn_sqr4x_mont: 708bn_sqr4x_mont:
707.Lsqr4x_enter: 709.Lsqr4x_enter:
710 endbr64
708 push %rbx 711 push %rbx
709 push %rbp 712 push %rbp
710 push %r12 713 push %r12
diff --git a/src/lib/libcrypto/bn/asm/x86_64-mont5.pl b/src/lib/libcrypto/bn/asm/x86_64-mont5.pl
index 7b9c6df273..3b3325a6cc 100755
--- a/src/lib/libcrypto/bn/asm/x86_64-mont5.pl
+++ b/src/lib/libcrypto/bn/asm/x86_64-mont5.pl
@@ -57,6 +57,7 @@ $code=<<___;
57.type bn_mul_mont_gather5,\@function,6 57.type bn_mul_mont_gather5,\@function,6
58.align 64 58.align 64
59bn_mul_mont_gather5: 59bn_mul_mont_gather5:
60 endbr64
60 test \$3,${num}d 61 test \$3,${num}d
61 jnz .Lmul_enter 62 jnz .Lmul_enter
62 cmp \$8,${num}d 63 cmp \$8,${num}d
@@ -387,6 +388,7 @@ $code.=<<___;
387.type bn_mul4x_mont_gather5,\@function,6 388.type bn_mul4x_mont_gather5,\@function,6
388.align 16 389.align 16
389bn_mul4x_mont_gather5: 390bn_mul4x_mont_gather5:
391 endbr64
390.Lmul4x_enter: 392.Lmul4x_enter:
391 mov ${num}d,${num}d 393 mov ${num}d,${num}d
392 movd `($win64?56:8)`(%rsp),%xmm5 # load 7th argument 394 movd `($win64?56:8)`(%rsp),%xmm5 # load 7th argument
@@ -925,6 +927,7 @@ $code.=<<___;
925.type bn_scatter5,\@abi-omnipotent 927.type bn_scatter5,\@abi-omnipotent
926.align 16 928.align 16
927bn_scatter5: 929bn_scatter5:
930 endbr64
928 cmp \$0, $num 931 cmp \$0, $num
929 jz .Lscatter_epilogue 932 jz .Lscatter_epilogue
930 lea ($tbl,$idx,8),$tbl 933 lea ($tbl,$idx,8),$tbl
@@ -943,6 +946,7 @@ bn_scatter5:
943.type bn_gather5,\@abi-omnipotent 946.type bn_gather5,\@abi-omnipotent
944.align 16 947.align 16
945bn_gather5: 948bn_gather5:
949 endbr64
946.LSEH_begin_bn_gather5: # Win64 thing, but harmless in other cases 950.LSEH_begin_bn_gather5: # Win64 thing, but harmless in other cases
947 # I can't trust assembler to use specific encoding:-( 951 # I can't trust assembler to use specific encoding:-(
948 .byte 0x4c,0x8d,0x14,0x24 # lea (%rsp),%r10 952 .byte 0x4c,0x8d,0x14,0x24 # lea (%rsp),%r10
@@ -1053,6 +1057,7 @@ $code.=<<___;
1053.type mul_handler,\@abi-omnipotent 1057.type mul_handler,\@abi-omnipotent
1054.align 16 1058.align 16
1055mul_handler: 1059mul_handler:
1060 endbr64
1056 push %rsi 1061 push %rsi
1057 push %rdi 1062 push %rdi
1058 push %rbx 1063 push %rbx