diff options
| author | bcook <> | 2015-09-11 12:17:57 +0000 |
|---|---|---|
| committer | bcook <> | 2015-09-11 12:17:57 +0000 |
| commit | eafebfdd3adba0417a72d6cc8a75f367fc2fbbdb (patch) | |
| tree | 03ee90a380bddd9dac65bed24366a6dc8e0abd01 /src/lib/libcrypto/bn | |
| parent | 2a8f39dde4eb3fc8b492e8c665128c557ff500af (diff) | |
| download | openbsd-eafebfdd3adba0417a72d6cc8a75f367fc2fbbdb.tar.gz openbsd-eafebfdd3adba0417a72d6cc8a75f367fc2fbbdb.tar.bz2 openbsd-eafebfdd3adba0417a72d6cc8a75f367fc2fbbdb.zip | |
Fixup inter-bank movq/movd operations, emit bytes for pclmulqdq again.
Fixes builds gcc + Apple's assembler, working on reenabling builds with older
OpenBSD releases.
based on OpenSSL commit:
https://git.openssl.org/?p=openssl.git;a=commitdiff;h=902b30df193afc3417a96ba72a81ed390bd50de3
ok miod@
Diffstat (limited to 'src/lib/libcrypto/bn')
| -rw-r--r-- | src/lib/libcrypto/bn/asm/x86_64-gf2m.pl | 12 | ||||
| -rwxr-xr-x | src/lib/libcrypto/bn/asm/x86_64-mont5.pl | 12 |
2 files changed, 12 insertions, 12 deletions
diff --git a/src/lib/libcrypto/bn/asm/x86_64-gf2m.pl b/src/lib/libcrypto/bn/asm/x86_64-gf2m.pl index 226c66c35e..8e45c7479b 100644 --- a/src/lib/libcrypto/bn/asm/x86_64-gf2m.pl +++ b/src/lib/libcrypto/bn/asm/x86_64-gf2m.pl | |||
| @@ -143,12 +143,12 @@ $code.=<<___; | |||
| 143 | mov (%rsp,$i1,8),$t1 | 143 | mov (%rsp,$i1,8),$t1 |
| 144 | mov $t1,$t0 | 144 | mov $t1,$t0 |
| 145 | shl \$`8*$n-4`,$t1 | 145 | shl \$`8*$n-4`,$t1 |
| 146 | movq $R,$i0 | 146 | movd $R,$i0 |
| 147 | shr \$`64-(8*$n-4)`,$t0 | 147 | shr \$`64-(8*$n-4)`,$t0 |
| 148 | xor $t1,$lo | 148 | xor $t1,$lo |
| 149 | psrldq \$8,$R | 149 | psrldq \$8,$R |
| 150 | xor $t0,$hi | 150 | xor $t0,$hi |
| 151 | movq $R,$i1 | 151 | movd $R,$i1 |
| 152 | xor $i0,$lo | 152 | xor $i0,$lo |
| 153 | xor $i1,$hi | 153 | xor $i1,$hi |
| 154 | 154 | ||
| @@ -171,15 +171,15 @@ bn_GF2m_mul_2x2: | |||
| 171 | bt \$33,%rax | 171 | bt \$33,%rax |
| 172 | jnc .Lvanilla_mul_2x2 | 172 | jnc .Lvanilla_mul_2x2 |
| 173 | 173 | ||
| 174 | movq $a1,%xmm0 | 174 | movd $a1,%xmm0 |
| 175 | movq $b1,%xmm1 | 175 | movd $b1,%xmm1 |
| 176 | movq $a0,%xmm2 | 176 | movd $a0,%xmm2 |
| 177 | ___ | 177 | ___ |
| 178 | $code.=<<___ if ($win64); | 178 | $code.=<<___ if ($win64); |
| 179 | movq 40(%rsp),%xmm3 | 179 | movq 40(%rsp),%xmm3 |
| 180 | ___ | 180 | ___ |
| 181 | $code.=<<___ if (!$win64); | 181 | $code.=<<___ if (!$win64); |
| 182 | movq $b0,%xmm3 | 182 | movd $b0,%xmm3 |
| 183 | ___ | 183 | ___ |
| 184 | $code.=<<___; | 184 | $code.=<<___; |
| 185 | movdqa %xmm0,%xmm4 | 185 | movdqa %xmm0,%xmm4 |
diff --git a/src/lib/libcrypto/bn/asm/x86_64-mont5.pl b/src/lib/libcrypto/bn/asm/x86_64-mont5.pl index 9c88884d42..81e5c53728 100755 --- a/src/lib/libcrypto/bn/asm/x86_64-mont5.pl +++ b/src/lib/libcrypto/bn/asm/x86_64-mont5.pl | |||
| @@ -120,7 +120,7 @@ $code.=<<___; | |||
| 120 | lea $STRIDE($bp),$bp | 120 | lea $STRIDE($bp),$bp |
| 121 | por %xmm3,%xmm0 | 121 | por %xmm3,%xmm0 |
| 122 | 122 | ||
| 123 | movq %xmm0,$m0 # m0=bp[0] | 123 | movd %xmm0,$m0 # m0=bp[0] |
| 124 | 124 | ||
| 125 | mov ($n0),$n0 # pull n0[0] value | 125 | mov ($n0),$n0 # pull n0[0] value |
| 126 | mov ($ap),%rax | 126 | mov ($ap),%rax |
| @@ -183,7 +183,7 @@ $code.=<<___; | |||
| 183 | cmp $num,$j | 183 | cmp $num,$j |
| 184 | jl .L1st | 184 | jl .L1st |
| 185 | 185 | ||
| 186 | movq %xmm0,$m0 # bp[1] | 186 | movd %xmm0,$m0 # bp[1] |
| 187 | 187 | ||
| 188 | add %rax,$hi1 | 188 | add %rax,$hi1 |
| 189 | mov ($ap),%rax # ap[0] | 189 | mov ($ap),%rax # ap[0] |
| @@ -266,7 +266,7 @@ $code.=<<___; | |||
| 266 | cmp $num,$j | 266 | cmp $num,$j |
| 267 | jl .Linner | 267 | jl .Linner |
| 268 | 268 | ||
| 269 | movq %xmm0,$m0 # bp[i+1] | 269 | movd %xmm0,$m0 # bp[i+1] |
| 270 | 270 | ||
| 271 | add %rax,$hi1 | 271 | add %rax,$hi1 |
| 272 | mov ($ap),%rax # ap[0] | 272 | mov ($ap),%rax # ap[0] |
| @@ -403,7 +403,7 @@ $code.=<<___; | |||
| 403 | lea $STRIDE($bp),$bp | 403 | lea $STRIDE($bp),$bp |
| 404 | por %xmm3,%xmm0 | 404 | por %xmm3,%xmm0 |
| 405 | 405 | ||
| 406 | movq %xmm0,$m0 # m0=bp[0] | 406 | movd %xmm0,$m0 # m0=bp[0] |
| 407 | mov ($n0),$n0 # pull n0[0] value | 407 | mov ($n0),$n0 # pull n0[0] value |
| 408 | mov ($ap),%rax | 408 | mov ($ap),%rax |
| 409 | 409 | ||
| @@ -550,7 +550,7 @@ $code.=<<___; | |||
| 550 | mov $N[1],-16(%rsp,$j,8) # tp[j-1] | 550 | mov $N[1],-16(%rsp,$j,8) # tp[j-1] |
| 551 | mov %rdx,$N[0] | 551 | mov %rdx,$N[0] |
| 552 | 552 | ||
| 553 | movq %xmm0,$m0 # bp[1] | 553 | movd %xmm0,$m0 # bp[1] |
| 554 | 554 | ||
| 555 | xor $N[1],$N[1] | 555 | xor $N[1],$N[1] |
| 556 | add $A[0],$N[0] | 556 | add $A[0],$N[0] |
| @@ -718,7 +718,7 @@ $code.=<<___; | |||
| 718 | mov $N[0],-24(%rsp,$j,8) # tp[j-1] | 718 | mov $N[0],-24(%rsp,$j,8) # tp[j-1] |
| 719 | mov %rdx,$N[0] | 719 | mov %rdx,$N[0] |
| 720 | 720 | ||
| 721 | movq %xmm0,$m0 # bp[i+1] | 721 | movd %xmm0,$m0 # bp[i+1] |
| 722 | mov $N[1],-16(%rsp,$j,8) # tp[j-1] | 722 | mov $N[1],-16(%rsp,$j,8) # tp[j-1] |
| 723 | 723 | ||
| 724 | xor $N[1],$N[1] | 724 | xor $N[1],$N[1] |
