forked from pool/openssl-1_1
b51c004cd8
- Performance enhancements for cryptography from OpenSSL 3.x [jsc#PED-5086, jsc#PED-3514]
  * Add patches:
    - openssl-ec-Use-static-linkage-on-nistp521-felem_-square-mul-.patch
    - openssl-ec-56-bit-Limb-Solinas-Strategy-for-secp384r1.patch
    - openssl-ec-powerpc64le-Add-asm-implementation-of-felem_-squa.patch
    - openssl-ecc-Remove-extraneous-parentheses-in-secp384r1.patch
    - openssl-powerpc-ecc-Fix-stack-allocation-secp384r1-asm.patch
    - openssl-Improve-performance-for-6x-unrolling-with-vpermxor-i.patch

OBS-URL: https://build.opensuse.org/request/show/1119558
OBS-URL: https://build.opensuse.org/package/show/security:tls/openssl-1_1?expand=0&rev=148
97 lines
2.1 KiB
Diff
97 lines
2.1 KiB
Diff
From 50f8b936b00dc18ce1f622a7a6aa46daf03da48b Mon Sep 17 00:00:00 2001
|
|
From: Rohan McLure <rohanmclure@linux.ibm.com>
|
|
Date: Wed, 16 Aug 2023 16:52:47 +1000
|
|
Subject: [PATCH] powerpc: ecc: Fix stack allocation secp384r1 asm
|
|
|
|
Assembly acceleration secp384r1 opts to not use any callee-save VSRs, as
|
|
VSX enabled systems make extensive use of renaming, and so writebacks in
|
|
felem_{mul,square}() can be reordered for best cache effects.
|
|
|
|
Remove stack allocations. This in turn fixes unmatched push/pops in
|
|
felem_{mul,square}().
|
|
|
|
Signed-off-by: Rohan McLure <rohan.mclure@linux.ibm.com>
|
|
|
|
Reviewed-by: Tomas Mraz <tomas@openssl.org>
|
|
Reviewed-by: Shane Lontis <shane.lontis@oracle.com>
|
|
Reviewed-by: Hugo Landau <hlandau@openssl.org>
|
|
(Merged from https://github.com/openssl/openssl/pull/21749)
|
|
---
|
|
crypto/ec/asm/ecp_nistp384-ppc64.pl | 49 -----------------------------
|
|
1 file changed, 49 deletions(-)
|
|
|
|
diff --git a/crypto/ec/asm/ecp_nistp384-ppc64.pl b/crypto/ec/asm/ecp_nistp384-ppc64.pl
|
|
index 3f86b391af69..28f4168e5218 100755
|
|
--- a/crypto/ec/asm/ecp_nistp384-ppc64.pl
|
|
+++ b/crypto/ec/asm/ecp_nistp384-ppc64.pl
|
|
@@ -62,51 +62,6 @@ ($)
|
|
___
|
|
}
|
|
|
|
-
|
|
-sub push_vrs($$)
|
|
-{
|
|
- my ($min, $max) = @_;
|
|
-
|
|
- my $count = $max - $min + 1;
|
|
-
|
|
- $code.=<<___;
|
|
- mr $savesp,$sp
|
|
- stdu $sp,-16*`$count+1`($sp)
|
|
-
|
|
-___
|
|
- for (my $i = $min; $i <= $max; $i++) {
|
|
- my $mult = $max - $i + 1;
|
|
- $code.=<<___;
|
|
- stxv $i,-16*$mult($savesp)
|
|
-___
|
|
-
|
|
- }
|
|
-
|
|
- $code.=<<___;
|
|
-
|
|
-___
|
|
-}
|
|
-
|
|
-sub pop_vrs($$)
|
|
-{
|
|
- my ($min, $max) = @_;
|
|
-
|
|
- $code.=<<___;
|
|
- ld $savesp,0($sp)
|
|
-___
|
|
- for (my $i = $min; $i <= $max; $i++) {
|
|
- my $mult = $max - $i + 1;
|
|
- $code.=<<___;
|
|
- lxv $i,-16*$mult($savesp)
|
|
-___
|
|
- }
|
|
-
|
|
- $code.=<<___;
|
|
- mr $sp,$savesp
|
|
-
|
|
-___
|
|
-}
|
|
-
|
|
sub load_vrs($$)
|
|
{
|
|
my ($pointer, $reg_list) = @_;
|
|
@@ -162,8 +117,6 @@ ($$)
|
|
|
|
startproc("p384_felem_mul");
|
|
|
|
- push_vrs(52, 63);
|
|
-
|
|
$code.=<<___;
|
|
vspltisw $vzero,0
|
|
|
|
@@ -268,8 +221,6 @@ ($$)
|
|
|
|
startproc("p384_felem_square");
|
|
|
|
- push_vrs(52, 63);
|
|
-
|
|
$code.=<<___;
|
|
vspltisw $vzero,0
|
|
|