From 6feb92a58fdc36731fc87e9d1ed11cf7f54ef053 Mon Sep 17 00:00:00 2001 From: Harmen Stoppels Date: Tue, 5 May 2020 13:46:04 +0200 Subject: [PATCH] Add OpenBLAS patch for aarch64 (#987) --- ...on-to-zero-in-the-NEON-SGEMM_BETA-ke.patch | 40 +++++++++++++++++++ ...on-to-zero-in-the-NEON-SGEMM_BETA-ke.patch | 40 +++++++++++++++++++ 2 files changed, 80 insertions(+) create mode 100644 O/OpenBLAS/OpenBLAS32@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch create mode 100644 O/OpenBLAS/OpenBLAS@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch diff --git a/O/OpenBLAS/OpenBLAS32@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch b/O/OpenBLAS/OpenBLAS32@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch new file mode 100644 index 00000000000..3b39aa593c7 --- /dev/null +++ b/O/OpenBLAS/OpenBLAS32@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch @@ -0,0 +1,40 @@ +From 1c64c55baca23e2a18b78a8391d83cfbc2cb56a7 Mon Sep 17 00:00:00 2001 +From: Martin Kroeker +Date: Tue, 31 Mar 2020 16:53:56 +0200 +Subject: [PATCH] fix initialization to zero in the NEON SGEMM_BETA kernel as + well + +--- + kernel/arm64/sgemm_beta.S | 16 ++++++++-------- + 1 file changed, 8 insertions(+), 8 deletions(-) + +diff --git a/kernel/arm64/sgemm_beta.S b/kernel/arm64/sgemm_beta.S +index a3b97e23..574485bc 100755 +--- a/kernel/arm64/sgemm_beta.S ++++ b/kernel/arm64/sgemm_beta.S +@@ -81,14 +81,14 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + .endm + + .macro INIT_ZERO +- fmul v0.4s, v0.4s, betaV0 +- fmul v1.4s, v1.4s, betaV0 +- fmul v2.4s, v2.4s, betaV0 +- fmul v3.4s, v3.4s, betaV0 +- fmul v4.4s, v4.4s, betaV0 +- fmul v5.4s, v5.4s, betaV0 +- fmul v6.4s, v6.4s, betaV0 +- fmul v7.4s, v7.4s, betaV0 ++ movi v0.4s, #0x0 ++ movi v1.4s, #0x0 ++ movi v2.4s, #0x0 ++ movi v3.4s, #0x0 ++ movi v4.4s, #0x0 ++ movi v5.4s, #0x0 ++ movi v6.4s, #0x0 ++ movi v7.4s, #0x0 + .endm + + /************************************************************************************** +-- +2.25.1 + diff --git a/O/OpenBLAS/OpenBLAS@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch b/O/OpenBLAS/OpenBLAS@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch new file mode 100644 index 00000000000..3b39aa593c7 --- /dev/null +++ b/O/OpenBLAS/OpenBLAS@0.3.9/bundled/patches/fix-initialization-to-zero-in-the-NEON-SGEMM_BETA-ke.patch @@ -0,0 +1,40 @@ +From 1c64c55baca23e2a18b78a8391d83cfbc2cb56a7 Mon Sep 17 00:00:00 2001 +From: Martin Kroeker +Date: Tue, 31 Mar 2020 16:53:56 +0200 +Subject: [PATCH] fix initialization to zero in the NEON SGEMM_BETA kernel as + well + +--- + kernel/arm64/sgemm_beta.S | 16 ++++++++-------- + 1 file changed, 8 insertions(+), 8 deletions(-) + +diff --git a/kernel/arm64/sgemm_beta.S b/kernel/arm64/sgemm_beta.S +index a3b97e23..574485bc 100755 +--- a/kernel/arm64/sgemm_beta.S ++++ b/kernel/arm64/sgemm_beta.S +@@ -81,14 +81,14 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + .endm + + .macro INIT_ZERO +- fmul v0.4s, v0.4s, betaV0 +- fmul v1.4s, v1.4s, betaV0 +- fmul v2.4s, v2.4s, betaV0 +- fmul v3.4s, v3.4s, betaV0 +- fmul v4.4s, v4.4s, betaV0 +- fmul v5.4s, v5.4s, betaV0 +- fmul v6.4s, v6.4s, betaV0 +- fmul v7.4s, v7.4s, betaV0 ++ movi v0.4s, #0x0 ++ movi v1.4s, #0x0 ++ movi v2.4s, #0x0 ++ movi v3.4s, #0x0 ++ movi v4.4s, #0x0 ++ movi v5.4s, #0x0 ++ movi v6.4s, #0x0 ++ movi v7.4s, #0x0 + .endm + + /************************************************************************************** +-- +2.25.1 +