-
Notifications
You must be signed in to change notification settings - Fork 545
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[OpenBLAS] Update patches to improve performance
* Remove fallback to generic aarch kernels on Neoverse. This was fixed before 0.3.20, so the optimized kernels should be fine to use now.
* Backport threshold increase for gemv multithreading to improve performance. This is included in 0.3.27.
- Loading branch information
Showing
10 changed files
with
91 additions
and
77 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
22 changes: 22 additions & 0 deletions
22
O/OpenBLAS/[email protected]/bundled/patches/60-gemv-multithreading.patch
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,22 @@ | ||
From d2fc4f3b4d7f41527bc7dc8f62e9aa6229cfac89 Mon Sep 17 00:00:00 2001 | ||
From: Martin Kroeker <[email protected]> | ||
Date: Wed, 17 Jan 2024 20:59:24 +0100 | ||
Subject: [PATCH] Increase multithreading threshold by a factor of 50 | ||
|
||
--- | ||
interface/gemv.c | 2 +- | ||
1 file changed, 1 insertion(+), 1 deletion(-) | ||
|
||
diff --git a/interface/gemv.c b/interface/gemv.c | ||
index 1f07635799..2c121f1308 100644 | ||
--- a/interface/gemv.c | ||
+++ b/interface/gemv.c | ||
@@ -226,7 +226,7 @@ void CNAME(enum CBLAS_ORDER order, | ||
|
||
#ifdef SMP | ||
|
||
- if ( 1L * m * n < 2304L * GEMM_MULTITHREAD_THRESHOLD ) | ||
+ if ( 1L * m * n < 115200L * GEMM_MULTITHREAD_THRESHOLD ) | ||
nthreads = 1; | ||
else | ||
nthreads = num_cpu_avail(2); |
19 changes: 0 additions & 19 deletions
19
O/OpenBLAS/[email protected]/bundled/patches/neoverse-generic-kernels.patch
This file was deleted.
Oops, something went wrong.
19 changes: 0 additions & 19 deletions
19
O/OpenBLAS/[email protected]/bundled/patches/10-neoverse-generic-kernels.patch
This file was deleted.
Oops, something went wrong.
22 changes: 22 additions & 0 deletions
22
O/OpenBLAS/[email protected]/bundled/patches/60-gemv-multithreading.patch
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,22 @@ | ||
From d2fc4f3b4d7f41527bc7dc8f62e9aa6229cfac89 Mon Sep 17 00:00:00 2001 | ||
From: Martin Kroeker <[email protected]> | ||
Date: Wed, 17 Jan 2024 20:59:24 +0100 | ||
Subject: [PATCH] Increase multithreading threshold by a factor of 50 | ||
|
||
--- | ||
interface/gemv.c | 2 +- | ||
1 file changed, 1 insertion(+), 1 deletion(-) | ||
|
||
diff --git a/interface/gemv.c b/interface/gemv.c | ||
index 1f07635799..2c121f1308 100644 | ||
--- a/interface/gemv.c | ||
+++ b/interface/gemv.c | ||
@@ -226,7 +226,7 @@ void CNAME(enum CBLAS_ORDER order, | ||
|
||
#ifdef SMP | ||
|
||
- if ( 1L * m * n < 2304L * GEMM_MULTITHREAD_THRESHOLD ) | ||
+ if ( 1L * m * n < 115200L * GEMM_MULTITHREAD_THRESHOLD ) | ||
nthreads = 1; | ||
else | ||
nthreads = num_cpu_avail(2); |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
22 changes: 22 additions & 0 deletions
22
O/OpenBLAS/[email protected]/bundled/patches/60-gemv-multithreading.patch
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,22 @@ | ||
From d2fc4f3b4d7f41527bc7dc8f62e9aa6229cfac89 Mon Sep 17 00:00:00 2001 | ||
From: Martin Kroeker <[email protected]> | ||
Date: Wed, 17 Jan 2024 20:59:24 +0100 | ||
Subject: [PATCH] Increase multithreading threshold by a factor of 50 | ||
|
||
--- | ||
interface/gemv.c | 2 +- | ||
1 file changed, 1 insertion(+), 1 deletion(-) | ||
|
||
diff --git a/interface/gemv.c b/interface/gemv.c | ||
index 1f07635799..2c121f1308 100644 | ||
--- a/interface/gemv.c | ||
+++ b/interface/gemv.c | ||
@@ -226,7 +226,7 @@ void CNAME(enum CBLAS_ORDER order, | ||
|
||
#ifdef SMP | ||
|
||
- if ( 1L * m * n < 2304L * GEMM_MULTITHREAD_THRESHOLD ) | ||
+ if ( 1L * m * n < 115200L * GEMM_MULTITHREAD_THRESHOLD ) | ||
nthreads = 1; | ||
else | ||
nthreads = num_cpu_avail(2); |
19 changes: 0 additions & 19 deletions
19
O/OpenBLAS/[email protected]/bundled/patches/neoverse-generic-kernels.patch
This file was deleted.
Oops, something went wrong.
19 changes: 0 additions & 19 deletions
19
O/OpenBLAS/[email protected]/bundled/patches/10-neoverse-generic-kernels.patch
This file was deleted.
Oops, something went wrong.
22 changes: 22 additions & 0 deletions
22
O/OpenBLAS/[email protected]/bundled/patches/60-gemv-multithreading.patch
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,22 @@ | ||
From d2fc4f3b4d7f41527bc7dc8f62e9aa6229cfac89 Mon Sep 17 00:00:00 2001 | ||
From: Martin Kroeker <[email protected]> | ||
Date: Wed, 17 Jan 2024 20:59:24 +0100 | ||
Subject: [PATCH] Increase multithreading threshold by a factor of 50 | ||
|
||
--- | ||
interface/gemv.c | 2 +- | ||
1 file changed, 1 insertion(+), 1 deletion(-) | ||
|
||
diff --git a/interface/gemv.c b/interface/gemv.c | ||
index 1f07635799..2c121f1308 100644 | ||
--- a/interface/gemv.c | ||
+++ b/interface/gemv.c | ||
@@ -226,7 +226,7 @@ void CNAME(enum CBLAS_ORDER order, | ||
|
||
#ifdef SMP | ||
|
||
- if ( 1L * m * n < 2304L * GEMM_MULTITHREAD_THRESHOLD ) | ||
+ if ( 1L * m * n < 115200L * GEMM_MULTITHREAD_THRESHOLD ) | ||
nthreads = 1; | ||
else | ||
nthreads = num_cpu_avail(2); |