summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de> 2022-06-28 16:09:36 +0200
committer: GitHub <noreply@github.com> 2022-06-28 16:09:36 +0200
commit: be5500e704e6758647f5d07daf9a3b2d06de538b (patch)
tree: c0f785c564a6b2233051efb8a40c428dac9b558a
parent: 92275a79020c9eff410024915e88b1822028fbc9 (diff)
parent: 2062280c6fab0cf02046b7c5c783b3fc124c5a27 (diff)
download: openblas-be5500e704e6758647f5d07daf9a3b2d06de538b.tar.gz
download: openblas-be5500e704e6758647f5d07daf9a3b2d06de538b.tar.bz2
download: openblas-be5500e704e6758647f5d07daf9a3b2d06de538b.zip
Merge pull request #3669 from VFerrari/fix_small_matrix_kernel
POWER: fix issues with the small matrix kernel
-rw-r--r-- Makefile.system | 2
-rw-r--r-- kernel/power/gemm_small_kernel_permit_power10.c | 4
2 files changed, 5 insertions, 1 deletion
diff --git a/Makefile.system b/Makefile.system
index 8a62eb3a3..217d5289e 100644
--- a/Makefile.system
+++ b/Makefile.system
@@ -261,7 +261,7 @@ endif
#For small matrix optimization
ifeq ($(ARCH), x86_64)
SMALL_MATRIX_OPT = 1
-else ifeq ($(CORE), POWER10)
+else ifeq ($(ARCH), power)
SMALL_MATRIX_OPT = 1
endif
ifeq ($(SMALL_MATRIX_OPT), 1)
diff --git a/kernel/power/gemm_small_kernel_permit_power10.c b/kernel/power/gemm_small_kernel_permit_power10.c
index 9b38e457b..3a146d8fa 100644
--- a/kernel/power/gemm_small_kernel_permit_power10.c
+++ b/kernel/power/gemm_small_kernel_permit_power10.c
@@ -69,6 +69,7 @@ int CNAME(int transa, int transb, BLASLONG M, BLASLONG N, BLASLONG K, FLOAT alph
#endif
+#ifdef SMP
// Multi-threading execution outperforms (or approaches) the execution of the
// small kernel.
if (num_cpu_avail(3) > 1) {
@@ -77,6 +78,9 @@ int CNAME(int transa, int transb, BLASLONG M, BLASLONG N, BLASLONG K, FLOAT alph
} else {
return 1;
}
+#else
+ return 1;
+#endif
#endif