summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de> 2018-12-03 13:06:43 +0100
committer: GitHub <noreply@github.com> 2018-12-03 13:06:43 +0100
commit: 701ea88347461e4c5d896765438dc870281b3834 (patch)
tree: 115afc11b9a21085cb0498c38bcbc7e8d7b00097
parent: 721c56c224fb3ae9db64f4c673c8b5a375ef4e3d (diff)
download: openblas-701ea88347461e4c5d896765438dc870281b3834.tar.gz
openblas-701ea88347461e4c5d896765438dc870281b3834.tar.bz2
openblas-701ea88347461e4c5d896765438dc870281b3834.zip
Use p2align instead of align for OSX compatibility
fixes #1902
-rw-r--r-- kernel/x86_64/dgemm_kernel_4x8_skylakex.c 6
1 file changed, 3 insertions, 3 deletions
diff --git a/kernel/x86_64/dgemm_kernel_4x8_skylakex.c b/kernel/x86_64/dgemm_kernel_4x8_skylakex.c
index a83ca98fa..6257e569e 100644
--- a/kernel/x86_64/dgemm_kernel_4x8_skylakex.c
+++ b/kernel/x86_64/dgemm_kernel_4x8_skylakex.c
@@ -869,7 +869,7 @@ CNAME(BLASLONG m, BLASLONG n, BLASLONG k, double alpha, double * __restrict__ A,
"vmovapd %%zmm1, %%zmm27\n"
"vmovapd %%zmm1, %%zmm28\n"
"jmp .label24\n"
- ".align 32\n"
+ ".p2align 5\n"
/* Inner math loop */
".label24:\n"
"vmovupd -128(%[AO]),%%zmm0\n"
@@ -1037,7 +1037,7 @@ CNAME(BLASLONG m, BLASLONG n, BLASLONG k, double alpha, double * __restrict__ A,
"vmovapd %%zmm1, %%zmm17\n"
"vmovapd %%zmm1, %%zmm18\n"
"jmp .label16\n"
- ".align 32\n"
+ ".p2align 5\n"
/* Inner math loop */
".label16:\n"
"vmovupd -128(%[AO]),%%zmm0\n"
@@ -1165,7 +1165,7 @@ CNAME(BLASLONG m, BLASLONG n, BLASLONG k, double alpha, double * __restrict__ A,
"vmovapd %%zmm1, %%zmm8\n"
"vbroadcastsd (%[alpha]), %%zmm9\n"
"jmp .label1\n"
- ".align 32\n"
+ ".p2align 5\n"
/* Inner math loop */
".label1:\n"
"vmovupd -128(%[AO]),%%zmm0\n"