summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: wjc404 <52632443+wjc404@users.noreply.github.com>, 2019-07-17 22:39:15 +0800
committer: GitHub <noreply@github.com>, 2019-07-17 22:39:15 +0800
commit: 211ab03b1402a3c39311b7ca769aaad736ca554c (patch)
tree: a5a5210ea33c69657f1366519b90e6b02b2b4a3e
parent: 1733f927e6b892610bda045538a42d495faa1af5 (diff)
download: openblas-211ab03b1402a3c39311b7ca769aaad736ca554c.tar.gz
openblas-211ab03b1402a3c39311b7ca769aaad736ca554c.tar.bz2
openblas-211ab03b1402a3c39311b7ca769aaad736ca554c.zip
Update dgemm_kernel_4x8_haswell.S
-rw-r--r-- kernel/x86_64/dgemm_kernel_4x8_haswell.S | 7
1 files changed, 4 insertions, 3 deletions
diff --git a/kernel/x86_64/dgemm_kernel_4x8_haswell.S b/kernel/x86_64/dgemm_kernel_4x8_haswell.S
index b30ecccea..3f7f9a98e 100644
--- a/kernel/x86_64/dgemm_kernel_4x8_haswell.S
+++ b/kernel/x86_64/dgemm_kernel_4x8_haswell.S
@@ -267,23 +267,24 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
.macro SAVE4x12
+ prefetcht0 128(%rsp) /*BUFFER 1*/
vbroadcastsd ALPHA, %ymm0
vmulpd %ymm0 , %ymm4 , %ymm4
vmulpd %ymm0 , %ymm5 , %ymm5
vmulpd %ymm0 , %ymm6 , %ymm6
vmulpd %ymm0 , %ymm7 , %ymm7
-
+ prefetcht0 192(%rsp)
vmulpd %ymm0 , %ymm8 , %ymm8
vmulpd %ymm0 , %ymm9 , %ymm9
vmulpd %ymm0 , %ymm10, %ymm10
vmulpd %ymm0 , %ymm11, %ymm11
-
+ prefetcht0 256(%rsp)
vmulpd %ymm0 , %ymm12, %ymm12
vmulpd %ymm0 , %ymm13, %ymm13
vmulpd %ymm0 , %ymm14, %ymm14
vmulpd %ymm0 , %ymm15, %ymm15
-
+ prefetcht0 320(%rsp)
vpermilpd $ 0x05 , %ymm5, %ymm5
vpermilpd $ 0x05 , %ymm7, %ymm7