Skip to content

Commit 182b06d

Browse files
authored
Update dgemm_kernel_4x8_haswell.S
1 parent 7a9050d commit 182b06d

File tree

1 file changed: 20 additions and 20 deletions.

kernel/x86_64/dgemm_kernel_4x8_haswell.S

Lines changed: 20 additions & 20 deletions
Original file line number | Diff line number | Diff line change
@@ -317,10 +317,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
317317
vmovups %ymm6 , (%rax)
318318
vmovups %ymm7 , (%rax, LDC)
319319

320-
prefetcht0 32(CO1)
321-
prefetcht0 32(CO1,LDC)
322-
prefetcht0 32(%rax)
323-
prefetcht0 32(%rax,LDC)
320+
prefetcht0 56(CO1)
321+
prefetcht0 56(CO1,LDC)
322+
prefetcht0 56(%rax)
323+
prefetcht0 56(%rax,LDC)
324324

325325
vpermilpd $ 0x05 , %ymm9 , %ymm9
326326
vpermilpd $ 0x05 , %ymm11, %ymm11
@@ -356,10 +356,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
356356
vmovups %ymm6 , (%rbp)
357357
vmovups %ymm7 , (%rbp, LDC)
358358

359-
prefetcht0 32(%rax)
360-
prefetcht0 32(%rax,LDC)
361-
prefetcht0 32(%rbp)
362-
prefetcht0 32(%rbp,LDC)
359+
prefetcht0 56(%rax)
360+
prefetcht0 56(%rax,LDC)
361+
prefetcht0 56(%rbp)
362+
prefetcht0 56(%rbp,LDC)
363363

364364
vpermilpd $ 0x05 , %ymm13, %ymm13
365365
vpermilpd $ 0x05 , %ymm15, %ymm15
@@ -395,10 +395,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
395395
vmovups %ymm6 , (%rbp)
396396
vmovups %ymm7 , (%rbp, LDC)
397397

398-
prefetcht0 32(%rax)
399-
prefetcht0 32(%rax,LDC)
400-
prefetcht0 32(%rbp)
401-
prefetcht0 32(%rbp,LDC)
398+
prefetcht0 56(%rax)
399+
prefetcht0 56(%rax,LDC)
400+
prefetcht0 56(%rbp)
401+
prefetcht0 56(%rbp,LDC)
402402

403403
addq $ 4*SIZE, CO1
404404
.endm
@@ -826,10 +826,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
826826
vmovups %ymm6 , (%rax)
827827
vmovups %ymm7 , (%rax, LDC)
828828

829-
prefetcht0 32(CO1)
830-
prefetcht0 32(CO1,LDC)
831-
prefetcht0 32(%rax)
832-
prefetcht0 32(%rax,LDC)
829+
prefetcht0 56(CO1)
830+
prefetcht0 56(CO1,LDC)
831+
prefetcht0 56(%rax)
832+
prefetcht0 56(%rax,LDC)
833833

834834
vpermilpd $ 0x05 , %ymm9 , %ymm9
835835
vpermilpd $ 0x05 , %ymm11, %ymm11
@@ -865,10 +865,10 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
865865
vmovups %ymm6 , (%rbp)
866866
vmovups %ymm7 , (%rbp, LDC)
867867

868-
prefetcht0 32(%rax)
869-
prefetcht0 32(%rax,LDC)
870-
prefetcht0 32(%rbp)
871-
prefetcht0 32(%rbp,LDC)
868+
prefetcht0 56(%rax)
869+
prefetcht0 56(%rax,LDC)
870+
prefetcht0 56(%rbp)
871+
prefetcht0 56(%rbp,LDC)
872872

873873
addq $ 4*SIZE, CO1
874874
.endm

0 commit comments

Comments
 (0)