@@ -536,8 +536,12 @@ body: |
536
536
...
537
537
# GCN-LABEL: name: dgemm16x16_mfma_write_vgpr_mfma_srca_read_overlap
538
538
# GCN: V_MFMA
539
- # GCN-NEXT: S_NOP 7
540
- # GCN-NEXT: S_NOP 2
539
+ # GFX940-NEXT: S_NOP 7
540
+ # GFX940-NEXT: S_NOP 2
541
+
542
+ # GFX950-NEXT: S_NOP 7
543
+ # GFX950-NEXT: S_NOP 7
544
+ # GFX950-NEXT: S_NOP 2
541
545
# GCN-NEXT: V_MFMA
542
546
name : dgemm16x16_mfma_write_vgpr_mfma_srca_read_overlap
543
547
body : |
@@ -562,7 +566,7 @@ body: |
562
566
563
567
# GFX950-NEXT: S_NOP 7
564
568
# GFX950-NEXT: S_NOP 7
565
- # GFX950-NEXT: S_NOP 0
569
+ # GFX950-NEXT: S_NOP 2
566
570
# GCN-NEXT: V_MFMA
567
571
name : dgemm16x16_mfma_write_vgpr_sgemm_mfma_srca_read_overlap
568
572
body : |
@@ -632,8 +636,12 @@ body: |
632
636
...
633
637
# GCN-LABEL: name: dgemm16x16_mfma_write_vgpr_mfma_srcb_read_overlap
634
638
# GCN: V_MFMA
635
- # GCN-NEXT: S_NOP 7
636
- # GCN-NEXT: S_NOP 2
639
+ # GFX940-NEXT: S_NOP 7
640
+ # GFX940-NEXT: S_NOP 2
641
+
642
+ # GFX950-NEXT: S_NOP 7
643
+ # GFX950-NEXT: S_NOP 7
644
+ # GFX950-NEXT: S_NOP 2
637
645
# GCN-NEXT: V_MFMA
638
646
name : dgemm16x16_mfma_write_vgpr_mfma_srcb_read_overlap
639
647
body : |
@@ -643,8 +651,12 @@ body: |
643
651
...
644
652
# GCN-LABEL: name: dgemm16x16_mfma_write_vgpr_smfmac_srcb_read_overlap
645
653
# GCN: V_MFMA
646
- # GCN-NEXT: S_NOP 7
647
- # GCN-NEXT: S_NOP 2
654
+ # GFX940-NEXT: S_NOP 7
655
+ # GFX940-NEXT: S_NOP 2
656
+
657
+ # GFX950-NEXT: S_NOP 7
658
+ # GFX950-NEXT: S_NOP 7
659
+ # GFX950-NEXT: S_NOP 2
648
660
# GCN-NEXT: V_SMFMAC
649
661
name : dgemm16x16_mfma_write_vgpr_smfmac_srcb_read_overlap
650
662
body : |
@@ -654,8 +666,13 @@ body: |
654
666
...
655
667
# GCN-LABEL: name: dgemm16x16_mfma_write_vgpr_smfmac_srcc_read_overlap
656
668
# GCN: V_MFMA
657
- # GCN-NEXT: S_NOP 7
658
- # GCN-NEXT: S_NOP 2
669
+ # GFX940-NEXT: S_NOP 7
670
+ # GFX940-NEXT: S_NOP 2
671
+
672
+ # GFX950-NEXT: S_NOP 7
673
+ # GFX950-NEXT: S_NOP 7
674
+ # GFX950-NEXT: S_NOP 2
675
+
659
676
# GCN-NEXT: V_SMFMAC
660
677
name : dgemm16x16_mfma_write_vgpr_smfmac_srcc_read_overlap
661
678
body : |
@@ -1452,8 +1469,12 @@ body: |
1452
1469
...
1453
1470
# GCN-LABEL: name: dgemm16x16_mfma_write_agpr_mfma_srca_read_overlap
1454
1471
# GCN: V_MFMA
1455
- # GCN-NEXT: S_NOP 7
1456
- # GCN-NEXT: S_NOP 2
1472
+ # GFX940-NEXT: S_NOP 7
1473
+ # GFX940-NEXT: S_NOP 2
1474
+
1475
+ # GFX950-NEXT: S_NOP 7
1476
+ # GFX950-NEXT: S_NOP 7
1477
+ # GFX950-NEXT: S_NOP 2
1457
1478
# GCN-NEXT: V_MFMA
1458
1479
name : dgemm16x16_mfma_write_agpr_mfma_srca_read_overlap
1459
1480
body : |
@@ -1473,8 +1494,13 @@ body: |
1473
1494
...
1474
1495
# GCN-LABEL: name: dgemm16x16_mfma_write_agpr_sgemm_mfma_srca_read_overlap
1475
1496
# GCN: V_MFMA
1476
- # GCN-NEXT: S_NOP 7
1477
- # GCN-NEXT: S_NOP 2
1497
+ # GFX940-NEXT: S_NOP 7
1498
+ # GFX940-NEXT: S_NOP 2
1499
+
1500
+ # GFX950-NEXT: S_NOP 7
1501
+ # GFX950-NEXT: S_NOP 7
1502
+ # GFX950-NEXT: S_NOP 2
1503
+
1478
1504
# GCN-NEXT: V_MFMA
1479
1505
name : dgemm16x16_mfma_write_agpr_sgemm_mfma_srca_read_overlap
1480
1506
body : |
@@ -1504,8 +1530,12 @@ body: |
1504
1530
...
1505
1531
# GCN-LABEL: name: dgemm16x16_mfma_write_agpr_mfma_srcb_read_overlap
1506
1532
# GCN: V_MFMA
1507
- # GCN-NEXT: S_NOP 7
1508
- # GCN-NEXT: S_NOP 2
1533
+ # GFX940-NEXT: S_NOP 7
1534
+ # GFX940-NEXT: S_NOP 2
1535
+
1536
+ # GFX950-NEXT: S_NOP 7
1537
+ # GFX950-NEXT: S_NOP 7
1538
+ # GFX950-NEXT: S_NOP 2
1509
1539
# GCN-NEXT: V_MFMA
1510
1540
name : dgemm16x16_mfma_write_agpr_mfma_srcb_read_overlap
1511
1541
body : |
0 commit comments