|
24 | 24 | ret void
|
25 | 25 | }
|
26 | 26 |
|
| 27 | + define amdgpu_kernel void @inflate_result_to_agpr__V_MFMA_F32_32X32X8F16_mac_vgprcd_e64_two_chained_uses_cannot_rewrite_final_use() #0 { |
| 28 | + ret void |
| 29 | + } |
| 30 | + |
27 | 31 | attributes #0 = { "amdgpu-wave-limiter"="true" "amdgpu-waves-per-eu"="8,8" }
|
28 | 32 | ...
|
29 | 33 |
|
@@ -489,3 +493,81 @@ body: |
|
489 | 493 | S_ENDPGM 0
|
490 | 494 |
|
491 | 495 | ...
|
| 496 | + |
| 497 | +--- |
| 498 | +name: inflate_result_to_agpr__V_MFMA_F32_32X32X8F16_mac_vgprcd_e64_two_chained_uses_cannot_rewrite_final_use |
| 499 | +tracksRegLiveness: true |
| 500 | +machineFunctionInfo: |
| 501 | + isEntryFunction: true |
| 502 | + stackPtrOffsetReg: '$sgpr32' |
| 503 | + occupancy: 10 |
| 504 | + sgprForEXECCopy: '$sgpr100_sgpr101' |
| 505 | +body: | |
| 506 | + ; CHECK-LABEL: name: inflate_result_to_agpr__V_MFMA_F32_32X32X8F16_mac_vgprcd_e64_two_chained_uses_cannot_rewrite_final_use |
| 507 | + ; CHECK: bb.0: |
| 508 | + ; CHECK-NEXT: successors: %bb.1(0x80000000) |
| 509 | + ; CHECK-NEXT: {{ $}} |
| 510 | + ; CHECK-NEXT: S_NOP 0, implicit-def $agpr0 |
| 511 | + ; CHECK-NEXT: renamable $sgpr0 = S_MOV_B32 0 |
| 512 | + ; CHECK-NEXT: renamable $vgpr8 = V_MOV_B32_e32 0, implicit $exec |
| 513 | + ; CHECK-NEXT: renamable $sgpr1 = COPY renamable $sgpr0 |
| 514 | + ; CHECK-NEXT: renamable $vgpr0_vgpr1 = COPY killed renamable $sgpr0_sgpr1 |
| 515 | + ; CHECK-NEXT: renamable $vcc = S_AND_B64 $exec, -1, implicit-def dead $scc |
| 516 | + ; CHECK-NEXT: dead renamable $vgpr9 = COPY renamable $vgpr8 |
| 517 | + ; CHECK-NEXT: {{ $}} |
| 518 | + ; CHECK-NEXT: bb.1: |
| 519 | + ; CHECK-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000) |
| 520 | + ; CHECK-NEXT: liveins: $vcc, $vgpr0_vgpr1 |
| 521 | + ; CHECK-NEXT: {{ $}} |
| 522 | + ; CHECK-NEXT: renamable $agpr0_agpr1 = GLOBAL_LOAD_DWORDX2 undef renamable $vgpr0_vgpr1, 0, 0, implicit $exec :: (load (s64), addrspace 1) |
| 523 | + ; CHECK-NEXT: renamable $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 = V_MFMA_F32_32X32X8F16_mac_e64 $vgpr0_vgpr1, $vgpr0_vgpr1, $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15, 0, 0, 0, implicit $mode, implicit $exec |
| 524 | + ; CHECK-NEXT: renamable $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 = V_MFMA_F32_32X32X8F16_mac_e64 $vgpr0_vgpr1, $vgpr0_vgpr1, killed $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15, 0, 0, 0, implicit $mode, implicit $exec |
| 525 | + ; CHECK-NEXT: S_CBRANCH_VCCNZ %bb.1, implicit $vcc |
| 526 | + ; CHECK-NEXT: S_BRANCH %bb.2 |
| 527 | + ; CHECK-NEXT: {{ $}} |
| 528 | + ; CHECK-NEXT: bb.2: |
| 529 | + ; CHECK-NEXT: liveins: $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15:0x00000000FFFFFFFF |
| 530 | + ; CHECK-NEXT: {{ $}} |
| 531 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7 |
| 532 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 |
| 533 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23 |
| 534 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31 |
| 535 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr32_vgpr33_vgpr34_vgpr35_vgpr36_vgpr37_vgpr38_vgpr39 |
| 536 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr40_vgpr41_vgpr42_vgpr43_vgpr44_vgpr45_vgpr46_vgpr47 |
| 537 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr48_vgpr49_vgpr50_vgpr51_vgpr52_vgpr53_vgpr54_vgpr55 |
| 538 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr56_vgpr57_vgpr58_vgpr59_vgpr60_vgpr61_vgpr62_vgpr63 |
| 539 | + ; CHECK-NEXT: renamable $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 = COPY killed renamable $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 |
| 540 | + ; CHECK-NEXT: INLINEASM &"; use $0 ", 1 /* sideeffect attdialect */, 27983881 /* reguse:VReg_512_Align2 */, killed renamable $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 |
| 541 | + ; CHECK-NEXT: S_ENDPGM 0 |
| 542 | + bb.0: |
| 543 | + S_NOP 0, implicit-def $agpr0 |
| 544 | + renamable $sgpr0 = S_MOV_B32 0 |
| 545 | + undef %0.sub8:vreg_512_align2 = V_MOV_B32_e32 0, implicit $exec |
| 546 | + renamable $sgpr1 = COPY renamable $sgpr0 |
| 547 | + %1:vreg_64_align2 = COPY killed renamable $sgpr0_sgpr1 |
| 548 | + renamable $vcc = S_AND_B64 $exec, -1, implicit-def dead $scc |
| 549 | + %0.sub9:vreg_512_align2 = COPY %0.sub8 |
| 550 | +
|
| 551 | + bb.1: |
| 552 | + liveins: $vcc |
| 553 | +
|
| 554 | + undef %0.sub0_sub1:vreg_512_align2 = GLOBAL_LOAD_DWORDX2 undef %3:vreg_64_align2, 0, 0, implicit $exec :: (load (s64), addrspace 1) |
| 555 | + %0:vreg_512_align2 = V_MFMA_F32_32X32X8F16_mac_vgprcd_e64 %1, %1, %0, 0, 0, 0, implicit $mode, implicit $exec |
| 556 | + %0:vreg_512_align2 = V_MFMA_F32_32X32X8F16_mac_vgprcd_e64 %1, %1, %0, 0, 0, 0, implicit $mode, implicit $exec |
| 557 | + S_CBRANCH_VCCNZ %bb.1, implicit $vcc |
| 558 | + S_BRANCH %bb.2 |
| 559 | +
|
| 560 | + bb.2: |
| 561 | + ; No VGPRs available for %0 |
| 562 | + S_NOP 0, implicit-def $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7 |
| 563 | + S_NOP 0, implicit-def $vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 |
| 564 | + S_NOP 0, implicit-def $vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23 |
| 565 | + S_NOP 0, implicit-def $vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31 |
| 566 | + S_NOP 0, implicit-def $vgpr32_vgpr33_vgpr34_vgpr35_vgpr36_vgpr37_vgpr38_vgpr39 |
| 567 | + S_NOP 0, implicit-def $vgpr40_vgpr41_vgpr42_vgpr43_vgpr44_vgpr45_vgpr46_vgpr47 |
| 568 | + S_NOP 0, implicit-def $vgpr48_vgpr49_vgpr50_vgpr51_vgpr52_vgpr53_vgpr54_vgpr55 |
| 569 | + S_NOP 0, implicit-def $vgpr56_vgpr57_vgpr58_vgpr59_vgpr60_vgpr61_vgpr62_vgpr63 |
| 570 | + INLINEASM &"; use $0 ", 1 /* sideeffect attdialect */, 27983881 /* reguse:VReg_512_Align2 */, %0:vreg_512_align2 |
| 571 | + S_ENDPGM 0 |
| 572 | +
|
| 573 | +... |
0 commit comments