|
16 | 16 | ret void
|
17 | 17 | }
|
18 | 18 |
|
| 19 | + define amdgpu_kernel void @inflate_result_to_agpr__V_MFMA_F32_32X32X8F16_mac_vgprcd_e64_two_chained_uses_cannot_rewrite_final_use() #0 { |
| 20 | + ret void |
| 21 | + } |
| 22 | + |
19 | 23 | attributes #0 = { "amdgpu-wave-limiter"="true" "amdgpu-waves-per-eu"="8,8" }
|
20 | 24 | ...
|
21 | 25 |
|
@@ -311,3 +315,81 @@ body: |
|
311 | 315 | $agpr0 = COPY %0
|
312 | 316 |
|
313 | 317 | ...
|
| 318 | + |
| 319 | +--- |
| 320 | +name: inflate_result_to_agpr__V_MFMA_F32_32X32X8F16_mac_vgprcd_e64_two_chained_uses_cannot_rewrite_final_use |
| 321 | +tracksRegLiveness: true |
| 322 | +machineFunctionInfo: |
| 323 | + isEntryFunction: true |
| 324 | + stackPtrOffsetReg: '$sgpr32' |
| 325 | + occupancy: 10 |
| 326 | + sgprForEXECCopy: '$sgpr100_sgpr101' |
| 327 | +body: | |
| 328 | + ; CHECK-LABEL: name: inflate_result_to_agpr__V_MFMA_F32_32X32X8F16_mac_vgprcd_e64_two_chained_uses_cannot_rewrite_final_use |
| 329 | + ; CHECK: bb.0: |
| 330 | + ; CHECK-NEXT: successors: %bb.1(0x80000000) |
| 331 | + ; CHECK-NEXT: {{ $}} |
| 332 | + ; CHECK-NEXT: S_NOP 0, implicit-def $agpr0 |
| 333 | + ; CHECK-NEXT: renamable $sgpr0 = S_MOV_B32 0 |
| 334 | + ; CHECK-NEXT: renamable $vgpr8 = V_MOV_B32_e32 0, implicit $exec |
| 335 | + ; CHECK-NEXT: renamable $sgpr1 = COPY renamable $sgpr0 |
| 336 | + ; CHECK-NEXT: renamable $vgpr0_vgpr1 = COPY killed renamable $sgpr0_sgpr1 |
| 337 | + ; CHECK-NEXT: renamable $vcc = S_AND_B64 $exec, -1, implicit-def dead $scc |
| 338 | + ; CHECK-NEXT: dead renamable $vgpr9 = COPY renamable $vgpr8 |
| 339 | + ; CHECK-NEXT: {{ $}} |
| 340 | + ; CHECK-NEXT: bb.1: |
| 341 | + ; CHECK-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000) |
| 342 | + ; CHECK-NEXT: liveins: $vcc, $vgpr0_vgpr1 |
| 343 | + ; CHECK-NEXT: {{ $}} |
| 344 | + ; CHECK-NEXT: renamable $agpr0_agpr1 = GLOBAL_LOAD_DWORDX2 undef renamable $vgpr0_vgpr1, 0, 0, implicit $exec :: (load (s64), addrspace 1) |
| 345 | + ; CHECK-NEXT: renamable $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 = V_MFMA_F32_32X32X8F16_mac_e64 $vgpr0_vgpr1, $vgpr0_vgpr1, $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15, 0, 0, 0, implicit $mode, implicit $exec |
| 346 | + ; CHECK-NEXT: renamable $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 = V_MFMA_F32_32X32X8F16_mac_e64 $vgpr0_vgpr1, $vgpr0_vgpr1, killed $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15, 0, 0, 0, implicit $mode, implicit $exec |
| 347 | + ; CHECK-NEXT: S_CBRANCH_VCCNZ %bb.1, implicit $vcc |
| 348 | + ; CHECK-NEXT: S_BRANCH %bb.2 |
| 349 | + ; CHECK-NEXT: {{ $}} |
| 350 | + ; CHECK-NEXT: bb.2: |
| 351 | + ; CHECK-NEXT: liveins: $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15:0x00000000FFFFFFFF |
| 352 | + ; CHECK-NEXT: {{ $}} |
| 353 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7 |
| 354 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 |
| 355 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23 |
| 356 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31 |
| 357 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr32_vgpr33_vgpr34_vgpr35_vgpr36_vgpr37_vgpr38_vgpr39 |
| 358 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr40_vgpr41_vgpr42_vgpr43_vgpr44_vgpr45_vgpr46_vgpr47 |
| 359 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr48_vgpr49_vgpr50_vgpr51_vgpr52_vgpr53_vgpr54_vgpr55 |
| 360 | + ; CHECK-NEXT: S_NOP 0, implicit-def $vgpr56_vgpr57_vgpr58_vgpr59_vgpr60_vgpr61_vgpr62_vgpr63 |
| 361 | + ; CHECK-NEXT: renamable $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 = COPY killed renamable $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 |
| 362 | + ; CHECK-NEXT: INLINEASM &"; use $0 ", 1 /* sideeffect attdialect */, 27983881 /* reguse:VReg_512_Align2 */, killed renamable $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 |
| 363 | + ; CHECK-NEXT: S_ENDPGM 0 |
| 364 | + bb.0: |
| 365 | + S_NOP 0, implicit-def $agpr0 |
| 366 | + renamable $sgpr0 = S_MOV_B32 0 |
| 367 | + undef %0.sub8:vreg_512_align2 = V_MOV_B32_e32 0, implicit $exec |
| 368 | + renamable $sgpr1 = COPY renamable $sgpr0 |
| 369 | + %1:vreg_64_align2 = COPY killed renamable $sgpr0_sgpr1 |
| 370 | + renamable $vcc = S_AND_B64 $exec, -1, implicit-def dead $scc |
| 371 | + %0.sub9:vreg_512_align2 = COPY %0.sub8 |
| 372 | +
|
| 373 | + bb.1: |
| 374 | + liveins: $vcc |
| 375 | +
|
| 376 | + undef %0.sub0_sub1:vreg_512_align2 = GLOBAL_LOAD_DWORDX2 undef %3:vreg_64_align2, 0, 0, implicit $exec :: (load (s64), addrspace 1) |
| 377 | + %0:vreg_512_align2 = V_MFMA_F32_32X32X8F16_mac_vgprcd_e64 %1, %1, %0, 0, 0, 0, implicit $mode, implicit $exec |
| 378 | + %0:vreg_512_align2 = V_MFMA_F32_32X32X8F16_mac_vgprcd_e64 %1, %1, %0, 0, 0, 0, implicit $mode, implicit $exec |
| 379 | + S_CBRANCH_VCCNZ %bb.1, implicit $vcc |
| 380 | + S_BRANCH %bb.2 |
| 381 | +
|
| 382 | + bb.2: |
| 383 | + ; No VGPRs available for %0 |
| 384 | + S_NOP 0, implicit-def $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7 |
| 385 | + S_NOP 0, implicit-def $vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15 |
| 386 | + S_NOP 0, implicit-def $vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23 |
| 387 | + S_NOP 0, implicit-def $vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31 |
| 388 | + S_NOP 0, implicit-def $vgpr32_vgpr33_vgpr34_vgpr35_vgpr36_vgpr37_vgpr38_vgpr39 |
| 389 | + S_NOP 0, implicit-def $vgpr40_vgpr41_vgpr42_vgpr43_vgpr44_vgpr45_vgpr46_vgpr47 |
| 390 | + S_NOP 0, implicit-def $vgpr48_vgpr49_vgpr50_vgpr51_vgpr52_vgpr53_vgpr54_vgpr55 |
| 391 | + S_NOP 0, implicit-def $vgpr56_vgpr57_vgpr58_vgpr59_vgpr60_vgpr61_vgpr62_vgpr63 |
| 392 | + INLINEASM &"; use $0 ", 1 /* sideeffect attdialect */, 27983881 /* reguse:VReg_512_Align2 */, %0:vreg_512_align2 |
| 393 | + S_ENDPGM 0 |
| 394 | +
|
| 395 | +... |
0 commit comments