@@ -495,17 +495,17 @@ define amdgpu_kernel void @usage_direct_recursion(i32 %n) #0 {
495495; GCN: NumVgprs: max(43, multi_stage_recurse1.num_vgpr)
496496; GCN: ScratchSize: 16+max(multi_stage_recurse1.private_seg_size)
497497; GCN-LABEL: {{^}}multi_stage_recurse1:
498- ; GCN: .set multi_stage_recurse1.num_vgpr, max(48, amdgpu.max_num_vgpr )
499- ; GCN: .set multi_stage_recurse1.num_agpr, max(0, amdgpu.max_num_agpr )
500- ; GCN: .set multi_stage_recurse1.numbered_sgpr, max(34, amdgpu.max_num_sgpr )
498+ ; GCN: .set multi_stage_recurse1.num_vgpr, max(48, 43 )
499+ ; GCN: .set multi_stage_recurse1.num_agpr, max(0, 0 )
500+ ; GCN: .set multi_stage_recurse1.numbered_sgpr, max(34, 34 )
501501; GCN: .set multi_stage_recurse1.private_seg_size, 16
502502; GCN: .set multi_stage_recurse1.uses_vcc, 1
503503; GCN: .set multi_stage_recurse1.uses_flat_scratch, 0
504504; GCN: .set multi_stage_recurse1.has_dyn_sized_stack, 0
505505; GCN: .set multi_stage_recurse1.has_recursion, 1
506506; GCN: .set multi_stage_recurse1.has_indirect_call, 0
507- ; GCN: TotalNumSgprs: multi_stage_recurse1.numbered_sgpr+4
508- ; GCN: NumVgprs: max(48, amdgpu.max_num_vgpr)
507+ ; GCN: TotalNumSgprs: 38
508+ ; GCN: NumVgprs: 48
509509; GCN: ScratchSize: 16
510510define void @multi_stage_recurse1 (i32 %val ) #2 {
511511 call void @multi_stage_recurse2 (i32 %val )
@@ -528,8 +528,8 @@ define void @multi_stage_recurse2(i32 %val) #2 {
528528; GCN: .set usage_multi_stage_recurse.has_dyn_sized_stack, or(0, multi_stage_recurse1.has_dyn_sized_stack)
529529; GCN: .set usage_multi_stage_recurse.has_recursion, or(1, multi_stage_recurse1.has_recursion)
530530; GCN: .set usage_multi_stage_recurse.has_indirect_call, or(0, multi_stage_recurse1.has_indirect_call)
531- ; GCN: TotalNumSgprs: usage_multi_stage_recurse.numbered_sgpr+6
532- ; GCN: NumVgprs: usage_multi_stage_recurse.num_vgpr
531+ ; GCN: TotalNumSgprs: 40
532+ ; GCN: NumVgprs: 48
533533; GCN: ScratchSize: 16
534534define amdgpu_kernel void @usage_multi_stage_recurse (i32 %n ) #0 {
535535 call void @multi_stage_recurse1 (i32 %n )
@@ -550,17 +550,17 @@ define amdgpu_kernel void @usage_multi_stage_recurse(i32 %n) #0 {
550550; GCN: NumVgprs: max(41, multi_stage_recurse_noattr1.num_vgpr)
551551; GCN: ScratchSize: 16+max(multi_stage_recurse_noattr1.private_seg_size)
552552; GCN-LABEL: {{^}}multi_stage_recurse_noattr1:
553- ; GCN: .set multi_stage_recurse_noattr1.num_vgpr, max(41, amdgpu.max_num_vgpr )
554- ; GCN: .set multi_stage_recurse_noattr1.num_agpr, max(0, amdgpu.max_num_agpr )
555- ; GCN: .set multi_stage_recurse_noattr1.numbered_sgpr, max(57, amdgpu.max_num_sgpr )
553+ ; GCN: .set multi_stage_recurse_noattr1.num_vgpr, max(41, 41 )
554+ ; GCN: .set multi_stage_recurse_noattr1.num_agpr, max(0, 0 )
555+ ; GCN: .set multi_stage_recurse_noattr1.numbered_sgpr, max(57, 54 )
556556; GCN: .set multi_stage_recurse_noattr1.private_seg_size, 16
557557; GCN: .set multi_stage_recurse_noattr1.uses_vcc, 1
558558; GCN: .set multi_stage_recurse_noattr1.uses_flat_scratch, 0
559559; GCN: .set multi_stage_recurse_noattr1.has_dyn_sized_stack, 0
560560; GCN: .set multi_stage_recurse_noattr1.has_recursion, 0
561561; GCN: .set multi_stage_recurse_noattr1.has_indirect_call, 0
562- ; GCN: TotalNumSgprs: multi_stage_recurse_noattr1.numbered_sgpr+4
563- ; GCN: NumVgprs: max(41, amdgpu.max_num_vgpr)
562+ ; GCN: TotalNumSgprs: 61
563+ ; GCN: NumVgprs: 41
564564; GCN: ScratchSize: 16
565565define void @multi_stage_recurse_noattr1 (i32 %val ) #0 {
566566 call void @multi_stage_recurse_noattr2 (i32 %val )
@@ -583,8 +583,8 @@ define void @multi_stage_recurse_noattr2(i32 %val) #0 {
583583; GCN: .set usage_multi_stage_recurse_noattrs.has_dyn_sized_stack, or(0, multi_stage_recurse_noattr1.has_dyn_sized_stack)
584584; GCN: .set usage_multi_stage_recurse_noattrs.has_recursion, or(0, multi_stage_recurse_noattr1.has_recursion)
585585; GCN: .set usage_multi_stage_recurse_noattrs.has_indirect_call, or(0, multi_stage_recurse_noattr1.has_indirect_call)
586- ; GCN: TotalNumSgprs: usage_multi_stage_recurse_noattrs.numbered_sgpr+6
587- ; GCN: NumVgprs: usage_multi_stage_recurse_noattrs.num_vgpr
586+ ; GCN: TotalNumSgprs: 63
587+ ; GCN: NumVgprs: 41
588588; GCN: ScratchSize: 16
589589define amdgpu_kernel void @usage_multi_stage_recurse_noattrs (i32 %n ) #0 {
590590 call void @multi_stage_recurse_noattr1 (i32 %n )
@@ -601,8 +601,8 @@ define amdgpu_kernel void @usage_multi_stage_recurse_noattrs(i32 %n) #0 {
601601; GCN: .set multi_call_with_multi_stage_recurse.has_dyn_sized_stack, or(0, use_stack0.has_dyn_sized_stack, use_stack1.has_dyn_sized_stack, multi_stage_recurse1.has_dyn_sized_stack)
602602; GCN: .set multi_call_with_multi_stage_recurse.has_recursion, or(1, use_stack0.has_recursion, use_stack1.has_recursion, multi_stage_recurse1.has_recursion)
603603; GCN: .set multi_call_with_multi_stage_recurse.has_indirect_call, or(0, use_stack0.has_indirect_call, use_stack1.has_indirect_call, multi_stage_recurse1.has_indirect_call)
604- ; GCN: TotalNumSgprs: multi_call_with_multi_stage_recurse.numbered_sgpr+6
605- ; GCN: NumVgprs: multi_call_with_multi_stage_recurse.num_vgpr
604+ ; GCN: TotalNumSgprs: 59
605+ ; GCN: NumVgprs: 48
606606; GCN: ScratchSize: 2052
607607define amdgpu_kernel void @multi_call_with_multi_stage_recurse (i32 %n ) #0 {
608608 call void @use_stack0 ()
0 commit comments