@@ -84,8 +84,6 @@ define amdgpu_kernel void @lds_atomic_inc_ret_i32(ptr addrspace(1) %out, ptr add
8484; GFX11-NEXT: buffer_gl0_inv
8585; GFX11-NEXT: v_mov_b32_e32 v1, 0
8686; GFX11-NEXT: global_store_b32 v1, v0, s[0:1]
87- ; GFX11-NEXT: s_nop 0
88- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
8987; GFX11-NEXT: s_endpgm
9088 %result = atomicrmw uinc_wrap ptr addrspace (3 ) %ptr , i32 42 syncscope("agent" ) seq_cst , align 4
9189 store i32 %result , ptr addrspace (1 ) %out , align 4
@@ -163,8 +161,6 @@ define amdgpu_kernel void @lds_atomic_inc_ret_i32_offset(ptr addrspace(1) %out,
163161; GFX11-NEXT: buffer_gl0_inv
164162; GFX11-NEXT: v_mov_b32_e32 v1, 0
165163; GFX11-NEXT: global_store_b32 v1, v0, s[0:1]
166- ; GFX11-NEXT: s_nop 0
167- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
168164; GFX11-NEXT: s_endpgm
169165 %gep = getelementptr i32 , ptr addrspace (3 ) %ptr , i32 4
170166 %result = atomicrmw uinc_wrap ptr addrspace (3 ) %gep , i32 42 syncscope("agent" ) seq_cst , align 4
@@ -353,8 +349,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i32(ptr addrspace(1) %out, ptr
353349; GFX11-NEXT: buffer_gl1_inv
354350; GFX11-NEXT: buffer_gl0_inv
355351; GFX11-NEXT: global_store_b32 v1, v0, s[0:1]
356- ; GFX11-NEXT: s_nop 0
357- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
358352; GFX11-NEXT: s_endpgm
359353 %result = atomicrmw uinc_wrap ptr addrspace (1 ) %ptr , i32 42 syncscope("agent" ) seq_cst , align 4
360354 store i32 %result , ptr addrspace (1 ) %out , align 4
@@ -431,8 +425,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i32_offset(ptr addrspace(1) %ou
431425; GFX11-NEXT: buffer_gl1_inv
432426; GFX11-NEXT: buffer_gl0_inv
433427; GFX11-NEXT: global_store_b32 v1, v0, s[0:1]
434- ; GFX11-NEXT: s_nop 0
435- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
436428; GFX11-NEXT: s_endpgm
437429 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i32 4
438430 %result = atomicrmw uinc_wrap ptr addrspace (1 ) %gep , i32 42 syncscope("agent" ) seq_cst , align 4
@@ -510,8 +502,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i32_offset_sistem(ptr addrspace
510502; GFX11-NEXT: buffer_gl1_inv
511503; GFX11-NEXT: buffer_gl0_inv
512504; GFX11-NEXT: global_store_b32 v1, v0, s[0:1]
513- ; GFX11-NEXT: s_nop 0
514- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
515505; GFX11-NEXT: s_endpgm
516506 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i32 4
517507 %result = atomicrmw uinc_wrap ptr addrspace (1 ) %gep , i32 42 seq_cst , align 4
@@ -797,8 +787,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i32_offset_addr64(ptr addrspace
797787; GFX11-NEXT: buffer_gl1_inv
798788; GFX11-NEXT: buffer_gl0_inv
799789; GFX11-NEXT: global_store_b32 v0, v1, s[0:1]
800- ; GFX11-NEXT: s_nop 0
801- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
802790; GFX11-NEXT: s_endpgm
803791 %id = call i32 @llvm.amdgcn.workitem.id.x ()
804792 %gep.tid = getelementptr i32 , ptr addrspace (1 ) %ptr , i32 %id
@@ -967,8 +955,6 @@ define amdgpu_kernel void @atomic_inc_shl_base_lds_0_i32(ptr addrspace(1) %out,
967955; GFX11-NEXT: s_clause 0x1
968956; GFX11-NEXT: global_store_b32 v2, v0, s[2:3]
969957; GFX11-NEXT: global_store_b32 v2, v1, s[0:1]
970- ; GFX11-NEXT: s_nop 0
971- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
972958; GFX11-NEXT: s_endpgm
973959 %tid.x = tail call i32 @llvm.amdgcn.workitem.id.x () #2
974960 %idx.0 = add nsw i32 %tid.x , 2
@@ -1055,8 +1041,6 @@ define amdgpu_kernel void @lds_atomic_inc_ret_i64(ptr addrspace(1) %out, ptr add
10551041; GFX11-NEXT: buffer_gl0_inv
10561042; GFX11-NEXT: v_mov_b32_e32 v2, 0
10571043; GFX11-NEXT: global_store_b64 v2, v[0:1], s[0:1]
1058- ; GFX11-NEXT: s_nop 0
1059- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
10601044; GFX11-NEXT: s_endpgm
10611045 %result = atomicrmw uinc_wrap ptr addrspace (3 ) %ptr , i64 42 syncscope("agent" ) seq_cst , align 8
10621046 store i64 %result , ptr addrspace (1 ) %out , align 4
@@ -1139,8 +1123,6 @@ define amdgpu_kernel void @lds_atomic_inc_ret_i64_offset(ptr addrspace(1) %out,
11391123; GFX11-NEXT: buffer_gl0_inv
11401124; GFX11-NEXT: v_mov_b32_e32 v2, 0
11411125; GFX11-NEXT: global_store_b64 v2, v[0:1], s[0:1]
1142- ; GFX11-NEXT: s_nop 0
1143- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
11441126; GFX11-NEXT: s_endpgm
11451127 %gep = getelementptr i64 , ptr addrspace (3 ) %ptr , i32 4
11461128 %result = atomicrmw uinc_wrap ptr addrspace (3 ) %gep , i64 42 syncscope("agent" ) seq_cst , align 8
@@ -1344,8 +1326,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i64(ptr addrspace(1) %out, ptr
13441326; GFX11-NEXT: buffer_gl1_inv
13451327; GFX11-NEXT: buffer_gl0_inv
13461328; GFX11-NEXT: global_store_b64 v2, v[0:1], s[0:1]
1347- ; GFX11-NEXT: s_nop 0
1348- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
13491329; GFX11-NEXT: s_endpgm
13501330 %result = atomicrmw uinc_wrap ptr addrspace (1 ) %ptr , i64 42 syncscope("agent" ) seq_cst , align 8
13511331 store i64 %result , ptr addrspace (1 ) %out , align 4
@@ -1427,8 +1407,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i64_offset(ptr addrspace(1) %ou
14271407; GFX11-NEXT: buffer_gl1_inv
14281408; GFX11-NEXT: buffer_gl0_inv
14291409; GFX11-NEXT: global_store_b64 v2, v[0:1], s[0:1]
1430- ; GFX11-NEXT: s_nop 0
1431- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
14321410; GFX11-NEXT: s_endpgm
14331411 %gep = getelementptr i64 , ptr addrspace (1 ) %ptr , i32 4
14341412 %result = atomicrmw uinc_wrap ptr addrspace (1 ) %gep , i64 42 syncscope("agent" ) seq_cst , align 8
@@ -1511,8 +1489,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i64_offset_system(ptr addrspace
15111489; GFX11-NEXT: buffer_gl1_inv
15121490; GFX11-NEXT: buffer_gl0_inv
15131491; GFX11-NEXT: global_store_b64 v2, v[0:1], s[0:1]
1514- ; GFX11-NEXT: s_nop 0
1515- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
15161492; GFX11-NEXT: s_endpgm
15171493 %gep = getelementptr i64 , ptr addrspace (1 ) %ptr , i32 4
15181494 %result = atomicrmw uinc_wrap ptr addrspace (1 ) %gep , i64 42 seq_cst , align 8
@@ -1818,8 +1794,6 @@ define amdgpu_kernel void @global_atomic_inc_ret_i64_offset_addr64(ptr addrspace
18181794; GFX11-NEXT: buffer_gl1_inv
18191795; GFX11-NEXT: buffer_gl0_inv
18201796; GFX11-NEXT: global_store_b64 v2, v[0:1], s[0:1]
1821- ; GFX11-NEXT: s_nop 0
1822- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
18231797; GFX11-NEXT: s_endpgm
18241798 %id = call i32 @llvm.amdgcn.workitem.id.x ()
18251799 %gep.tid = getelementptr i64 , ptr addrspace (1 ) %ptr , i32 %id
@@ -2680,8 +2654,6 @@ define amdgpu_kernel void @atomic_inc_shl_base_lds_0_i64(ptr addrspace(1) %out,
26802654; GFX11-NEXT: s_clause 0x1
26812655; GFX11-NEXT: global_store_b32 v3, v2, s[2:3]
26822656; GFX11-NEXT: global_store_b64 v3, v[0:1], s[0:1]
2683- ; GFX11-NEXT: s_nop 0
2684- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
26852657; GFX11-NEXT: s_endpgm
26862658 %tid.x = tail call i32 @llvm.amdgcn.workitem.id.x () #2
26872659 %idx.0 = add nsw i32 %tid.x , 2
@@ -3541,8 +3513,6 @@ define amdgpu_kernel void @nocse_lds_atomic_inc_ret_i32(ptr addrspace(1) %out0,
35413513; GFX11-NEXT: s_clause 0x1
35423514; GFX11-NEXT: global_store_b32 v1, v2, s[0:1]
35433515; GFX11-NEXT: global_store_b32 v1, v0, s[2:3]
3544- ; GFX11-NEXT: s_nop 0
3545- ; GFX11-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
35463516; GFX11-NEXT: s_endpgm
35473517 %result0 = atomicrmw uinc_wrap ptr addrspace (3 ) %ptr , i32 42 syncscope("agent" ) seq_cst , align 4
35483518 %result1 = atomicrmw uinc_wrap ptr addrspace (3 ) %ptr , i32 42 syncscope("agent" ) seq_cst , align 4
0 commit comments