@@ -156,8 +156,6 @@ main_body:
156156 ret void
157157}
158158
159- ; There are 8 pseudo registers defined to track LDS DMA dependencies.
160-
161159define amdgpu_kernel void @buffer_load_lds_dword_10_arrays (<4 x i32 > %rsrc , i32 %i1 , i32 %i2 , i32 %i3 , i32 %i4 , i32 %i5 , i32 %i6 , i32 %i7 , i32 %i8 , i32 %i9 , ptr addrspace (1 ) %out ) {
162160; GFX9-LABEL: buffer_load_lds_dword_10_arrays:
163161; GFX9: ; %bb.0: ; %main_body
@@ -226,6 +224,7 @@ define amdgpu_kernel void @buffer_load_lds_dword_10_arrays(<4 x i32> %rsrc, i32
226224; GFX9-NEXT: s_waitcnt vmcnt(0)
227225; GFX9-NEXT: ds_read_b32 v8, v9 offset:2048
228226; GFX9-NEXT: ; wave barrier
227+ ; GFX9-NEXT: s_waitcnt vmcnt(0)
229228; GFX9-NEXT: ds_read_b32 v9, v9 offset:2304
230229; GFX9-NEXT: s_waitcnt lgkmcnt(0)
231230; GFX9-NEXT: global_store_dwordx4 v10, v[0:3], s[0:1]
@@ -292,6 +291,7 @@ define amdgpu_kernel void @buffer_load_lds_dword_10_arrays(<4 x i32> %rsrc, i32
292291; GFX10-NEXT: s_waitcnt vmcnt(0)
293292; GFX10-NEXT: ds_read_b32 v8, v9 offset:2048
294293; GFX10-NEXT: ; wave barrier
294+ ; GFX10-NEXT: s_waitcnt vmcnt(0)
295295; GFX10-NEXT: ds_read_b32 v9, v9 offset:2304
296296; GFX10-NEXT: s_waitcnt lgkmcnt(0)
297297; GFX10-NEXT: global_store_dwordx4 v10, v[0:3], s[0:1]
0 commit comments