@@ -124,6 +124,7 @@ define void @test_flat_amdgcn_cooperative_atomic_store_32x4B_release(ptr noundef
124124; GFX1250: ; %bb.0: ; %entry
125125; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
126126; GFX1250-NEXT: s_wait_kmcnt 0x0
127+ ; GFX1250-NEXT: s_wait_storecnt 0x0
127128; GFX1250-NEXT: flat_store_b32 v[0:1], v2 scope:SCOPE_DEV
128129; GFX1250-NEXT: s_wait_dscnt 0x0
129130; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -137,6 +138,7 @@ define void @test_flat_amdgcn_cooperative_atomic_store_16x8B_release(ptr noundef
137138; GFX1250: ; %bb.0: ; %entry
138139; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
139140; GFX1250-NEXT: s_wait_kmcnt 0x0
141+ ; GFX1250-NEXT: s_wait_storecnt 0x0
140142; GFX1250-NEXT: flat_store_b64 v[0:1], v[2:3] scope:SCOPE_DEV
141143; GFX1250-NEXT: s_wait_dscnt 0x0
142144; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -150,6 +152,7 @@ define void @test_flat_amdgcn_cooperative_atomic_store_8x16B_release(ptr noundef
150152; GFX1250: ; %bb.0: ; %entry
151153; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
152154; GFX1250-NEXT: s_wait_kmcnt 0x0
155+ ; GFX1250-NEXT: s_wait_storecnt 0x0
153156; GFX1250-NEXT: flat_store_b128 v[0:1], v[2:5] scope:SCOPE_DEV
154157; GFX1250-NEXT: s_wait_dscnt 0x0
155158; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -163,6 +166,7 @@ define i32 @test_flat_amdgcn_cooperative_atomic_load_32x4B_seq_cst(ptr noundef r
163166; GFX1250: ; %bb.0: ; %entry
164167; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
165168; GFX1250-NEXT: s_wait_kmcnt 0x0
169+ ; GFX1250-NEXT: s_wait_storecnt 0x0
166170; GFX1250-NEXT: flat_load_b32 v0, v[0:1] scope:SCOPE_DEV
167171; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
168172; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -176,6 +180,7 @@ define <2 x i32> @test_flat_amdgcn_cooperative_atomic_load_16x8B_seq_cst(ptr nou
176180; GFX1250: ; %bb.0: ; %entry
177181; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
178182; GFX1250-NEXT: s_wait_kmcnt 0x0
183+ ; GFX1250-NEXT: s_wait_storecnt 0x0
179184; GFX1250-NEXT: flat_load_b64 v[0:1], v[0:1] scope:SCOPE_DEV
180185; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
181186; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -189,6 +194,7 @@ define <4 x i32> @test_flat_amdgcn_cooperative_atomic_load_8x16B_seq_cst(ptr nou
189194; GFX1250: ; %bb.0: ; %entry
190195; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
191196; GFX1250-NEXT: s_wait_kmcnt 0x0
197+ ; GFX1250-NEXT: s_wait_storecnt 0x0
192198; GFX1250-NEXT: flat_load_b128 v[0:3], v[0:1] scope:SCOPE_DEV
193199; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
194200; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -202,6 +208,7 @@ define void @test_flat_amdgcn_cooperative_atomic_store_32x4B_seq_cst(ptr noundef
202208; GFX1250: ; %bb.0: ; %entry
203209; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
204210; GFX1250-NEXT: s_wait_kmcnt 0x0
211+ ; GFX1250-NEXT: s_wait_storecnt 0x0
205212; GFX1250-NEXT: flat_store_b32 v[0:1], v2 scope:SCOPE_DEV
206213; GFX1250-NEXT: s_wait_dscnt 0x0
207214; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -215,6 +222,7 @@ define void @test_flat_amdgcn_cooperative_atomic_store_16x8B_seq_cst(ptr noundef
215222; GFX1250: ; %bb.0: ; %entry
216223; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
217224; GFX1250-NEXT: s_wait_kmcnt 0x0
225+ ; GFX1250-NEXT: s_wait_storecnt 0x0
218226; GFX1250-NEXT: flat_store_b64 v[0:1], v[2:3] scope:SCOPE_DEV
219227; GFX1250-NEXT: s_wait_dscnt 0x0
220228; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -228,6 +236,7 @@ define void @test_flat_amdgcn_cooperative_atomic_store_8x16B_seq_cst(ptr noundef
228236; GFX1250: ; %bb.0: ; %entry
229237; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
230238; GFX1250-NEXT: s_wait_kmcnt 0x0
239+ ; GFX1250-NEXT: s_wait_storecnt 0x0
231240; GFX1250-NEXT: flat_store_b128 v[0:1], v[2:5] scope:SCOPE_DEV
232241; GFX1250-NEXT: s_wait_dscnt 0x0
233242; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -358,6 +367,7 @@ define void @test_one_as_flat_amdgcn_cooperative_atomic_store_32x4B_release(ptr
358367; GFX1250: ; %bb.0: ; %entry
359368; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
360369; GFX1250-NEXT: s_wait_kmcnt 0x0
370+ ; GFX1250-NEXT: s_wait_storecnt 0x0
361371; GFX1250-NEXT: flat_store_b32 v[0:1], v2 scope:SCOPE_DEV
362372; GFX1250-NEXT: s_wait_dscnt 0x0
363373; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -371,6 +381,7 @@ define void @test_one_as_flat_amdgcn_cooperative_atomic_store_16x8B_release(ptr
371381; GFX1250: ; %bb.0: ; %entry
372382; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
373383; GFX1250-NEXT: s_wait_kmcnt 0x0
384+ ; GFX1250-NEXT: s_wait_storecnt 0x0
374385; GFX1250-NEXT: flat_store_b64 v[0:1], v[2:3] scope:SCOPE_DEV
375386; GFX1250-NEXT: s_wait_dscnt 0x0
376387; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -384,6 +395,7 @@ define void @test_one_as_flat_amdgcn_cooperative_atomic_store_8x16B_release(ptr
384395; GFX1250: ; %bb.0: ; %entry
385396; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
386397; GFX1250-NEXT: s_wait_kmcnt 0x0
398+ ; GFX1250-NEXT: s_wait_storecnt 0x0
387399; GFX1250-NEXT: flat_store_b128 v[0:1], v[2:5] scope:SCOPE_DEV
388400; GFX1250-NEXT: s_wait_dscnt 0x0
389401; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -397,6 +409,7 @@ define i32 @test_one_as_flat_amdgcn_cooperative_atomic_load_32x4B_seq_cst(ptr no
397409; GFX1250: ; %bb.0: ; %entry
398410; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
399411; GFX1250-NEXT: s_wait_kmcnt 0x0
412+ ; GFX1250-NEXT: s_wait_storecnt 0x0
400413; GFX1250-NEXT: flat_load_b32 v0, v[0:1] scope:SCOPE_DEV
401414; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
402415; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -410,6 +423,7 @@ define <2 x i32> @test_one_as_flat_amdgcn_cooperative_atomic_load_16x8B_seq_cst(
410423; GFX1250: ; %bb.0: ; %entry
411424; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
412425; GFX1250-NEXT: s_wait_kmcnt 0x0
426+ ; GFX1250-NEXT: s_wait_storecnt 0x0
413427; GFX1250-NEXT: flat_load_b64 v[0:1], v[0:1] scope:SCOPE_DEV
414428; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
415429; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -423,6 +437,7 @@ define <4 x i32> @test_one_as_flat_amdgcn_cooperative_atomic_load_8x16B_seq_cst(
423437; GFX1250: ; %bb.0: ; %entry
424438; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
425439; GFX1250-NEXT: s_wait_kmcnt 0x0
440+ ; GFX1250-NEXT: s_wait_storecnt 0x0
426441; GFX1250-NEXT: flat_load_b128 v[0:3], v[0:1] scope:SCOPE_DEV
427442; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
428443; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -436,6 +451,7 @@ define void @test_one_as_flat_amdgcn_cooperative_atomic_store_32x4B_seq_cst(ptr
436451; GFX1250: ; %bb.0: ; %entry
437452; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
438453; GFX1250-NEXT: s_wait_kmcnt 0x0
454+ ; GFX1250-NEXT: s_wait_storecnt 0x0
439455; GFX1250-NEXT: flat_store_b32 v[0:1], v2 scope:SCOPE_DEV
440456; GFX1250-NEXT: s_wait_dscnt 0x0
441457; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -449,6 +465,7 @@ define void @test_one_as_flat_amdgcn_cooperative_atomic_store_16x8B_seq_cst(ptr
449465; GFX1250: ; %bb.0: ; %entry
450466; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
451467; GFX1250-NEXT: s_wait_kmcnt 0x0
468+ ; GFX1250-NEXT: s_wait_storecnt 0x0
452469; GFX1250-NEXT: flat_store_b64 v[0:1], v[2:3] scope:SCOPE_DEV
453470; GFX1250-NEXT: s_wait_dscnt 0x0
454471; GFX1250-NEXT: s_set_pc_i64 s[30:31]
@@ -462,6 +479,7 @@ define void @test_one_as_flat_amdgcn_cooperative_atomic_store_8x16B_seq_cst(ptr
462479; GFX1250: ; %bb.0: ; %entry
463480; GFX1250-NEXT: s_wait_loadcnt_dscnt 0x0
464481; GFX1250-NEXT: s_wait_kmcnt 0x0
482+ ; GFX1250-NEXT: s_wait_storecnt 0x0
465483; GFX1250-NEXT: flat_store_b128 v[0:1], v[2:5] scope:SCOPE_DEV
466484; GFX1250-NEXT: s_wait_dscnt 0x0
467485; GFX1250-NEXT: s_set_pc_i64 s[30:31]
0 commit comments