@@ -10733,15 +10733,16 @@ define void @flat_atomic_fmaximum_f64_ret_a_a(ptr %ptr) #0 {
1073310733; GFX90A-NEXT: buffer_load_dword v0, v6, s[0:3], 0 offen
1073410734; GFX90A-NEXT: buffer_load_dword v1, v6, s[0:3], 0 offen offset:4
1073510735; GFX90A-NEXT: v_mov_b32_e32 v7, 0x7ff80000
10736+ ; GFX90A-NEXT: s_waitcnt vmcnt(1)
10737+ ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1073610738; GFX90A-NEXT: s_waitcnt vmcnt(0)
1073710739; GFX90A-NEXT: v_max_f64 v[2:3], v[0:1], v[4:5]
1073810740; GFX90A-NEXT: v_cmp_u_f64_e32 vcc, v[0:1], v[4:5]
10739- ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1074010741; GFX90A-NEXT: v_cndmask_b32_e64 v2, v2, 0, vcc
1074110742; GFX90A-NEXT: v_accvgpr_write_b32 a1, v1
10742- ; GFX90A-NEXT: v_cndmask_b32_e32 v3 , v3, v7, vcc
10743+ ; GFX90A-NEXT: v_cndmask_b32_e32 v0 , v3, v7, vcc
1074310744; GFX90A-NEXT: buffer_store_dword v2, v6, s[0:3], 0 offen
10744- ; GFX90A-NEXT: buffer_store_dword v3 , v6, s[0:3], 0 offen offset:4
10745+ ; GFX90A-NEXT: buffer_store_dword v0 , v6, s[0:3], 0 offen offset:4
1074510746; GFX90A-NEXT: .LBB135_6: ; %atomicrmw.phi
1074610747; GFX90A-NEXT: s_or_b64 exec, exec, s[4:5]
1074710748; GFX90A-NEXT: ;;#ASMSTART
@@ -11000,15 +11001,16 @@ define void @flat_atomic_fminimum_f64_ret_a_a(ptr %ptr) #0 {
1100011001; GFX90A-NEXT: buffer_load_dword v0, v6, s[0:3], 0 offen
1100111002; GFX90A-NEXT: buffer_load_dword v1, v6, s[0:3], 0 offen offset:4
1100211003; GFX90A-NEXT: v_mov_b32_e32 v7, 0x7ff80000
11004+ ; GFX90A-NEXT: s_waitcnt vmcnt(1)
11005+ ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1100311006; GFX90A-NEXT: s_waitcnt vmcnt(0)
1100411007; GFX90A-NEXT: v_min_f64 v[2:3], v[0:1], v[4:5]
1100511008; GFX90A-NEXT: v_cmp_u_f64_e32 vcc, v[0:1], v[4:5]
11006- ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1100711009; GFX90A-NEXT: v_cndmask_b32_e64 v2, v2, 0, vcc
1100811010; GFX90A-NEXT: v_accvgpr_write_b32 a1, v1
11009- ; GFX90A-NEXT: v_cndmask_b32_e32 v3 , v3, v7, vcc
11011+ ; GFX90A-NEXT: v_cndmask_b32_e32 v0 , v3, v7, vcc
1101011012; GFX90A-NEXT: buffer_store_dword v2, v6, s[0:3], 0 offen
11011- ; GFX90A-NEXT: buffer_store_dword v3 , v6, s[0:3], 0 offen offset:4
11013+ ; GFX90A-NEXT: buffer_store_dword v0 , v6, s[0:3], 0 offen offset:4
1101211014; GFX90A-NEXT: .LBB137_6: ; %atomicrmw.phi
1101311015; GFX90A-NEXT: s_or_b64 exec, exec, s[4:5]
1101411016; GFX90A-NEXT: ;;#ASMSTART
@@ -19023,15 +19025,16 @@ define void @flat_atomic_fmaximum_f64_saddr_ret_a_a(ptr inreg %ptr) #0 {
1902319025; GFX90A-NEXT: buffer_load_dword v0, v6, s[0:3], 0 offen
1902419026; GFX90A-NEXT: buffer_load_dword v1, v6, s[0:3], 0 offen offset:4
1902519027; GFX90A-NEXT: v_mov_b32_e32 v7, 0x7ff80000
19028+ ; GFX90A-NEXT: s_waitcnt vmcnt(1)
19029+ ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1902619030; GFX90A-NEXT: s_waitcnt vmcnt(0)
1902719031; GFX90A-NEXT: v_max_f64 v[2:3], v[0:1], v[4:5]
1902819032; GFX90A-NEXT: v_cmp_u_f64_e32 vcc, v[0:1], v[4:5]
19029- ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1903019033; GFX90A-NEXT: v_cndmask_b32_e64 v2, v2, 0, vcc
1903119034; GFX90A-NEXT: v_accvgpr_write_b32 a1, v1
19032- ; GFX90A-NEXT: v_cndmask_b32_e32 v3 , v3, v7, vcc
19035+ ; GFX90A-NEXT: v_cndmask_b32_e32 v0 , v3, v7, vcc
1903319036; GFX90A-NEXT: buffer_store_dword v2, v6, s[0:3], 0 offen
19034- ; GFX90A-NEXT: buffer_store_dword v3 , v6, s[0:3], 0 offen offset:4
19037+ ; GFX90A-NEXT: buffer_store_dword v0 , v6, s[0:3], 0 offen offset:4
1903519038; GFX90A-NEXT: .LBB243_6: ; %atomicrmw.phi
1903619039; GFX90A-NEXT: ;;#ASMSTART
1903719040; GFX90A-NEXT: ; use a[0:1]
@@ -19282,15 +19285,16 @@ define void @flat_atomic_fminimum_f64_saddr_ret_a_a(ptr inreg %ptr) #0 {
1928219285; GFX90A-NEXT: buffer_load_dword v0, v6, s[0:3], 0 offen
1928319286; GFX90A-NEXT: buffer_load_dword v1, v6, s[0:3], 0 offen offset:4
1928419287; GFX90A-NEXT: v_mov_b32_e32 v7, 0x7ff80000
19288+ ; GFX90A-NEXT: s_waitcnt vmcnt(1)
19289+ ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1928519290; GFX90A-NEXT: s_waitcnt vmcnt(0)
1928619291; GFX90A-NEXT: v_min_f64 v[2:3], v[0:1], v[4:5]
1928719292; GFX90A-NEXT: v_cmp_u_f64_e32 vcc, v[0:1], v[4:5]
19288- ; GFX90A-NEXT: v_accvgpr_write_b32 a0, v0
1928919293; GFX90A-NEXT: v_cndmask_b32_e64 v2, v2, 0, vcc
1929019294; GFX90A-NEXT: v_accvgpr_write_b32 a1, v1
19291- ; GFX90A-NEXT: v_cndmask_b32_e32 v3 , v3, v7, vcc
19295+ ; GFX90A-NEXT: v_cndmask_b32_e32 v0 , v3, v7, vcc
1929219296; GFX90A-NEXT: buffer_store_dword v2, v6, s[0:3], 0 offen
19293- ; GFX90A-NEXT: buffer_store_dword v3 , v6, s[0:3], 0 offen offset:4
19297+ ; GFX90A-NEXT: buffer_store_dword v0 , v6, s[0:3], 0 offen offset:4
1929419298; GFX90A-NEXT: .LBB245_6: ; %atomicrmw.phi
1929519299; GFX90A-NEXT: ;;#ASMSTART
1929619300; GFX90A-NEXT: ; use a[0:1]
0 commit comments