@@ -15780,16 +15780,18 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1578015780; GFX9-NEXT: v_writelane_b32 v40, s14, 10
1578115781; GFX9-NEXT: v_writelane_b32 v40, s15, 11
1578215782; GFX9-NEXT: v_writelane_b32 v40, s16, 12
15783- ; GFX9-NEXT: s_load_dwordx2 s[34:35], s[34:35], 0x0
1578415783; GFX9-NEXT: v_writelane_b32 v40, s17, 13
1578515784; GFX9-NEXT: v_writelane_b32 v40, s18, 14
15785+ ; GFX9-NEXT: s_load_dwordx2 s[34:35], s[34:35], 0x0
1578615786; GFX9-NEXT: v_writelane_b32 v40, s19, 15
1578715787; GFX9-NEXT: v_writelane_b32 v40, s20, 16
1578815788; GFX9-NEXT: v_writelane_b32 v40, s21, 17
15789- ; GFX9-NEXT: s_waitcnt lgkmcnt(0)
15790- ; GFX9-NEXT: s_load_dword s52, s[34:35], 0x0
1579115789; GFX9-NEXT: v_writelane_b32 v40, s22, 18
1579215790; GFX9-NEXT: v_writelane_b32 v40, s23, 19
15791+ ; GFX9-NEXT: s_waitcnt lgkmcnt(0)
15792+ ; GFX9-NEXT: s_load_dword s52, s[34:35], 0x0
15793+ ; GFX9-NEXT: ; kill: killed $sgpr34_sgpr35
15794+ ; GFX9-NEXT: ; kill: killed $sgpr34_sgpr35
1579315795; GFX9-NEXT: s_load_dwordx16 s[36:51], s[34:35], 0x40
1579415796; GFX9-NEXT: s_load_dwordx16 s[4:19], s[34:35], 0x0
1579515797; GFX9-NEXT: v_writelane_b32 v40, s24, 20
@@ -15812,8 +15814,6 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1581215814; GFX9-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:12
1581315815; GFX9-NEXT: v_mov_b32_e32 v0, s50
1581415816; GFX9-NEXT: v_writelane_b32 v40, s30, 26
15815- ; GFX9-NEXT: ; kill: killed $sgpr34_sgpr35
15816- ; GFX9-NEXT: ; kill: killed $sgpr34_sgpr35
1581715817; GFX9-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:16
1581815818; GFX9-NEXT: v_mov_b32_e32 v0, s51
1581915819; GFX9-NEXT: s_mov_b32 s35, external_void_func_v32i32_i32_inreg@abs32@hi
@@ -15880,20 +15880,14 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1588015880; GFX10-NEXT: v_writelane_b32 v40, s34, 28
1588115881; GFX10-NEXT: s_load_dwordx2 s[34:35], s[34:35], 0x0
1588215882; GFX10-NEXT: s_addk_i32 s32, 0x200
15883- ; GFX10-NEXT: ; kill: killed $sgpr34_sgpr35
15884- ; GFX10-NEXT: ; kill: killed $sgpr34_sgpr35
1588515883; GFX10-NEXT: v_writelane_b32 v40, s4, 0
1588615884; GFX10-NEXT: v_writelane_b32 v40, s5, 1
1588715885; GFX10-NEXT: v_writelane_b32 v40, s6, 2
1588815886; GFX10-NEXT: v_writelane_b32 v40, s7, 3
15889- ; GFX10-NEXT: s_waitcnt lgkmcnt(0)
15890- ; GFX10-NEXT: s_load_dword s52, s[34:35], 0x0
1589115887; GFX10-NEXT: v_writelane_b32 v40, s8, 4
1589215888; GFX10-NEXT: v_writelane_b32 v40, s9, 5
1589315889; GFX10-NEXT: v_writelane_b32 v40, s10, 6
1589415890; GFX10-NEXT: v_writelane_b32 v40, s11, 7
15895- ; GFX10-NEXT: s_waitcnt lgkmcnt(0)
15896- ; GFX10-NEXT: v_mov_b32_e32 v0, s52
1589715891; GFX10-NEXT: v_writelane_b32 v40, s12, 8
1589815892; GFX10-NEXT: v_writelane_b32 v40, s13, 9
1589915893; GFX10-NEXT: v_writelane_b32 v40, s14, 10
@@ -15902,39 +15896,44 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1590215896; GFX10-NEXT: v_writelane_b32 v40, s17, 13
1590315897; GFX10-NEXT: v_writelane_b32 v40, s18, 14
1590415898; GFX10-NEXT: v_writelane_b32 v40, s19, 15
15905- ; GFX10-NEXT: s_clause 0x1
15899+ ; GFX10-NEXT: s_waitcnt lgkmcnt(0)
15900+ ; GFX10-NEXT: s_clause 0x2
15901+ ; GFX10-NEXT: s_load_dword s52, s[34:35], 0x0
15902+ ; GFX10-NEXT: ; meta instruction
15903+ ; GFX10-NEXT: ; meta instruction
1590615904; GFX10-NEXT: s_load_dwordx16 s[36:51], s[34:35], 0x40
1590715905; GFX10-NEXT: s_load_dwordx16 s[4:19], s[34:35], 0x0
15908- ; GFX10-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:24
1590915906; GFX10-NEXT: s_mov_b32 s35, external_void_func_v32i32_i32_inreg@abs32@hi
1591015907; GFX10-NEXT: s_mov_b32 s34, external_void_func_v32i32_i32_inreg@abs32@lo
1591115908; GFX10-NEXT: v_writelane_b32 v40, s20, 16
1591215909; GFX10-NEXT: v_writelane_b32 v40, s21, 17
1591315910; GFX10-NEXT: v_writelane_b32 v40, s22, 18
1591415911; GFX10-NEXT: s_waitcnt lgkmcnt(0)
15915- ; GFX10-NEXT: v_mov_b32_e32 v0, s46
15916- ; GFX10-NEXT: v_writelane_b32 v40, s23, 19
15912+ ; GFX10-NEXT: v_mov_b32_e32 v0, s52
1591715913; GFX10-NEXT: v_mov_b32_e32 v1, s47
15914+ ; GFX10-NEXT: v_writelane_b32 v40, s23, 19
15915+ ; GFX10-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:24
15916+ ; GFX10-NEXT: v_mov_b32_e32 v0, s46
1591815917; GFX10-NEXT: v_mov_b32_e32 v2, s48
1591915918; GFX10-NEXT: v_mov_b32_e32 v3, s49
15920- ; GFX10-NEXT: s_mov_b32 s20, s36
1592115919; GFX10-NEXT: v_writelane_b32 v40, s24, 20
15920+ ; GFX10-NEXT: s_mov_b32 s20, s36
1592215921; GFX10-NEXT: s_mov_b32 s21, s37
1592315922; GFX10-NEXT: s_mov_b32 s22, s38
1592415923; GFX10-NEXT: s_mov_b32 s23, s39
15925- ; GFX10-NEXT: s_mov_b32 s24, s40
1592615924; GFX10-NEXT: v_writelane_b32 v40, s25, 21
15925+ ; GFX10-NEXT: s_mov_b32 s24, s40
1592715926; GFX10-NEXT: s_mov_b32 s25, s41
1592815927; GFX10-NEXT: v_mov_b32_e32 v4, s50
1592915928; GFX10-NEXT: v_mov_b32_e32 v5, s51
15929+ ; GFX10-NEXT: v_writelane_b32 v40, s26, 22
15930+ ; GFX10-NEXT: s_mov_b32 s26, s42
1593015931; GFX10-NEXT: buffer_store_dword v0, off, s[0:3], s32
1593115932; GFX10-NEXT: buffer_store_dword v1, off, s[0:3], s32 offset:4
1593215933; GFX10-NEXT: buffer_store_dword v2, off, s[0:3], s32 offset:8
1593315934; GFX10-NEXT: buffer_store_dword v3, off, s[0:3], s32 offset:12
1593415935; GFX10-NEXT: buffer_store_dword v4, off, s[0:3], s32 offset:16
1593515936; GFX10-NEXT: buffer_store_dword v5, off, s[0:3], s32 offset:20
15936- ; GFX10-NEXT: v_writelane_b32 v40, s26, 22
15937- ; GFX10-NEXT: s_mov_b32 s26, s42
1593815937; GFX10-NEXT: v_writelane_b32 v40, s27, 23
1593915938; GFX10-NEXT: s_mov_b32 s27, s43
1594015939; GFX10-NEXT: v_writelane_b32 v40, s28, 24
@@ -16100,22 +16099,15 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1610016099; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s0, 28
1610116100; GFX10-SCRATCH-NEXT: s_load_dwordx2 s[0:1], s[0:1], 0x0
1610216101; GFX10-SCRATCH-NEXT: s_add_i32 s32, s32, 16
16103- ; GFX10-SCRATCH-NEXT: ; kill: killed $sgpr0_sgpr1
16104- ; GFX10-SCRATCH-NEXT: ; kill: killed $sgpr0_sgpr1
1610516102; GFX10-SCRATCH-NEXT: s_add_i32 s3, s32, 16
1610616103; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s4, 0
1610716104; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s5, 1
1610816105; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s6, 2
1610916106; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s7, 3
16110- ; GFX10-SCRATCH-NEXT: s_waitcnt lgkmcnt(0)
16111- ; GFX10-SCRATCH-NEXT: s_load_dword s2, s[0:1], 0x0
1611216107; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s8, 4
1611316108; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s9, 5
1611416109; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s10, 6
1611516110; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s11, 7
16116- ; GFX10-SCRATCH-NEXT: s_waitcnt lgkmcnt(0)
16117- ; GFX10-SCRATCH-NEXT: v_mov_b32_e32 v6, s2
16118- ; GFX10-SCRATCH-NEXT: s_add_i32 s2, s32, 24
1611916111; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s12, 8
1612016112; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s13, 9
1612116113; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s14, 10
@@ -16124,7 +16116,11 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1612416116; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s17, 13
1612516117; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s18, 14
1612616118; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s19, 15
16127- ; GFX10-SCRATCH-NEXT: s_clause 0x1
16119+ ; GFX10-SCRATCH-NEXT: s_waitcnt lgkmcnt(0)
16120+ ; GFX10-SCRATCH-NEXT: s_clause 0x2
16121+ ; GFX10-SCRATCH-NEXT: s_load_dword s2, s[0:1], 0x0
16122+ ; GFX10-SCRATCH-NEXT: ; meta instruction
16123+ ; GFX10-SCRATCH-NEXT: ; meta instruction
1612816124; GFX10-SCRATCH-NEXT: s_load_dwordx16 s[36:51], s[0:1], 0x40
1612916125; GFX10-SCRATCH-NEXT: s_load_dwordx16 s[4:19], s[0:1], 0x0
1613016126; GFX10-SCRATCH-NEXT: s_mov_b32 s1, external_void_func_v32i32_i32_inreg@abs32@hi
@@ -16133,6 +16129,8 @@ define amdgpu_gfx void @test_call_external_void_func_v32i32_i32_inreg(i32) #0 {
1613316129; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s21, 17
1613416130; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s22, 18
1613516131; GFX10-SCRATCH-NEXT: s_waitcnt lgkmcnt(0)
16132+ ; GFX10-SCRATCH-NEXT: v_mov_b32_e32 v6, s2
16133+ ; GFX10-SCRATCH-NEXT: s_add_i32 s2, s32, 24
1613616134; GFX10-SCRATCH-NEXT: v_mov_b32_e32 v4, s50
1613716135; GFX10-SCRATCH-NEXT: v_writelane_b32 v40, s23, 19
1613816136; GFX10-SCRATCH-NEXT: v_mov_b32_e32 v5, s51
0 commit comments