@@ -746,9 +746,9 @@ define amdgpu_ps void @wqm_deriv(<2 x float> %input, float %arg, i32 %index) {
746746; GFX9-NEXT: s_mov_b64 exec, 0
747747; GFX9-NEXT: .LBB6_6: ; %.continue1
748748; GFX9-NEXT: s_or_b64 exec, exec, s[2:3]
749- ; GFX9-NEXT: v_mov_b32_e32 v0, 0x3c00
750- ; GFX9-NEXT: v_bfrev_b32_e32 v1, 60
751- ; GFX9-NEXT: exp mrt0 v0, v0, v1, v1 done compr vm
749+ ; GFX9-NEXT: v_bfrev_b32_e32 v0, 60
750+ ; GFX9-NEXT: v_mov_b32_e32 v1, 0x3c00
751+ ; GFX9-NEXT: exp mrt0 v1, v1, v0, v0 done compr vm
752752; GFX9-NEXT: s_endpgm
753753; GFX9-NEXT: .LBB6_7:
754754; GFX9-NEXT: s_mov_b64 exec, 0
@@ -792,9 +792,9 @@ define amdgpu_ps void @wqm_deriv(<2 x float> %input, float %arg, i32 %index) {
792792; GFX10-32-NEXT: s_mov_b32 exec_lo, 0
793793; GFX10-32-NEXT: .LBB6_6: ; %.continue1
794794; GFX10-32-NEXT: s_or_b32 exec_lo, exec_lo, s1
795- ; GFX10-32-NEXT: v_mov_b32_e32 v0, 0x3c00
796- ; GFX10-32-NEXT: v_bfrev_b32_e32 v1, 60
797- ; GFX10-32-NEXT: exp mrt0 v0, v0, v1, v1 done compr vm
795+ ; GFX10-32-NEXT: v_bfrev_b32_e32 v0, 60
796+ ; GFX10-32-NEXT: v_mov_b32_e32 v1, 0x3c00
797+ ; GFX10-32-NEXT: exp mrt0 v1, v1, v0, v0 done compr vm
798798; GFX10-32-NEXT: s_endpgm
799799; GFX10-32-NEXT: .LBB6_7:
800800; GFX10-32-NEXT: s_mov_b32 exec_lo, 0
@@ -838,9 +838,9 @@ define amdgpu_ps void @wqm_deriv(<2 x float> %input, float %arg, i32 %index) {
838838; GFX10-64-NEXT: s_mov_b64 exec, 0
839839; GFX10-64-NEXT: .LBB6_6: ; %.continue1
840840; GFX10-64-NEXT: s_or_b64 exec, exec, s[2:3]
841- ; GFX10-64-NEXT: v_mov_b32_e32 v0, 0x3c00
842- ; GFX10-64-NEXT: v_bfrev_b32_e32 v1, 60
843- ; GFX10-64-NEXT: exp mrt0 v0, v0, v1, v1 done compr vm
841+ ; GFX10-64-NEXT: v_bfrev_b32_e32 v0, 60
842+ ; GFX10-64-NEXT: v_mov_b32_e32 v1, 0x3c00
843+ ; GFX10-64-NEXT: exp mrt0 v1, v1, v0, v0 done compr vm
844844; GFX10-64-NEXT: s_endpgm
845845; GFX10-64-NEXT: .LBB6_7:
846846; GFX10-64-NEXT: s_mov_b64 exec, 0
@@ -1005,9 +1005,9 @@ define amdgpu_ps void @wqm_deriv_loop(<2 x float> %input, float %arg, i32 %index
10051005; GFX9-NEXT: .LBB7_8: ; %.return
10061006; GFX9-NEXT: s_or_b64 exec, exec, s[2:3]
10071007; GFX9-NEXT: s_and_b64 exec, exec, s[0:1]
1008- ; GFX9-NEXT: v_mov_b32_e32 v0, 0x3c00
1009- ; GFX9-NEXT: v_bfrev_b32_e32 v1, 60
1010- ; GFX9-NEXT: exp mrt0 v0, v0, v1, v1 done compr vm
1008+ ; GFX9-NEXT: v_bfrev_b32_e32 v0, 60
1009+ ; GFX9-NEXT: v_mov_b32_e32 v1, 0x3c00
1010+ ; GFX9-NEXT: exp mrt0 v1, v1, v0, v0 done compr vm
10111011; GFX9-NEXT: s_endpgm
10121012; GFX9-NEXT: .LBB7_9:
10131013; GFX9-NEXT: s_mov_b64 exec, 0
@@ -1068,9 +1068,9 @@ define amdgpu_ps void @wqm_deriv_loop(<2 x float> %input, float %arg, i32 %index
10681068; GFX10-32-NEXT: .LBB7_8: ; %.return
10691069; GFX10-32-NEXT: s_or_b32 exec_lo, exec_lo, s1
10701070; GFX10-32-NEXT: s_and_b32 exec_lo, exec_lo, s0
1071- ; GFX10-32-NEXT: v_mov_b32_e32 v0, 0x3c00
1072- ; GFX10-32-NEXT: v_bfrev_b32_e32 v1, 60
1073- ; GFX10-32-NEXT: exp mrt0 v0, v0, v1, v1 done compr vm
1071+ ; GFX10-32-NEXT: v_bfrev_b32_e32 v0, 60
1072+ ; GFX10-32-NEXT: v_mov_b32_e32 v1, 0x3c00
1073+ ; GFX10-32-NEXT: exp mrt0 v1, v1, v0, v0 done compr vm
10741074; GFX10-32-NEXT: s_endpgm
10751075; GFX10-32-NEXT: .LBB7_9:
10761076; GFX10-32-NEXT: s_mov_b32 exec_lo, 0
@@ -1131,9 +1131,9 @@ define amdgpu_ps void @wqm_deriv_loop(<2 x float> %input, float %arg, i32 %index
11311131; GFX10-64-NEXT: .LBB7_8: ; %.return
11321132; GFX10-64-NEXT: s_or_b64 exec, exec, s[2:3]
11331133; GFX10-64-NEXT: s_and_b64 exec, exec, s[0:1]
1134- ; GFX10-64-NEXT: v_mov_b32_e32 v0, 0x3c00
1135- ; GFX10-64-NEXT: v_bfrev_b32_e32 v1, 60
1136- ; GFX10-64-NEXT: exp mrt0 v0, v0, v1, v1 done compr vm
1134+ ; GFX10-64-NEXT: v_bfrev_b32_e32 v0, 60
1135+ ; GFX10-64-NEXT: v_mov_b32_e32 v1, 0x3c00
1136+ ; GFX10-64-NEXT: exp mrt0 v1, v1, v0, v0 done compr vm
11371137; GFX10-64-NEXT: s_endpgm
11381138; GFX10-64-NEXT: .LBB7_9:
11391139; GFX10-64-NEXT: s_mov_b64 exec, 0
0 commit comments