@@ -3963,8 +3963,8 @@ define i64 @test_vector_reduce_smax_v16i64(<16 x i64> %v) {
39633963; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v5, v5, v7, vcc
39643964; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v4, v4, v6, vcc
39653965; GFX7-SDAG-NEXT: v_cmp_gt_i64_e32 vcc, v[2:3], v[4:5]
3966- ; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v3, v5, v3, vcc
39673966; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v2, v4, v2, vcc
3967+ ; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v3, v5, v3, vcc
39683968; GFX7-SDAG-NEXT: v_cmp_gt_i64_e32 vcc, v[0:1], v[2:3]
39693969; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v0, v2, v0, vcc
39703970; GFX7-SDAG-NEXT: v_cndmask_b32_e32 v1, v3, v1, vcc
@@ -4067,8 +4067,8 @@ define i64 @test_vector_reduce_smax_v16i64(<16 x i64> %v) {
40674067; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v5, v5, v7, vcc
40684068; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v4, v4, v6, vcc
40694069; GFX8-SDAG-NEXT: v_cmp_gt_i64_e32 vcc, v[2:3], v[4:5]
4070- ; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v3, v5, v3, vcc
40714070; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v2, v4, v2, vcc
4071+ ; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v3, v5, v3, vcc
40724072; GFX8-SDAG-NEXT: v_cmp_gt_i64_e32 vcc, v[0:1], v[2:3]
40734073; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v0, v2, v0, vcc
40744074; GFX8-SDAG-NEXT: v_cndmask_b32_e32 v1, v3, v1, vcc
@@ -4175,8 +4175,8 @@ define i64 @test_vector_reduce_smax_v16i64(<16 x i64> %v) {
41754175; GFX9-SDAG-NEXT: v_cndmask_b32_e32 v4, v6, v4, vcc
41764176; GFX9-SDAG-NEXT: v_cmp_gt_i64_e32 vcc, v[2:3], v[4:5]
41774177; GFX9-SDAG-NEXT: s_nop 1
4178- ; GFX9-SDAG-NEXT: v_cndmask_b32_e32 v3, v5, v3, vcc
41794178; GFX9-SDAG-NEXT: v_cndmask_b32_e32 v2, v4, v2, vcc
4179+ ; GFX9-SDAG-NEXT: v_cndmask_b32_e32 v3, v5, v3, vcc
41804180; GFX9-SDAG-NEXT: v_cmp_gt_i64_e32 vcc, v[0:1], v[2:3]
41814181; GFX9-SDAG-NEXT: s_nop 1
41824182; GFX9-SDAG-NEXT: v_cndmask_b32_e32 v0, v2, v0, vcc
@@ -4283,8 +4283,8 @@ define i64 @test_vector_reduce_smax_v16i64(<16 x i64> %v) {
42834283; GFX10-SDAG-NEXT: v_cmp_gt_i64_e64 s4, v[2:3], v[6:7]
42844284; GFX10-SDAG-NEXT: v_cndmask_b32_e32 v1, v5, v1, vcc_lo
42854285; GFX10-SDAG-NEXT: v_cndmask_b32_e32 v0, v4, v0, vcc_lo
4286- ; GFX10-SDAG-NEXT: v_cndmask_b32_e64 v3, v7, v3, s4
42874286; GFX10-SDAG-NEXT: v_cndmask_b32_e64 v2, v6, v2, s4
4287+ ; GFX10-SDAG-NEXT: v_cndmask_b32_e64 v3, v7, v3, s4
42884288; GFX10-SDAG-NEXT: v_cmp_gt_i64_e32 vcc_lo, v[0:1], v[2:3]
42894289; GFX10-SDAG-NEXT: v_cndmask_b32_e32 v0, v2, v0, vcc_lo
42904290; GFX10-SDAG-NEXT: v_cndmask_b32_e32 v1, v3, v1, vcc_lo
@@ -4387,8 +4387,8 @@ define i64 @test_vector_reduce_smax_v16i64(<16 x i64> %v) {
43874387; GFX11-SDAG-NEXT: v_cmp_gt_i64_e64 s0, v[2:3], v[6:7]
43884388; GFX11-SDAG-NEXT: v_dual_cndmask_b32 v1, v5, v1 :: v_dual_cndmask_b32 v0, v4, v0
43894389; GFX11-SDAG-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(SKIP_1) | instid1(VALU_DEP_1)
4390- ; GFX11-SDAG-NEXT: v_cndmask_b32_e64 v3, v7, v3, s0
43914390; GFX11-SDAG-NEXT: v_cndmask_b32_e64 v2, v6, v2, s0
4391+ ; GFX11-SDAG-NEXT: v_cndmask_b32_e64 v3, v7, v3, s0
43924392; GFX11-SDAG-NEXT: v_cmp_gt_i64_e32 vcc_lo, v[0:1], v[2:3]
43934393; GFX11-SDAG-NEXT: v_dual_cndmask_b32 v0, v2, v0 :: v_dual_cndmask_b32 v1, v3, v1
43944394; GFX11-SDAG-NEXT: s_setpc_b64 s[30:31]
@@ -4502,8 +4502,8 @@ define i64 @test_vector_reduce_smax_v16i64(<16 x i64> %v) {
45024502; GFX12-SDAG-NEXT: v_dual_cndmask_b32 v1, v5, v1 :: v_dual_cndmask_b32 v0, v4, v0
45034503; GFX12-SDAG-NEXT: s_wait_alu 0xf1ff
45044504; GFX12-SDAG-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(SKIP_1) | instid1(VALU_DEP_1)
4505- ; GFX12-SDAG-NEXT: v_cndmask_b32_e64 v3, v7, v3, s0
45064505; GFX12-SDAG-NEXT: v_cndmask_b32_e64 v2, v6, v2, s0
4506+ ; GFX12-SDAG-NEXT: v_cndmask_b32_e64 v3, v7, v3, s0
45074507; GFX12-SDAG-NEXT: v_cmp_gt_i64_e32 vcc_lo, v[0:1], v[2:3]
45084508; GFX12-SDAG-NEXT: s_wait_alu 0xfffd
45094509; GFX12-SDAG-NEXT: v_dual_cndmask_b32 v0, v2, v0 :: v_dual_cndmask_b32 v1, v3, v1
0 commit comments