@@ -880,17 +880,17 @@ define amdgpu_kernel void @select_v2f16(
880880; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v5, 16, v1
881881; GFX11-TRUE16-NEXT: v_cmp_lt_f16_e32 vcc_lo, v1.l, v0.l
882882; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(1)
883- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v1 , 16, v2
883+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v0 , 16, v2
884884; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
885- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v6 , 16, v3
885+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v1 , 16, v3
886886; GFX11-TRUE16-NEXT: v_cmp_lt_f16_e64 s0, v5.l, v4.l
887- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, v2.l, v3.l, vcc_lo
887+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v2 .l, v2.l, v3.l, vcc_lo
888888; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(NEXT) | instid1(VALU_DEP_2)
889- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, v1 .l, v6 .l, s0
890- ; GFX11-TRUE16-NEXT: v_and_b32_e32 v0 , 0xffff, v0
889+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, v0 .l, v1 .l, s0
890+ ; GFX11-TRUE16-NEXT: v_and_b32_e32 v1 , 0xffff, v2
891891; GFX11-TRUE16-NEXT: s_mov_b32 s0, s8
892892; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_1)
893- ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v1 , 16, v0
893+ ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v0 , 16, v1
894894; GFX11-TRUE16-NEXT: buffer_store_b32 v0, off, s[0:3], 0
895895; GFX11-TRUE16-NEXT: s_endpgm
896896;
@@ -1066,17 +1066,17 @@ define amdgpu_kernel void @select_v2f16_imm_a(
10661066; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v3, 16, v0
10671067; GFX11-TRUE16-NEXT: v_cmp_lt_f16_e32 vcc_lo, 0.5, v0.l
10681068; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(1)
1069- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v4 , 16, v1
1069+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v0 , 16, v1
10701070; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
1071- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v5 , 16, v2
1071+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v4 , 16, v2
10721072; GFX11-TRUE16-NEXT: v_cmp_lt_f16_e64 s0, 0x3900, v3.l
1073- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, v2.l, v1.l, vcc_lo
1073+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, v2.l, v1.l, vcc_lo
10741074; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(NEXT) | instid1(VALU_DEP_2)
1075- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, v5 .l, v4 .l, s0
1076- ; GFX11-TRUE16-NEXT: v_and_b32_e32 v0 , 0xffff, v0
1075+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, v4 .l, v0 .l, s0
1076+ ; GFX11-TRUE16-NEXT: v_and_b32_e32 v1 , 0xffff, v1
10771077; GFX11-TRUE16-NEXT: s_mov_b32 s0, s4
10781078; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_1)
1079- ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v1 , 16, v0
1079+ ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v0 , 16, v1
10801080; GFX11-TRUE16-NEXT: buffer_store_b32 v0, off, s[0:3], 0
10811081; GFX11-TRUE16-NEXT: s_endpgm
10821082;
@@ -1245,17 +1245,17 @@ define amdgpu_kernel void @select_v2f16_imm_b(
12451245; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v3, 16, v0
12461246; GFX11-TRUE16-NEXT: v_cmp_gt_f16_e32 vcc_lo, 0.5, v0.l
12471247; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(1)
1248- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v4 , 16, v1
1248+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v0 , 16, v1
12491249; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
1250- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v5 , 16, v2
1250+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v4 , 16, v2
12511251; GFX11-TRUE16-NEXT: v_cmp_gt_f16_e64 s0, 0x3900, v3.l
1252- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, v2.l, v1.l, vcc_lo
1252+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, v2.l, v1.l, vcc_lo
12531253; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(NEXT) | instid1(VALU_DEP_2)
1254- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, v5 .l, v4 .l, s0
1255- ; GFX11-TRUE16-NEXT: v_and_b32_e32 v0 , 0xffff, v0
1254+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, v4 .l, v0 .l, s0
1255+ ; GFX11-TRUE16-NEXT: v_and_b32_e32 v1 , 0xffff, v1
12561256; GFX11-TRUE16-NEXT: s_mov_b32 s0, s4
12571257; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_1)
1258- ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v1 , 16, v0
1258+ ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v0 , 16, v1
12591259; GFX11-TRUE16-NEXT: buffer_store_b32 v0, off, s[0:3], 0
12601260; GFX11-TRUE16-NEXT: s_endpgm
12611261;
@@ -1428,15 +1428,15 @@ define amdgpu_kernel void @select_v2f16_imm_c(
14281428; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v4, 16, v1
14291429; GFX11-TRUE16-NEXT: v_cmp_nlt_f16_e32 vcc_lo, v1.l, v0.l
14301430; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
1431- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v1 , 16, v2
1431+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v0 , 16, v2
14321432; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(SKIP_1) | instid1(VALU_DEP_2)
14331433; GFX11-TRUE16-NEXT: v_cmp_nlt_f16_e64 s0, v4.l, v3.l
1434- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, 0x3800, v2.l, vcc_lo
1435- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, 0x3900, v1 .l, s0
1434+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, 0x3800, v2.l, vcc_lo
1435+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, 0x3900, v0 .l, s0
14361436; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(SKIP_1) | instid1(VALU_DEP_1)
1437- ; GFX11-TRUE16-NEXT: v_and_b32_e32 v0 , 0xffff, v0
1437+ ; GFX11-TRUE16-NEXT: v_and_b32_e32 v1 , 0xffff, v1
14381438; GFX11-TRUE16-NEXT: s_mov_b32 s0, s4
1439- ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v1 , 16, v0
1439+ ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v0 , 16, v1
14401440; GFX11-TRUE16-NEXT: buffer_store_b32 v0, off, s[0:3], 0
14411441; GFX11-TRUE16-NEXT: s_endpgm
14421442;
@@ -1609,15 +1609,15 @@ define amdgpu_kernel void @select_v2f16_imm_d(
16091609; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v4, 16, v1
16101610; GFX11-TRUE16-NEXT: v_cmp_lt_f16_e32 vcc_lo, v1.l, v0.l
16111611; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
1612- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v1 , 16, v2
1612+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v0 , 16, v2
16131613; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_3) | instskip(SKIP_1) | instid1(VALU_DEP_2)
16141614; GFX11-TRUE16-NEXT: v_cmp_lt_f16_e64 s0, v4.l, v3.l
1615- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, 0x3800, v2.l, vcc_lo
1616- ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, 0x3900, v1 .l, s0
1615+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v1 .l, 0x3800, v2.l, vcc_lo
1616+ ; GFX11-TRUE16-NEXT: v_cndmask_b16 v0 .l, 0x3900, v0 .l, s0
16171617; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_2) | instskip(SKIP_1) | instid1(VALU_DEP_1)
1618- ; GFX11-TRUE16-NEXT: v_and_b32_e32 v0 , 0xffff, v0
1618+ ; GFX11-TRUE16-NEXT: v_and_b32_e32 v1 , 0xffff, v1
16191619; GFX11-TRUE16-NEXT: s_mov_b32 s0, s4
1620- ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v1 , 16, v0
1620+ ; GFX11-TRUE16-NEXT: v_lshl_or_b32 v0, v0 , 16, v1
16211621; GFX11-TRUE16-NEXT: buffer_store_b32 v0, off, s[0:3], 0
16221622; GFX11-TRUE16-NEXT: s_endpgm
16231623;
0 commit comments