@@ -1292,7 +1292,7 @@ define amdgpu_kernel void @ctpop_i16_in_br(ptr addrspace(1) %out, ptr addrspace(
12921292; SI-NEXT: buffer_store_short v0, off, s[0:3], 0
12931293; SI-NEXT: s_endpgm
12941294; SI-NEXT: .LBB14_4:
1295- ; SI-NEXT: v_mov_b32_e32 v0, 0
1295+ ; SI-NEXT: ; implicit-def: $vgpr0
12961296; SI-NEXT: s_branch .LBB14_2
12971297;
12981298; VI-LABEL: ctpop_i16_in_br:
@@ -1329,48 +1329,47 @@ define amdgpu_kernel void @ctpop_i16_in_br(ptr addrspace(1) %out, ptr addrspace(
13291329; EG: ; %bb.0: ; %entry
13301330; EG-NEXT: ALU 0, @20, KC0[], KC1[]
13311331; EG-NEXT: TEX 0 @14
1332- ; EG-NEXT: ALU_PUSH_BEFORE 4 , @21, KC0[], KC1[]
1332+ ; EG-NEXT: ALU_PUSH_BEFORE 3 , @21, KC0[], KC1[]
13331333; EG-NEXT: JUMP @7 POP:1
1334- ; EG-NEXT: ALU 0, @26 , KC0[CB0:0-32], KC1[]
1334+ ; EG-NEXT: ALU 0, @25 , KC0[CB0:0-32], KC1[]
13351335; EG-NEXT: TEX 0 @16
1336- ; EG-NEXT: ALU_POP_AFTER 1, @27 , KC0[], KC1[]
1337- ; EG-NEXT: ALU_PUSH_BEFORE 2, @29 , KC0[CB0:0-32], KC1[]
1336+ ; EG-NEXT: ALU_POP_AFTER 1, @26 , KC0[], KC1[]
1337+ ; EG-NEXT: ALU_PUSH_BEFORE 2, @28 , KC0[CB0:0-32], KC1[]
13381338; EG-NEXT: JUMP @11 POP:1
13391339; EG-NEXT: TEX 0 @18
1340- ; EG-NEXT: ALU_POP_AFTER 0, @32 , KC0[], KC1[]
1341- ; EG-NEXT: ALU 11, @33 , KC0[], KC1[]
1340+ ; EG-NEXT: ALU_POP_AFTER 0, @31 , KC0[], KC1[]
1341+ ; EG-NEXT: ALU 11, @32 , KC0[], KC1[]
13421342; EG-NEXT: MEM_RAT MSKOR T1.XW, T0.X
13431343; EG-NEXT: CF_END
13441344; EG-NEXT: Fetch clause starting at 14:
1345- ; EG-NEXT: VTX_READ_16 T2 .X, T1 .X, 46, #3
1345+ ; EG-NEXT: VTX_READ_16 T1 .X, T0 .X, 46, #3
13461346; EG-NEXT: Fetch clause starting at 16:
1347- ; EG-NEXT: VTX_READ_16 T0 .X, T0 .X, 2, #1
1347+ ; EG-NEXT: VTX_READ_16 T1 .X, T1 .X, 2, #1
13481348; EG-NEXT: Fetch clause starting at 18:
1349- ; EG-NEXT: VTX_READ_16 T0.X, T1 .X, 44, #3
1349+ ; EG-NEXT: VTX_READ_16 T0.X, T0 .X, 44, #3
13501350; EG-NEXT: ALU clause starting at 20:
1351- ; EG-NEXT: MOV * T1 .X, 0.0,
1351+ ; EG-NEXT: MOV * T0 .X, 0.0,
13521352; EG-NEXT: ALU clause starting at 21:
1353- ; EG-NEXT: MOV T0.X, literal.x,
1354- ; EG-NEXT: MOV T1.W, literal.y,
1355- ; EG-NEXT: SETNE_INT * T0.W, T2.X, 0.0,
1356- ; EG-NEXT: 0(0.000000e+00), 1(1.401298e-45)
1353+ ; EG-NEXT: MOV T1.W, literal.x,
1354+ ; EG-NEXT: SETNE_INT * T0.W, T1.X, 0.0,
1355+ ; EG-NEXT: 1(1.401298e-45), 0(0.000000e+00)
13571356; EG-NEXT: PRED_SETNE_INT * ExecMask,PredicateBit (MASKED), PS, 0.0,
1357+ ; EG-NEXT: ALU clause starting at 25:
1358+ ; EG-NEXT: MOV * T1.X, KC0[2].Z,
13581359; EG-NEXT: ALU clause starting at 26:
1359- ; EG-NEXT: MOV * T0.X, KC0[2].Z,
1360- ; EG-NEXT: ALU clause starting at 27:
13611360; EG-NEXT: MOV * T1.W, literal.x,
13621361; EG-NEXT: 0(0.000000e+00), 0(0.000000e+00)
1363- ; EG-NEXT: ALU clause starting at 29 :
1362+ ; EG-NEXT: ALU clause starting at 28 :
13641363; EG-NEXT: MOV T0.W, KC0[2].Y,
13651364; EG-NEXT: SETE_INT * T1.W, T1.W, 0.0,
13661365; EG-NEXT: PRED_SETE_INT * ExecMask,PredicateBit (MASKED), PS, 0.0,
1366+ ; EG-NEXT: ALU clause starting at 31:
1367+ ; EG-NEXT: BCNT_INT * T1.X, T0.X,
13671368; EG-NEXT: ALU clause starting at 32:
1368- ; EG-NEXT: BCNT_INT * T0.X, T0.X,
1369- ; EG-NEXT: ALU clause starting at 33:
13701369; EG-NEXT: LSHL * T1.W, T0.W, literal.x,
13711370; EG-NEXT: 3(4.203895e-45), 0(0.000000e+00)
13721371; EG-NEXT: AND_INT T1.W, PV.W, literal.x,
1373- ; EG-NEXT: AND_INT * T2.W, T0 .X, literal.y,
1372+ ; EG-NEXT: AND_INT * T2.W, T1 .X, literal.y,
13741373; EG-NEXT: 24(3.363116e-44), 65535(9.183409e-41)
13751374; EG-NEXT: LSHL T1.X, PS, PV.W,
13761375; EG-NEXT: LSHL * T1.W, literal.x, PV.W,
0 commit comments