@@ -24269,13 +24269,13 @@ define <16 x i8> @bitcast_v8bf16_to_v16i8(<8 x bfloat> %a, i32 %b) {
2426924269; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr6_hi16
2427024270; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr10_lo16
2427124271; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr16_hi16
24272- ; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr19_lo16
24272+ ; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr22_lo16
2427324273; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr4_hi16
2427424274; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr5_lo16
2427524275; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr7_lo16
2427624276; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr8_hi16
2427724277; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr9_lo16
24278- ; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr21_hi16
24278+ ; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr20_hi16
2427924279; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr18_lo16
2428024280; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr12_hi16
2428124281; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr13_lo16
@@ -24285,22 +24285,22 @@ define <16 x i8> @bitcast_v8bf16_to_v16i8(<8 x bfloat> %a, i32 %b) {
2428524285; GFX11-TRUE16-NEXT: s_xor_b32 s0, exec_lo, s0
2428624286; GFX11-TRUE16-NEXT: s_cbranch_execz .LBB108_2
2428724287; GFX11-TRUE16-NEXT: ; %bb.1: ; %cmp.false
24288- ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[18:19], 24, v[2:3]
2428924288; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v15, 24, v3
2429024289; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v13, 8, v3
2429124290; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v9, 8, v2
2429224291; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v7, 24, v1
2429324292; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v5, 8, v1
2429424293; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v10, 8, v0
24295- ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[19:20], 24, v[0:1]
24294+ ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[18:19], 24, v[2:3]
24295+ ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[22:23], 24, v[0:1]
2429624296; GFX11-TRUE16-NEXT: v_mov_b16_e32 v6.h, v0.l
2429724297; GFX11-TRUE16-NEXT: v_mov_b16_e32 v16.h, v0.h
2429824298; GFX11-TRUE16-NEXT: v_mov_b16_e32 v4.h, v1.l
2429924299; GFX11-TRUE16-NEXT: v_mov_b16_e32 v17.h, v1.h
2430024300; GFX11-TRUE16-NEXT: v_mov_b16_e32 v8.h, v2.l
24301- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v21 .h, v2.h
24301+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v20 .h, v2.h
2430224302; GFX11-TRUE16-NEXT: v_mov_b16_e32 v12.h, v3.l
24303- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v22 .h, v3.h
24303+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v21 .h, v3.h
2430424304; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr1
2430524305; GFX11-TRUE16-NEXT: ; implicit-def: $vgpr3
2430624306; GFX11-TRUE16-NEXT: .LBB108_2: ; %Flow
@@ -24372,32 +24372,32 @@ define <16 x i8> @bitcast_v8bf16_to_v16i8(<8 x bfloat> %a, i32 %b) {
2437224372; GFX11-TRUE16-NEXT: v_cndmask_b32_e32 v8, v8, v13, vcc_lo
2437324373; GFX11-TRUE16-NEXT: v_cmp_u_f32_e32 vcc_lo, v0, v0
2437424374; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_4)
24375+ ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[22:23], 24, v[16:17]
2437524376; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v10, 8, v16
24376- ; GFX11-TRUE16-NEXT: v_cndmask_b32_e32 v22 , v7, v9, vcc_lo
24377+ ; GFX11-TRUE16-NEXT: v_cndmask_b32_e32 v21 , v7, v9, vcc_lo
2437724378; GFX11-TRUE16-NEXT: v_cmp_u_f32_e32 vcc_lo, v2, v2
24378- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v22 .l, v12.h
24379+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v21 .l, v12.h
2437924380; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v7, 24, v17
24380- ; GFX11-TRUE16-NEXT: v_cndmask_b32_e32 v21 , v1, v3, vcc_lo
24381- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v21 .l, v8.h
24381+ ; GFX11-TRUE16-NEXT: v_cndmask_b32_e32 v20 , v1, v3, vcc_lo
24382+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v20 .l, v8.h
2438224383; GFX11-TRUE16-NEXT: s_delay_alu instid0(VALU_DEP_4) | instskip(SKIP_1) | instid1(VALU_DEP_3)
24383- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v15, 24, v22
24384- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v13, 8, v22
24385- ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[18:19], 24, v[21:22]
24386- ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[19:20], 24, v[16:17]
24387- ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v9, 8, v21
24384+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v15, 24, v21
24385+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v13, 8, v21
24386+ ; GFX11-TRUE16-NEXT: v_lshrrev_b64 v[18:19], 24, v[20:21]
24387+ ; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v9, 8, v20
2438824388; GFX11-TRUE16-NEXT: .LBB108_4: ; %end
2438924389; GFX11-TRUE16-NEXT: s_or_b32 exec_lo, exec_lo, s0
2439024390; GFX11-TRUE16-NEXT: v_mov_b16_e32 v0.l, v6.h
2439124391; GFX11-TRUE16-NEXT: v_mov_b16_e32 v1.l, v10.l
2439224392; GFX11-TRUE16-NEXT: v_mov_b16_e32 v2.l, v16.h
24393- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v3.l, v19 .l
24393+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v3.l, v22 .l
2439424394; GFX11-TRUE16-NEXT: v_mov_b16_e32 v4.l, v4.h
2439524395; GFX11-TRUE16-NEXT: v_mov_b16_e32 v6.l, v17.h
2439624396; GFX11-TRUE16-NEXT: v_mov_b16_e32 v8.l, v8.h
24397- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v10.l, v21 .h
24397+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v10.l, v20 .h
2439824398; GFX11-TRUE16-NEXT: v_mov_b16_e32 v11.l, v18.l
2439924399; GFX11-TRUE16-NEXT: v_mov_b16_e32 v12.l, v12.h
24400- ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v14.l, v22 .h
24400+ ; GFX11-TRUE16-NEXT: v_mov_b16_e32 v14.l, v21 .h
2440124401; GFX11-TRUE16-NEXT: s_setpc_b64 s[30:31]
2440224402;
2440324403; GFX11-FAKE16-LABEL: bitcast_v8bf16_to_v16i8:
0 commit comments