@@ -46,7 +46,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_1_1__cbsz1__blgp1(<8 x
4646; GCN-NEXT: v_accvgpr_write_b32 a2, v18
4747; GCN-NEXT: v_accvgpr_write_b32 a3, v19
4848; GCN-NEXT: s_nop 1
49- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi:[0,0,0]
49+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel:[1,1,0] op_sel_hi:[0,0,0]
5050; GCN-NEXT: s_nop 7
5151; GCN-NEXT: s_nop 3
5252; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -70,7 +70,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_2_2__cbsz1__blgp1(<8 x
7070; GCN-NEXT: v_accvgpr_write_b32 a2, v18
7171; GCN-NEXT: v_accvgpr_write_b32 a3, v19
7272; GCN-NEXT: s_nop 1
73- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi:[0,0 ,0]
73+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi:[1,1 ,0]
7474; GCN-NEXT: s_nop 7
7575; GCN-NEXT: s_nop 3
7676; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -94,7 +94,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_3_3__cbsz1__blgp1(<8 x
9494; GCN-NEXT: v_accvgpr_write_b32 a2, v18
9595; GCN-NEXT: v_accvgpr_write_b32 a3, v19
9696; GCN-NEXT: s_nop 1
97- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi:[0,0 ,0]
97+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel:[1,1,0] op_sel_hi:[1,1 ,0]
9898; GCN-NEXT: s_nop 7
9999; GCN-NEXT: s_nop 3
100100; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -118,7 +118,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_0_3__cbsz1__blgp1(<8 x
118118; GCN-NEXT: v_accvgpr_write_b32 a2, v18
119119; GCN-NEXT: v_accvgpr_write_b32 a3, v19
120120; GCN-NEXT: s_nop 1
121- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi :[0,0 ,0]
121+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel :[0,1,0] op_sel_hi:[0,1 ,0]
122122; GCN-NEXT: s_nop 7
123123; GCN-NEXT: s_nop 3
124124; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -142,7 +142,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_3_0__cbsz1__blgp1(<8 x
142142; GCN-NEXT: v_accvgpr_write_b32 a2, v18
143143; GCN-NEXT: v_accvgpr_write_b32 a3, v19
144144; GCN-NEXT: s_nop 1
145- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi:[0 ,0,0]
145+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel:[1,0,0] op_sel_hi:[1 ,0,0]
146146; GCN-NEXT: s_nop 7
147147; GCN-NEXT: s_nop 3
148148; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -166,7 +166,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_2_3__cbsz1__blgp1(<8 x
166166; GCN-NEXT: v_accvgpr_write_b32 a2, v18
167167; GCN-NEXT: v_accvgpr_write_b32 a3, v19
168168; GCN-NEXT: s_nop 1
169- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi :[0,0 ,0]
169+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel :[0,1,0] op_sel_hi:[1,1 ,0]
170170; GCN-NEXT: s_nop 7
171171; GCN-NEXT: s_nop 3
172172; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -190,7 +190,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_3_2__cbsz1__blgp1(<8 x
190190; GCN-NEXT: v_accvgpr_write_b32 a2, v18
191191; GCN-NEXT: v_accvgpr_write_b32 a3, v19
192192; GCN-NEXT: s_nop 1
193- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel_hi:[ 0,0,0]
193+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v20, v21 op_sel:[1, 0,0] op_sel_hi:[1,1 ,0]
194194; GCN-NEXT: s_nop 7
195195; GCN-NEXT: s_nop 3
196196; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -1797,7 +1797,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_0_0__scaleA_inlineimm__
17971797; GCN-NEXT: v_accvgpr_write_b32 a2, v18
17981798; GCN-NEXT: v_accvgpr_write_b32 a3, v19
17991799; GCN-NEXT: s_nop 1
1800- ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], 33, -2 op_sel_hi:[0,0 ,0]
1800+ ; GCN-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], 33, -2 op_sel_hi:[1,1 ,0]
18011801; GCN-NEXT: s_nop 7
18021802; GCN-NEXT: s_nop 3
18031803; GCN-NEXT: v_accvgpr_read_b32 v0, a0
@@ -1819,7 +1819,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_0_0__scaleA_kimm__scale
18191819; SDAG-NEXT: v_accvgpr_write_b32 a2, v18
18201820; SDAG-NEXT: v_accvgpr_write_b32 a3, v19
18211821; SDAG-NEXT: s_nop 1
1822- ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s0, -2 op_sel_hi:[0,0 ,0]
1822+ ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s0, -2 op_sel_hi:[1,1 ,0]
18231823; SDAG-NEXT: s_nop 7
18241824; SDAG-NEXT: s_nop 3
18251825; SDAG-NEXT: v_accvgpr_read_b32 v0, a0
@@ -1837,7 +1837,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_0_0__scaleA_kimm__scale
18371837; GISEL-NEXT: v_accvgpr_write_b32 a3, v19
18381838; GISEL-NEXT: v_mov_b32_e32 v16, 0x41
18391839; GISEL-NEXT: s_nop 1
1840- ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v16, -2 op_sel_hi:[0,0 ,0]
1840+ ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v16, -2 op_sel_hi:[1,1 ,0]
18411841; GISEL-NEXT: s_nop 7
18421842; GISEL-NEXT: s_nop 3
18431843; GISEL-NEXT: v_accvgpr_read_b32 v0, a0
@@ -1860,7 +1860,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_0_0__scaleA_kimm__scale
18601860; SDAG-NEXT: v_accvgpr_write_b32 a3, v19
18611861; SDAG-NEXT: v_mov_b32_e32 v16, 0x4d
18621862; SDAG-NEXT: s_nop 1
1863- ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s0, v16 op_sel_hi:[0,0 ,0]
1863+ ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s0, v16 op_sel_hi:[1,1 ,0]
18641864; SDAG-NEXT: s_nop 7
18651865; SDAG-NEXT: s_nop 3
18661866; SDAG-NEXT: v_accvgpr_read_b32 v0, a0
@@ -1879,7 +1879,7 @@ define <4 x float> @test_mfma_scale_f32_16x16x128_f8f6f4_0_0__scaleA_kimm__scale
18791879; GISEL-NEXT: v_mov_b32_e32 v16, 0x41
18801880; GISEL-NEXT: v_mov_b32_e32 v17, 0x4d
18811881; GISEL-NEXT: s_nop 1
1882- ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v16, v17 op_sel_hi:[0,0 ,0]
1882+ ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v16, v17 op_sel_hi:[1,1 ,0]
18831883; GISEL-NEXT: s_nop 7
18841884; GISEL-NEXT: s_nop 3
18851885; GISEL-NEXT: v_accvgpr_read_b32 v0, a0
@@ -1921,7 +1921,7 @@ define amdgpu_kernel void @test_mfma_scale_f32_16x16x128_f8f6f4__vgprcd(<8 x i32
19211921; SDAG-NEXT: v_accvgpr_write_b32 a3, s11
19221922; SDAG-NEXT: v_mov_b32_e32 v17, s13
19231923; SDAG-NEXT: s_nop 1
1924- ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s12, v17 op_sel_hi:[0 ,0,0] blgp:2
1924+ ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s12, v17 op_sel:[1,1,0] op_sel_hi:[1 ,0,0] blgp:2
19251925; SDAG-NEXT: s_nop 7
19261926; SDAG-NEXT: s_nop 3
19271927; SDAG-NEXT: global_store_dwordx4 v16, a[0:3], s[14:15]
@@ -1946,7 +1946,7 @@ define amdgpu_kernel void @test_mfma_scale_f32_16x16x128_f8f6f4__vgprcd(<8 x i32
19461946; GISEL-NEXT: v_accvgpr_write_b32 a3, s27
19471947; GISEL-NEXT: v_mov_b32_e32 v16, s29
19481948; GISEL-NEXT: s_nop 1
1949- ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s28, v16 op_sel_hi:[0 ,0,0] blgp:2
1949+ ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s28, v16 op_sel:[1,1,0] op_sel_hi:[1 ,0,0] blgp:2
19501950; GISEL-NEXT: v_mov_b32_e32 v0, 0
19511951; GISEL-NEXT: s_nop 7
19521952; GISEL-NEXT: s_nop 2
@@ -1987,7 +1987,7 @@ define amdgpu_kernel void @test_mfma_scale_f32_16x16x128_f8f6f4__vgprcd___scaleA
19871987; SDAG-NEXT: v_accvgpr_write_b32 a2, s2
19881988; SDAG-NEXT: v_accvgpr_write_b32 a3, s3
19891989; SDAG-NEXT: s_nop 1
1990- ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s6, -2 op_sel_hi:[0 ,0,0]
1990+ ; SDAG-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], s6, -2 op_sel:[1,1,0] op_sel_hi:[1 ,0,0]
19911991; SDAG-NEXT: s_nop 7
19921992; SDAG-NEXT: s_nop 3
19931993; SDAG-NEXT: global_store_dwordx4 v16, a[0:3], s[4:5]
@@ -2013,7 +2013,7 @@ define amdgpu_kernel void @test_mfma_scale_f32_16x16x128_f8f6f4__vgprcd___scaleA
20132013; GISEL-NEXT: v_accvgpr_write_b32 a2, s2
20142014; GISEL-NEXT: v_accvgpr_write_b32 a3, s3
20152015; GISEL-NEXT: s_nop 1
2016- ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v16, -2 op_sel_hi:[0 ,0,0]
2016+ ; GISEL-NEXT: v_mfma_scale_f32_16x16x128_f8f6f4 a[0:3], v[0:7], v[8:15], a[0:3], v16, -2 op_sel:[1,1,0] op_sel_hi:[1 ,0,0]
20172017; GISEL-NEXT: v_mov_b32_e32 v0, 0
20182018; GISEL-NEXT: s_nop 7
20192019; GISEL-NEXT: s_nop 2
0 commit comments