@@ -28,7 +28,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_bf16_dst_sel_1(ptr addrspace(1)
2828; GFX950: ; %bb.0:
2929; GFX950-NEXT: global_load_dword v5, v[0:1], off
3030; GFX950-NEXT: s_waitcnt vmcnt(0)
31- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
31+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
3232; GFX950-NEXT: global_store_dword v[0:1], v5, off
3333; GFX950-NEXT: s_endpgm
3434 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -42,7 +42,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_bf16_dst_sel_2(ptr addrspace(1)
4242; GFX950: ; %bb.0:
4343; GFX950-NEXT: global_load_dword v5, v[0:1], off
4444; GFX950-NEXT: s_waitcnt vmcnt(0)
45- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
45+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
4646; GFX950-NEXT: global_store_dword v[0:1], v5, off
4747; GFX950-NEXT: s_endpgm
4848 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -84,7 +84,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f16_dst_sel_1(ptr addrspace(1) %
8484; GFX950: ; %bb.0:
8585; GFX950-NEXT: global_load_dword v5, v[0:1], off
8686; GFX950-NEXT: s_waitcnt vmcnt(0)
87- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
87+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
8888; GFX950-NEXT: global_store_dword v[0:1], v5, off
8989; GFX950-NEXT: s_endpgm
9090 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -98,7 +98,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f16_dst_sel_2(ptr addrspace(1) %
9898; GFX950: ; %bb.0:
9999; GFX950-NEXT: global_load_dword v5, v[0:1], off
100100; GFX950-NEXT: s_waitcnt vmcnt(0)
101- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
101+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
102102; GFX950-NEXT: global_store_dword v[0:1], v5, off
103103; GFX950-NEXT: s_endpgm
104104 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -140,7 +140,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f32_dst_sel_1(ptr addrspace(1) %
140140; GFX950: ; %bb.0:
141141; GFX950-NEXT: global_load_dword v5, v[0:1], off
142142; GFX950-NEXT: s_waitcnt vmcnt(0)
143- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
143+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
144144; GFX950-NEXT: global_store_dword v[0:1], v5, off
145145; GFX950-NEXT: s_endpgm
146146 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -154,7 +154,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_bf8_f32_dst_sel_2(ptr addrspace(1) %
154154; GFX950: ; %bb.0:
155155; GFX950-NEXT: global_load_dword v5, v[0:1], off
156156; GFX950-NEXT: s_waitcnt vmcnt(0)
157- ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
157+ ; GFX950-NEXT: v_cvt_scalef32_sr_bf8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
158158; GFX950-NEXT: global_store_dword v[0:1], v5, off
159159; GFX950-NEXT: s_endpgm
160160 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -196,7 +196,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_bf16_dst_sel_1(ptr addrspace(1)
196196; GFX950: ; %bb.0:
197197; GFX950-NEXT: global_load_dword v5, v[0:1], off
198198; GFX950-NEXT: s_waitcnt vmcnt(0)
199- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
199+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
200200; GFX950-NEXT: global_store_dword v[0:1], v5, off
201201; GFX950-NEXT: s_endpgm
202202 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -210,7 +210,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_bf16_dst_sel_2(ptr addrspace(1)
210210; GFX950: ; %bb.0:
211211; GFX950-NEXT: global_load_dword v5, v[0:1], off
212212; GFX950-NEXT: s_waitcnt vmcnt(0)
213- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
213+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_bf16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
214214; GFX950-NEXT: global_store_dword v[0:1], v5, off
215215; GFX950-NEXT: s_endpgm
216216 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -252,7 +252,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f16_dst_sel_1(ptr addrspace(1) %
252252; GFX950: ; %bb.0:
253253; GFX950-NEXT: global_load_dword v5, v[0:1], off
254254; GFX950-NEXT: s_waitcnt vmcnt(0)
255- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
255+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
256256; GFX950-NEXT: global_store_dword v[0:1], v5, off
257257; GFX950-NEXT: s_endpgm
258258 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -266,7 +266,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f16_dst_sel_2(ptr addrspace(1) %
266266; GFX950: ; %bb.0:
267267; GFX950-NEXT: global_load_dword v5, v[0:1], off
268268; GFX950-NEXT: s_waitcnt vmcnt(0)
269- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
269+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f16 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
270270; GFX950-NEXT: global_store_dword v[0:1], v5, off
271271; GFX950-NEXT: s_endpgm
272272 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -308,7 +308,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f32_dst_sel_1(ptr addrspace(1) %
308308; GFX950: ; %bb.0:
309309; GFX950-NEXT: global_load_dword v5, v[0:1], off
310310; GFX950-NEXT: s_waitcnt vmcnt(0)
311- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
311+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
312312; GFX950-NEXT: global_store_dword v[0:1], v5, off
313313; GFX950-NEXT: s_endpgm
314314 %old = load i32 , ptr addrspace (1 ) %out , align 4
@@ -322,7 +322,7 @@ define amdgpu_ps void @test_cvt_scalef32_sr_fp8_f32_dst_sel_2(ptr addrspace(1) %
322322; GFX950: ; %bb.0:
323323; GFX950-NEXT: global_load_dword v5, v[0:1], off
324324; GFX950-NEXT: s_waitcnt vmcnt(0)
325- ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,1,0 ]
325+ ; GFX950-NEXT: v_cvt_scalef32_sr_fp8_f32 v5, v2, v3, v4 op_sel:[0,0,0,1 ]
326326; GFX950-NEXT: global_store_dword v[0:1], v5, off
327327; GFX950-NEXT: s_endpgm
328328 %old = load i32 , ptr addrspace (1 ) %out , align 4
0 commit comments