@@ -134,9 +134,9 @@ define amdgpu_kernel void @fptrunc_f64_to_f16(ptr addrspace(1) %out, double %in)
134134; SI-NEXT: s_cmp_lt_i32 s0, 31
135135; SI-NEXT: s_cmovk_i32 s6, 0x7c00
136136; SI-NEXT: s_cmp_lg_u32 s1, 0
137- ; SI-NEXT: s_cselect_b32 s1, s2, 0x7c00
137+ ; SI-NEXT: s_cmovk_i32 s2, 0x7c00
138138; SI-NEXT: s_cmpk_eq_i32 s0, 0x40f
139- ; SI-NEXT: s_cselect_b32 s0, s1 , s6
139+ ; SI-NEXT: s_cselect_b32 s0, s2 , s6
140140; SI-NEXT: s_lshr_b32 s1, s7, 16
141141; SI-NEXT: s_and_b32 s1, s1, 0x8000
142142; SI-NEXT: s_or_b32 s6, s1, s0
@@ -314,9 +314,9 @@ define amdgpu_kernel void @fptrunc_f64_to_f16(ptr addrspace(1) %out, double %in)
314314; GFX10-SAFE-SDAG-NEXT: s_movk_i32 s6, 0x7e00
315315; GFX10-SAFE-SDAG-NEXT: s_cmovk_i32 s5, 0x7c00
316316; GFX10-SAFE-SDAG-NEXT: s_cmp_lg_u32 s4, 0
317- ; GFX10-SAFE-SDAG-NEXT: s_cselect_b32 s4, s6, 0x7c00
317+ ; GFX10-SAFE-SDAG-NEXT: s_cmovk_i32 s6, 0x7c00
318318; GFX10-SAFE-SDAG-NEXT: s_cmpk_eq_i32 s2, 0x40f
319- ; GFX10-SAFE-SDAG-NEXT: s_cselect_b32 s2, s4 , s5
319+ ; GFX10-SAFE-SDAG-NEXT: s_cselect_b32 s2, s6 , s5
320320; GFX10-SAFE-SDAG-NEXT: s_lshr_b32 s3, s3, 16
321321; GFX10-SAFE-SDAG-NEXT: s_and_b32 s3, s3, 0x8000
322322; GFX10-SAFE-SDAG-NEXT: s_or_b32 s2, s3, s2
@@ -446,9 +446,9 @@ define amdgpu_kernel void @fptrunc_f64_to_f16(ptr addrspace(1) %out, double %in)
446446; GFX11-SAFE-SDAG-NEXT: s_movk_i32 s6, 0x7e00
447447; GFX11-SAFE-SDAG-NEXT: s_cmovk_i32 s5, 0x7c00
448448; GFX11-SAFE-SDAG-NEXT: s_cmp_lg_u32 s4, 0
449- ; GFX11-SAFE-SDAG-NEXT: s_cselect_b32 s4, s6, 0x7c00
449+ ; GFX11-SAFE-SDAG-NEXT: s_cmovk_i32 s6, 0x7c00
450450; GFX11-SAFE-SDAG-NEXT: s_cmpk_eq_i32 s2, 0x40f
451- ; GFX11-SAFE-SDAG-NEXT: s_cselect_b32 s2, s4 , s5
451+ ; GFX11-SAFE-SDAG-NEXT: s_cselect_b32 s2, s6 , s5
452452; GFX11-SAFE-SDAG-NEXT: s_lshr_b32 s3, s3, 16
453453; GFX11-SAFE-SDAG-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
454454; GFX11-SAFE-SDAG-NEXT: s_and_b32 s3, s3, 0x8000
0 commit comments