@@ -17,9 +17,7 @@ define float @fma_from_freeze_mul_add_left_with_nnan(float %x, float %y) {
1717; CHECK-LABEL: fma_from_freeze_mul_add_left_with_nnan:
1818; CHECK: ; %bb.0:
1919; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
20- ; CHECK-NEXT: v_mul_f32_e32 v0, v0, v1
21- ; CHECK-NEXT: s_delay_alu instid0(VALU_DEP_1)
22- ; CHECK-NEXT: v_add_f32_e32 v0, 1.0, v0
20+ ; CHECK-NEXT: v_fma_f32 v0, v0, v1, 1.0
2321; CHECK-NEXT: s_setpc_b64 s[30:31]
2422 %mul = fmul nnan contract afn float %x , %y
2523 %mul.fr = freeze float %mul
@@ -43,9 +41,7 @@ define float @fma_from_freeze_mul_add_right_with_nnan(float %x, float %y) {
4341; CHECK-LABEL: fma_from_freeze_mul_add_right_with_nnan:
4442; CHECK: ; %bb.0:
4543; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
46- ; CHECK-NEXT: v_mul_f32_e32 v0, v0, v1
47- ; CHECK-NEXT: s_delay_alu instid0(VALU_DEP_1)
48- ; CHECK-NEXT: v_add_f32_e32 v0, 1.0, v0
44+ ; CHECK-NEXT: v_fma_f32 v0, v0, v1, 1.0
4945; CHECK-NEXT: s_setpc_b64 s[30:31]
5046 %mul = fmul nnan contract float %x , %y
5147 %mul.fr = freeze float %mul
@@ -69,9 +65,7 @@ define float @fma_from_freeze_mul_sub_left_with_nnan(float %x, float %y) {
6965; CHECK-LABEL: fma_from_freeze_mul_sub_left_with_nnan:
7066; CHECK: ; %bb.0:
7167; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
72- ; CHECK-NEXT: v_mul_f32_e32 v0, v0, v1
73- ; CHECK-NEXT: s_delay_alu instid0(VALU_DEP_1)
74- ; CHECK-NEXT: v_add_f32_e32 v0, -1.0, v0
68+ ; CHECK-NEXT: v_fma_f32 v0, v0, v1, -1.0
7569; CHECK-NEXT: s_setpc_b64 s[30:31]
7670 %mul = fmul nnan contract float %x , %y
7771 %mul.fr = freeze float %mul
@@ -95,12 +89,42 @@ define float @fma_from_freeze_mul_sub_right_with_nnan(float %x, float %y) {
9589; CHECK-LABEL: fma_from_freeze_mul_sub_right_with_nnan:
9690; CHECK: ; %bb.0:
9791; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
98- ; CHECK-NEXT: v_mul_f32_e32 v0, v0, v1
99- ; CHECK-NEXT: s_delay_alu instid0(VALU_DEP_1)
100- ; CHECK-NEXT: v_sub_f32_e32 v0, 1.0, v0
92+ ; CHECK-NEXT: v_fma_f32 v0, -v0, v1, 1.0
10193; CHECK-NEXT: s_setpc_b64 s[30:31]
10294 %mul = fmul nnan contract float %x , %y
10395 %mul.fr = freeze float %mul
10496 %sub = fsub nnan contract float 1 .000000e+00 , %mul.fr
10597 ret float %sub
10698}
99+
100+ define float @fma_freeze_sink_multiple_maybe_poison_nnan_add (float %x , float %y ) {
101+ ; CHECK-LABEL: fma_freeze_sink_multiple_maybe_poison_nnan_add:
102+ ; CHECK: ; %bb.0:
103+ ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
104+ ; CHECK-NEXT: v_dual_subrev_f32 v0, 1.0, v0 :: v_dual_add_f32 v1, 1.0, v1
105+ ; CHECK-NEXT: s_delay_alu instid0(VALU_DEP_1)
106+ ; CHECK-NEXT: v_fma_f32 v0, v0, v1, 1.0
107+ ; CHECK-NEXT: s_setpc_b64 s[30:31]
108+ %fsub_x = fsub nnan contract float %x , 1 .000000e+00
109+ %fadd_y = fadd nnan contract float %y , 1 .000000e+00
110+ %mul = fmul nnan contract float %fsub_x , %fadd_y
111+ %mul.fr = freeze float %mul
112+ %add = fadd nnan contract float %mul.fr , 1 .000000e+00
113+ ret float %add
114+ }
115+
116+ define float @fma_freeze_sink_multiple_maybe_poison_nnan_sub (float %x , float %y ) {
117+ ; CHECK-LABEL: fma_freeze_sink_multiple_maybe_poison_nnan_sub:
118+ ; CHECK: ; %bb.0:
119+ ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
120+ ; CHECK-NEXT: v_dual_add_f32 v0, 1.0, v0 :: v_dual_add_f32 v1, -1.0, v1
121+ ; CHECK-NEXT: s_delay_alu instid0(VALU_DEP_1)
122+ ; CHECK-NEXT: v_fma_f32 v0, v0, v1, -1.0
123+ ; CHECK-NEXT: s_setpc_b64 s[30:31]
124+ %fadd_x = fadd nnan contract float %x , 1 .000000e+00
125+ %fsub_y = fsub nnan contract float %y , 1 .000000e+00
126+ %mul = fmul nnan contract float %fadd_x , %fsub_y
127+ %mul.fr = freeze float %mul
128+ %sub = fsub nnan contract float %mul.fr , 1 .000000e+00
129+ ret float %sub
130+ }
0 commit comments