@@ -23,19 +23,19 @@ define half @reduce_fadd_half(<8 x half> %in) {
2323; CHECK-EMPTY:
2424; CHECK-NEXT: // %bb.0:
2525; CHECK-NEXT: ld.param.v4.u32 {%r1, %r2, %r3, %r4}, [reduce_fadd_half_param_0];
26- ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r4 ;
27- ; CHECK-NEXT: mov.b32 { %rs3, %rs4}, %r3 ;
28- ; CHECK-NEXT: mov.b32 {%rs5 , %rs6} , %r2 ;
29- ; CHECK-NEXT: mov.b32 {%rs7 , %rs8} , %r1 ;
30- ; CHECK-NEXT: mov.b16 %rs9, 0x0000 ;
31- ; CHECK-NEXT: add.rn.f16 %rs10 , %rs7 , %rs9 ;
32- ; CHECK-NEXT: add.rn.f16 %rs11 , %rs10 , %rs8 ;
33- ; CHECK-NEXT: add.rn.f16 %rs12 , %rs11, %rs5 ;
34- ; CHECK-NEXT: add.rn.f16 %rs13 , %rs12 , %rs6 ;
35- ; CHECK-NEXT: add.rn.f16 %rs14 , %rs13 , %rs3 ;
36- ; CHECK-NEXT: add.rn.f16 %rs15 , %rs14 , %rs4 ;
37- ; CHECK-NEXT: add.rn.f16 %rs16, %rs15 , %rs1 ;
38- ; CHECK-NEXT: add.rn.f16 %rs17, %rs16, %rs2 ;
26+ ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r1 ;
27+ ; CHECK-NEXT: mov.b16 %rs3, 0x0000 ;
28+ ; CHECK-NEXT: add.rn.f16 %rs4 , %rs1 , %rs3 ;
29+ ; CHECK-NEXT: add.rn.f16 %rs5 , %rs4 , %rs2 ;
30+ ; CHECK-NEXT: mov.b32 {%rs6, %rs7}, %r2 ;
31+ ; CHECK-NEXT: add.rn.f16 %rs8 , %rs5 , %rs6 ;
32+ ; CHECK-NEXT: add.rn.f16 %rs9 , %rs8 , %rs7 ;
33+ ; CHECK-NEXT: mov.b32 {%rs10 , %rs11} , %r3 ;
34+ ; CHECK-NEXT: add.rn.f16 %rs12 , %rs9 , %rs10 ;
35+ ; CHECK-NEXT: add.rn.f16 %rs13 , %rs12 , %rs11 ;
36+ ; CHECK-NEXT: mov.b32 {%rs14 , %rs15} , %r4 ;
37+ ; CHECK-NEXT: add.rn.f16 %rs16, %rs13 , %rs14 ;
38+ ; CHECK-NEXT: add.rn.f16 %rs17, %rs16, %rs15 ;
3939; CHECK-NEXT: st.param.b16 [func_retval0], %rs17;
4040; CHECK-NEXT: ret;
4141 %res = call half @llvm.vector.reduce.fadd (half 0 .0 , <8 x half > %in )
@@ -174,17 +174,17 @@ define half @reduce_fmul_half(<8 x half> %in) {
174174; CHECK-EMPTY:
175175; CHECK-NEXT: // %bb.0:
176176; CHECK-NEXT: ld.param.v4.u32 {%r1, %r2, %r3, %r4}, [reduce_fmul_half_param_0];
177- ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r4 ;
178- ; CHECK-NEXT: mov.b32 {%rs3, %rs4}, %r3 ;
179- ; CHECK-NEXT: mov.b32 { %rs5, %rs6} , %r2 ;
180- ; CHECK-NEXT: mov.b32 {%rs7 , %rs8} , %r1 ;
181- ; CHECK-NEXT: mul.rn.f16 %rs9 , %rs7 , %rs8 ;
182- ; CHECK-NEXT: mul.rn.f16 %rs10 , %rs9, %rs5 ;
183- ; CHECK-NEXT: mul.rn.f16 %rs11 , %rs10 , %rs6 ;
184- ; CHECK-NEXT: mul.rn.f16 %rs12 , %rs11 , %rs3 ;
185- ; CHECK-NEXT: mul.rn.f16 %rs13 , %rs12 , %rs4 ;
186- ; CHECK-NEXT: mul.rn.f16 %rs14, %rs13 , %rs1 ;
187- ; CHECK-NEXT: mul.rn.f16 %rs15, %rs14, %rs2 ;
177+ ; CHECK-NEXT: mov.b32 {%rs1, %rs2}, %r2 ;
178+ ; CHECK-NEXT: mov.b32 {%rs3, %rs4}, %r1 ;
179+ ; CHECK-NEXT: mul.rn.f16 %rs5, %rs3 , %rs4 ;
180+ ; CHECK-NEXT: mul.rn.f16 %rs6 , %rs5 , %rs1 ;
181+ ; CHECK-NEXT: mul.rn.f16 %rs7 , %rs6 , %rs2 ;
182+ ; CHECK-NEXT: mov.b32 {%rs8 , %rs9} , %r3 ;
183+ ; CHECK-NEXT: mul.rn.f16 %rs10 , %rs7 , %rs8 ;
184+ ; CHECK-NEXT: mul.rn.f16 %rs11 , %rs10 , %rs9 ;
185+ ; CHECK-NEXT: mov.b32 {%rs12 , %rs13} , %r4 ;
186+ ; CHECK-NEXT: mul.rn.f16 %rs14, %rs11 , %rs12 ;
187+ ; CHECK-NEXT: mul.rn.f16 %rs15, %rs14, %rs13 ;
188188; CHECK-NEXT: st.param.b16 [func_retval0], %rs15;
189189; CHECK-NEXT: ret;
190190 %res = call half @llvm.vector.reduce.fmul (half 1 .0 , <8 x half > %in )
0 commit comments