@@ -5896,30 +5896,30 @@ define void @sink_vp_splat(ptr nocapture %out, ptr nocapture %in) {
58965896; CHECK: # %bb.0: # %entry
58975897; CHECK-NEXT: li a2, 0
58985898; CHECK-NEXT: li a3, 1024
5899- ; CHECK-NEXT: lui a4, 1
5899+ ; CHECK-NEXT: li a4, 3
5900+ ; CHECK-NEXT: lui a5, 1
59005901; CHECK-NEXT: .LBB129_1: # %vector.body
59015902; CHECK-NEXT: # =>This Loop Header: Depth=1
59025903; CHECK-NEXT: # Child Loop BB129_2 Depth 2
5903- ; CHECK-NEXT: vsetvli a5 , a3, e32, m4, ta, ma
5904- ; CHECK-NEXT: slli a6 , a2, 2
5904+ ; CHECK-NEXT: vsetvli a6 , a3, e32, m4, ta, ma
5905+ ; CHECK-NEXT: slli a7 , a2, 2
59055906; CHECK-NEXT: vmv.v.i v8, 0
5906- ; CHECK-NEXT: vmv.v.i v12, 3
5907- ; CHECK-NEXT: add a7, a1, a6
5908- ; CHECK-NEXT: li t0, 1024
5907+ ; CHECK-NEXT: add t0, a1, a7
5908+ ; CHECK-NEXT: li t1, 1024
59095909; CHECK-NEXT: .LBB129_2: # %for.body424
59105910; CHECK-NEXT: # Parent Loop BB129_1 Depth=1
59115911; CHECK-NEXT: # => This Inner Loop Header: Depth=2
5912- ; CHECK-NEXT: vle32.v v16 , (a7 )
5913- ; CHECK-NEXT: addi t0, t0 , -1
5914- ; CHECK-NEXT: vmacc.vv v8, v16 , v12
5915- ; CHECK-NEXT: add a7, a7, a4
5916- ; CHECK-NEXT: bnez t0 , .LBB129_2
5912+ ; CHECK-NEXT: vle32.v v12 , (t0 )
5913+ ; CHECK-NEXT: addi t1, t1 , -1
5914+ ; CHECK-NEXT: vmacc.vx v8, a4 , v12
5915+ ; CHECK-NEXT: add t0, t0, a5
5916+ ; CHECK-NEXT: bnez t1 , .LBB129_2
59175917; CHECK-NEXT: # %bb.3: # %vector.latch
59185918; CHECK-NEXT: # in Loop: Header=BB129_1 Depth=1
5919- ; CHECK-NEXT: add a6 , a0, a6
5920- ; CHECK-NEXT: sub a3, a3, a5
5921- ; CHECK-NEXT: vse32.v v8, (a6 )
5922- ; CHECK-NEXT: add a2, a2, a5
5919+ ; CHECK-NEXT: add a7 , a0, a7
5920+ ; CHECK-NEXT: sub a3, a3, a6
5921+ ; CHECK-NEXT: vse32.v v8, (a7 )
5922+ ; CHECK-NEXT: add a2, a2, a6
59235923; CHECK-NEXT: bnez a3, .LBB129_1
59245924; CHECK-NEXT: # %bb.4: # %for.cond.cleanup
59255925; CHECK-NEXT: ret
@@ -5962,24 +5962,23 @@ define void @sink_vp_splat_vfwadd_wf(ptr nocapture %in, float %f) {
59625962; CHECK-LABEL: sink_vp_splat_vfwadd_wf:
59635963; CHECK: # %bb.0: # %entry
59645964; CHECK-NEXT: li a1, 0
5965- ; CHECK-NEXT: fcvt.d.s fa5, fa0
59665965; CHECK-NEXT: li a2, 1024
59675966; CHECK-NEXT: lui a3, 2
59685967; CHECK-NEXT: .LBB130_1: # %vector.body
59695968; CHECK-NEXT: # =>This Loop Header: Depth=1
59705969; CHECK-NEXT: # Child Loop BB130_2 Depth 2
5971- ; CHECK-NEXT: vsetvli a4, a2, e64, m8 , ta, ma
5970+ ; CHECK-NEXT: vsetvli a4, a2, e8, m1 , ta, ma
59725971; CHECK-NEXT: slli a5, a1, 3
5973- ; CHECK-NEXT: vfmv.v.f v8, fa5
59745972; CHECK-NEXT: add a5, a0, a5
59755973; CHECK-NEXT: li a6, 1024
59765974; CHECK-NEXT: .LBB130_2: # %for.body419
59775975; CHECK-NEXT: # Parent Loop BB130_1 Depth=1
59785976; CHECK-NEXT: # => This Inner Loop Header: Depth=2
5979- ; CHECK-NEXT: vle64.v v16, (a5)
5977+ ; CHECK-NEXT: vsetvli zero, zero, e32, m4, ta, ma
5978+ ; CHECK-NEXT: vle64.v v8, (a5)
59805979; CHECK-NEXT: addi a6, a6, -1
5981- ; CHECK-NEXT: vfadd.vv v16, v16, v8
5982- ; CHECK-NEXT: vse64.v v16 , (a5)
5980+ ; CHECK-NEXT: vfwadd.wf v8, v8, fa0
5981+ ; CHECK-NEXT: vse64.v v8 , (a5)
59835982; CHECK-NEXT: add a5, a5, a3
59845983; CHECK-NEXT: bnez a6, .LBB130_2
59855984; CHECK-NEXT: # %bb.3: # %vector.latch
0 commit comments