@@ -44,10 +44,64 @@ exit:
4444 ret void
4545}
4646
47+ define i32 @test_remove_iv (i32 %start ) #0 {
48+ ; CHECK-LABEL: define i32 @test_remove_iv(
49+ ; CHECK-SAME: i32 [[START:%.*]]) #[[ATTR0]] {
50+ ; CHECK-NEXT: [[ENTRY:.*:]]
51+ ; CHECK-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
52+ ; CHECK: [[VECTOR_PH]]:
53+ ; CHECK-NEXT: [[TMP0:%.*]] = call i32 @llvm.vscale.i32()
54+ ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw i32 [[TMP0]], 4
55+ ; CHECK-NEXT: [[TMP2:%.*]] = insertelement <vscale x 4 x i32> zeroinitializer, i32 [[START]], i32 0
56+ ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
57+ ; CHECK: [[VECTOR_BODY]]:
58+ ; CHECK-NEXT: [[EVL_BASED_IV:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_EVL_NEXT:%.*]], %[[VECTOR_BODY]] ]
59+ ; CHECK-NEXT: [[VEC_PHI:%.*]] = phi <vscale x 4 x i32> [ [[TMP2]], %[[VECTOR_PH]] ], [ [[TMP5:%.*]], %[[VECTOR_BODY]] ]
60+ ; CHECK-NEXT: [[AVL:%.*]] = phi i32 [ 6, %[[VECTOR_PH]] ], [ [[AVL_NEXT:%.*]], %[[VECTOR_BODY]] ]
61+ ; CHECK-NEXT: [[TMP3:%.*]] = call i32 @llvm.experimental.get.vector.length.i32(i32 [[AVL]], i32 4, i1 true)
62+ ; CHECK-NEXT: [[TMP4:%.*]] = xor <vscale x 4 x i32> [[VEC_PHI]], splat (i32 3)
63+ ; CHECK-NEXT: [[TMP5]] = call <vscale x 4 x i32> @llvm.vp.merge.nxv4i32(<vscale x 4 x i1> splat (i1 true), <vscale x 4 x i32> [[TMP4]], <vscale x 4 x i32> [[VEC_PHI]], i32 [[TMP3]])
64+ ; CHECK-NEXT: [[INDEX_EVL_NEXT]] = add nuw i32 [[TMP3]], [[EVL_BASED_IV]]
65+ ; CHECK-NEXT: [[AVL_NEXT]] = sub nuw i32 [[AVL]], [[TMP3]]
66+ ; CHECK-NEXT: br i1 true, label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP3:![0-9]+]]
67+ ; CHECK: [[MIDDLE_BLOCK]]:
68+ ; CHECK-NEXT: [[TMP6:%.*]] = call i32 @llvm.vector.reduce.xor.nxv4i32(<vscale x 4 x i32> [[TMP5]])
69+ ; CHECK-NEXT: br label %[[EXIT:.*]]
70+ ; CHECK: [[SCALAR_PH]]:
71+ ; CHECK-NEXT: br label %[[LOOP:.*]]
72+ ; CHECK: [[LOOP]]:
73+ ; CHECK-NEXT: [[IV:%.*]] = phi i32 [ 0, %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
74+ ; CHECK-NEXT: [[RED:%.*]] = phi i32 [ [[START]], %[[SCALAR_PH]] ], [ [[RED_NEXT:%.*]], %[[LOOP]] ]
75+ ; CHECK-NEXT: [[RED_NEXT]] = xor i32 [[RED]], 3
76+ ; CHECK-NEXT: [[IV_NEXT]] = add i32 [[IV]], 1
77+ ; CHECK-NEXT: [[EC:%.*]] = icmp eq i32 [[IV]], 5
78+ ; CHECK-NEXT: br i1 [[EC]], label %[[EXIT]], label %[[LOOP]], !llvm.loop [[LOOP5:![0-9]+]]
79+ ; CHECK: [[EXIT]]:
80+ ; CHECK-NEXT: [[RED_NEXT_LCSSA:%.*]] = phi i32 [ [[RED_NEXT]], %[[LOOP]] ], [ [[TMP6]], %[[MIDDLE_BLOCK]] ]
81+ ; CHECK-NEXT: ret i32 [[RED_NEXT_LCSSA]]
82+ ;
83+ entry:
84+ br label %loop
85+
86+ loop:
87+ %iv = phi i32 [ 0 , %entry ], [ %iv.next , %loop ]
88+ %red = phi i32 [ %start , %entry ], [ %red.next , %loop ]
89+ %red.next = xor i32 %red , 3
90+ %iv.next = add i32 %iv , 1
91+ %ec = icmp eq i32 %iv , 5
92+ br i1 %ec , label %exit , label %loop
93+
94+ exit:
95+ ret i32 %red.next
96+ }
97+
4798attributes #0 = { vscale_range(2 ,2 ) }
4899
49100;.
50101; CHECK: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]], [[META2:![0-9]+]]}
51102; CHECK: [[META1]] = !{!"llvm.loop.unroll.runtime.disable"}
52103; CHECK: [[META2]] = !{!"llvm.loop.isvectorized", i32 1}
104+ ; CHECK: [[LOOP3]] = distinct !{[[LOOP3]], [[META2]], [[META4:![0-9]+]], [[META1]]}
105+ ; CHECK: [[META4]] = !{!"llvm.loop.isvectorized.tailfoldingstyle", !"evl"}
106+ ; CHECK: [[LOOP5]] = distinct !{[[LOOP5]], [[META1]], [[META2]]}
53107;.
0 commit comments