@@ -44,10 +44,64 @@ exit:
44
44
ret void
45
45
}
46
46
47
+ define i32 @test_remove_iv (i32 %start ) #0 {
48
+ ; CHECK-LABEL: define i32 @test_remove_iv(
49
+ ; CHECK-SAME: i32 [[START:%.*]]) #[[ATTR0]] {
50
+ ; CHECK-NEXT: [[ENTRY:.*:]]
51
+ ; CHECK-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
52
+ ; CHECK: [[VECTOR_PH]]:
53
+ ; CHECK-NEXT: [[TMP0:%.*]] = call i32 @llvm.vscale.i32()
54
+ ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw i32 [[TMP0]], 4
55
+ ; CHECK-NEXT: [[TMP2:%.*]] = insertelement <vscale x 4 x i32> zeroinitializer, i32 [[START]], i32 0
56
+ ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
57
+ ; CHECK: [[VECTOR_BODY]]:
58
+ ; CHECK-NEXT: [[EVL_BASED_IV:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_EVL_NEXT:%.*]], %[[VECTOR_BODY]] ]
59
+ ; CHECK-NEXT: [[VEC_PHI:%.*]] = phi <vscale x 4 x i32> [ [[TMP2]], %[[VECTOR_PH]] ], [ [[TMP5:%.*]], %[[VECTOR_BODY]] ]
60
+ ; CHECK-NEXT: [[AVL:%.*]] = phi i32 [ 6, %[[VECTOR_PH]] ], [ [[AVL_NEXT:%.*]], %[[VECTOR_BODY]] ]
61
+ ; CHECK-NEXT: [[TMP3:%.*]] = call i32 @llvm.experimental.get.vector.length.i32(i32 [[AVL]], i32 4, i1 true)
62
+ ; CHECK-NEXT: [[TMP4:%.*]] = xor <vscale x 4 x i32> [[VEC_PHI]], splat (i32 3)
63
+ ; CHECK-NEXT: [[TMP5]] = call <vscale x 4 x i32> @llvm.vp.merge.nxv4i32(<vscale x 4 x i1> splat (i1 true), <vscale x 4 x i32> [[TMP4]], <vscale x 4 x i32> [[VEC_PHI]], i32 [[TMP3]])
64
+ ; CHECK-NEXT: [[INDEX_EVL_NEXT]] = add nuw i32 [[TMP3]], [[EVL_BASED_IV]]
65
+ ; CHECK-NEXT: [[AVL_NEXT]] = sub nuw i32 [[AVL]], [[TMP3]]
66
+ ; CHECK-NEXT: br i1 true, label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP3:![0-9]+]]
67
+ ; CHECK: [[MIDDLE_BLOCK]]:
68
+ ; CHECK-NEXT: [[TMP6:%.*]] = call i32 @llvm.vector.reduce.xor.nxv4i32(<vscale x 4 x i32> [[TMP5]])
69
+ ; CHECK-NEXT: br label %[[EXIT:.*]]
70
+ ; CHECK: [[SCALAR_PH]]:
71
+ ; CHECK-NEXT: br label %[[LOOP:.*]]
72
+ ; CHECK: [[LOOP]]:
73
+ ; CHECK-NEXT: [[IV:%.*]] = phi i32 [ 0, %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
74
+ ; CHECK-NEXT: [[RED:%.*]] = phi i32 [ [[START]], %[[SCALAR_PH]] ], [ [[RED_NEXT:%.*]], %[[LOOP]] ]
75
+ ; CHECK-NEXT: [[RED_NEXT]] = xor i32 [[RED]], 3
76
+ ; CHECK-NEXT: [[IV_NEXT]] = add i32 [[IV]], 1
77
+ ; CHECK-NEXT: [[EC:%.*]] = icmp eq i32 [[IV]], 5
78
+ ; CHECK-NEXT: br i1 [[EC]], label %[[EXIT]], label %[[LOOP]], !llvm.loop [[LOOP5:![0-9]+]]
79
+ ; CHECK: [[EXIT]]:
80
+ ; CHECK-NEXT: [[RED_NEXT_LCSSA:%.*]] = phi i32 [ [[RED_NEXT]], %[[LOOP]] ], [ [[TMP6]], %[[MIDDLE_BLOCK]] ]
81
+ ; CHECK-NEXT: ret i32 [[RED_NEXT_LCSSA]]
82
+ ;
83
+ entry:
84
+ br label %loop
85
+
86
+ loop:
87
+ %iv = phi i32 [ 0 , %entry ], [ %iv.next , %loop ]
88
+ %red = phi i32 [ %start , %entry ], [ %red.next , %loop ]
89
+ %red.next = xor i32 %red , 3
90
+ %iv.next = add i32 %iv , 1
91
+ %ec = icmp eq i32 %iv , 5
92
+ br i1 %ec , label %exit , label %loop
93
+
94
+ exit:
95
+ ret i32 %red.next
96
+ }
97
+
47
98
attributes #0 = { vscale_range(2 ,2 ) }
48
99
49
100
;.
50
101
; CHECK: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]], [[META2:![0-9]+]]}
51
102
; CHECK: [[META1]] = !{!"llvm.loop.unroll.runtime.disable"}
52
103
; CHECK: [[META2]] = !{!"llvm.loop.isvectorized", i32 1}
104
+ ; CHECK: [[LOOP3]] = distinct !{[[LOOP3]], [[META2]], [[META4:![0-9]+]], [[META1]]}
105
+ ; CHECK: [[META4]] = !{!"llvm.loop.isvectorized.tailfoldingstyle", !"evl"}
106
+ ; CHECK: [[LOOP5]] = distinct !{[[LOOP5]], [[META1]], [[META2]]}
53
107
;.
0 commit comments