@@ -66,22 +66,19 @@ define void @wide_gep_index_invariant(ptr noalias %dst, ptr noalias %src, i64 %n
66
66
; CHECK-NEXT: entry:
67
67
; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]]
68
68
; CHECK: vector.ph:
69
- ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i64> poison, i64 [[N]], i64 0
70
- ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i64> [[BROADCAST_SPLATINSERT]], <4 x i64> poison, <4 x i32> zeroinitializer
71
69
; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
72
70
; CHECK: vector.body:
73
71
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
74
72
; CHECK-NEXT: [[TMP0:%.*]] = load ptr, ptr [[SRC]], align 8
75
- ; CHECK-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <4 x ptr> poison, ptr [[TMP0]], i64 0
76
- ; CHECK-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <4 x ptr> [[BROADCAST_SPLATINSERT1]], <4 x ptr> poison, <4 x i32> zeroinitializer
77
- ; CHECK-NEXT: [[TMP1:%.*]] = extractelement <4 x i64> [[BROADCAST_SPLAT]], i32 0
78
- ; CHECK-NEXT: [[TMP2:%.*]] = getelementptr float, <4 x ptr> [[BROADCAST_SPLAT2]], i64 [[TMP1]]
79
- ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr ptr, ptr [[DST]], i64 [[INDEX]]
80
- ; CHECK-NEXT: [[TMP4:%.*]] = getelementptr ptr, ptr [[TMP3]], i32 0
81
- ; CHECK-NEXT: store <4 x ptr> [[TMP2]], ptr [[TMP4]], align 8
73
+ ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x ptr> poison, ptr [[TMP0]], i64 0
74
+ ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x ptr> [[BROADCAST_SPLATINSERT]], <4 x ptr> poison, <4 x i32> zeroinitializer
75
+ ; CHECK-NEXT: [[TMP1:%.*]] = getelementptr float, <4 x ptr> [[BROADCAST_SPLAT]], i64 [[N]]
76
+ ; CHECK-NEXT: [[TMP2:%.*]] = getelementptr ptr, ptr [[DST]], i64 [[INDEX]]
77
+ ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr ptr, ptr [[TMP2]], i32 0
78
+ ; CHECK-NEXT: store <4 x ptr> [[TMP1]], ptr [[TMP3]], align 8
82
79
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 4
83
- ; CHECK-NEXT: [[TMP5:%.*]] = icmp eq i64 [[INDEX_NEXT]], 100
84
- ; CHECK-NEXT: br i1 [[TMP5]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]]
80
+ ; CHECK-NEXT: [[TMP4:%.*]] = icmp eq i64 [[INDEX_NEXT]], 100
81
+ ; CHECK-NEXT: br i1 [[TMP4]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]]
85
82
; CHECK: middle.block:
86
83
; CHECK-NEXT: br i1 true, label [[EXIT:%.*]], label [[SCALAR_PH]]
87
84
; CHECK: scalar.ph:
@@ -115,3 +112,58 @@ loop:
115
112
exit:
116
113
ret void
117
114
}
115
+
116
+ ; Test: a getelementptr with two indices where only one varies with the loop.
+ ; The scalar loop below runs %iv from 0 to 99; each iteration reloads a pointer
+ ; from %src, indexes it as [10 x float] with (%x, %iv), and stores the
+ ; resulting address to %dst[%iv]. %x is a function argument, so it is
+ ; loop-invariant; %iv is the induction variable.
+ ; The expected output keeps the invariant index as the scalar i32 [[X]]
+ ; operand of the wide GEP (no splat of %x appears in vector.ph), while the
+ ; induction index is supplied as the <4 x i64> [[VEC_IND]] vector.
+ ; NOTE(review): the RUN line is not visible in this chunk; the assertions
+ ; presumably come from the loop vectorizer at VF=4 -- confirm against the
+ ; file header.
+ define void @wide_gep_multiple_indices_some_invariant (ptr noalias %dst , ptr noalias %src , i32 %x ) {
117
+ ; CHECK-LABEL: define void @wide_gep_multiple_indices_some_invariant
118
+ ; CHECK-SAME: (ptr noalias [[DST:%.*]], ptr noalias [[SRC:%.*]], i32 [[X:%.*]]) {
119
+ ; CHECK-NEXT: entry:
120
+ ; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]]
121
+ ; CHECK: vector.ph:
122
+ ; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
123
+ ; CHECK: vector.body:
124
+ ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
125
+ ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <4 x i64> [ <i64 0, i64 1, i64 2, i64 3>, [[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], [[VECTOR_BODY]] ]
126
+ ; CHECK-NEXT: [[TMP0:%.*]] = load ptr, ptr [[SRC]], align 8
127
+ ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x ptr> poison, ptr [[TMP0]], i64 0
128
+ ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x ptr> [[BROADCAST_SPLATINSERT]], <4 x ptr> poison, <4 x i32> zeroinitializer
129
+ ; CHECK-NEXT: [[TMP1:%.*]] = getelementptr [10 x float], <4 x ptr> [[BROADCAST_SPLAT]], i32 [[X]], <4 x i64> [[VEC_IND]]
130
+ ; CHECK-NEXT: [[TMP2:%.*]] = getelementptr ptr, ptr [[DST]], i64 [[INDEX]]
131
+ ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr ptr, ptr [[TMP2]], i32 0
132
+ ; CHECK-NEXT: store <4 x ptr> [[TMP1]], ptr [[TMP3]], align 8
133
+ ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 4
134
+ ; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i64> [[VEC_IND]], splat (i64 4)
135
+ ; CHECK-NEXT: [[TMP4:%.*]] = icmp eq i64 [[INDEX_NEXT]], 100
136
+ ; CHECK-NEXT: br i1 [[TMP4]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP6:![0-9]+]]
137
+ ; CHECK: middle.block:
138
+ ; CHECK-NEXT: br i1 true, label [[EXIT:%.*]], label [[SCALAR_PH]]
139
+ ; CHECK: scalar.ph:
140
+ ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ 100, [[MIDDLE_BLOCK]] ], [ 0, [[ENTRY:%.*]] ]
141
+ ; CHECK-NEXT: br label [[LOOP:%.*]]
142
+ ; CHECK: loop:
143
+ ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
144
+ ; CHECK-NEXT: [[L:%.*]] = load ptr, ptr [[SRC]], align 8
145
+ ; CHECK-NEXT: [[GEP_L:%.*]] = getelementptr [10 x float], ptr [[L]], i32 [[X]], i64 [[IV]]
146
+ ; CHECK-NEXT: [[GEP_DST:%.*]] = getelementptr ptr, ptr [[DST]], i64 [[IV]]
147
+ ; CHECK-NEXT: store ptr [[GEP_L]], ptr [[GEP_DST]], align 8
148
+ ; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
149
+ ; CHECK-NEXT: [[EC:%.*]] = icmp eq i64 [[IV_NEXT]], 100
150
+ ; CHECK-NEXT: br i1 [[EC]], label [[EXIT]], label [[LOOP]], !llvm.loop [[LOOP7:![0-9]+]]
151
+ ; CHECK: exit:
152
+ ; CHECK-NEXT: ret void
153
+ ;
154
+ entry:
155
+ br label %loop
156
+
157
+ loop:
158
+ %iv = phi i64 [ 0 , %entry ], [ %iv.next , %loop ]
+ ; The base pointer is reloaded from %src on every iteration.
159
+ %l = load ptr , ptr %src , align 8
+ ; Two-index GEP: %x does not change inside the loop, %iv does.
160
+ %gep.l = getelementptr [10 x float ], ptr %l , i32 %x , i64 %iv
161
+ %gep.dst = getelementptr ptr , ptr %dst , i64 %iv
+ ; The computed address itself (not a loaded float) is what gets stored.
162
+ store ptr %gep.l , ptr %gep.dst , align 8
163
+ %iv.next = add nuw nsw i64 %iv , 1
+ ; Exit once %iv.next reaches 100, i.e. after 100 iterations.
164
+ %ec = icmp eq i64 %iv.next , 100
165
+ br i1 %ec , label %exit , label %loop
166
+
167
+ exit:
168
+ ret void
169
+ }
0 commit comments