1
+ ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --filter-out-after "vector.ph" --version 5
1
2
; RUN: opt %s -passes=loop-vectorize -hoist-runtime-checks=false -force-vector-width=4 -force-vector-interleave=1 -S | FileCheck %s
2
3
3
4
target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
4
5
5
6
define void @same_step_and_size (ptr %a , ptr %b , i64 %n ) {
6
- ; CHECK-LABEL: @same_step_and_size(
7
- ; CHECK-NEXT: entry:
8
- ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A:%.*]] to i64
9
- ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B:%.*]] to i64
10
- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
11
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
12
- ; CHECK: vector.memcheck:
7
+ ; CHECK-LABEL: define void @same_step_and_size(
8
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
9
+ ; CHECK-NEXT: [[ENTRY:.*:]]
10
+ ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A]] to i64
11
+ ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B]] to i64
12
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
13
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
14
+ ; CHECK: [[VECTOR_MEMCHECK]]:
13
15
; CHECK-NEXT: [[TMP0:%.*]] = sub i64 [[B1]], [[A2]]
14
16
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 16
15
- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
17
+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
16
18
;
17
19
entry:
18
20
br label %loop
@@ -33,16 +35,17 @@ exit:
33
35
}
34
36
35
37
define void @same_step_and_size_no_dominance_between_accesses (ptr %a , ptr %b , i64 %n , i64 %x ) {
36
- ; CHECK-LABEL: @same_step_and_size_no_dominance_between_accesses(
37
- ; CHECK-NEXT: entry:
38
- ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B:%.*]] to i64
39
- ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A:%.*]] to i64
40
- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
41
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
42
- ; CHECK: vector.memcheck:
38
+ ; CHECK-LABEL: define void @same_step_and_size_no_dominance_between_accesses(
39
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]], i64 [[X:%.*]]) {
40
+ ; CHECK-NEXT: [[ENTRY:.*:]]
41
+ ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B]] to i64
42
+ ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A]] to i64
43
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
44
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
45
+ ; CHECK: [[VECTOR_MEMCHECK]]:
43
46
; CHECK-NEXT: [[TMP0:%.*]] = sub i64 [[A1]], [[B2]]
44
47
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 16
45
- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
48
+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
46
49
;
47
50
entry:
48
51
br label %loop
@@ -72,19 +75,20 @@ exit:
72
75
}
73
76
74
77
define void @different_steps_and_different_access_sizes (ptr %a , ptr %b , i64 %n ) {
75
- ; CHECK-LABEL: @different_steps_and_different_access_sizes(
76
- ; CHECK-NEXT: entry:
77
- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
78
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
79
- ; CHECK: vector.memcheck:
80
- ; CHECK-NEXT: [[N_SHL_2:%.]] = shl i64 %n, 2
81
- ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr %b, i64 [[N_SHL_2]]
82
- ; CHECK-NEXT: [[N_SHL_1:%.]] = shl i64 %n, 1
83
- ; CHECK-NEXT: [[SCEVGEP4:%.*]] = getelementptr i8, ptr %a, i64 [[N_SHL_1]]
84
- ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr %b, [[SCEVGEP4]]
85
- ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr %a, [[SCEVGEP]]
78
+ ; CHECK-LABEL: define void @different_steps_and_different_access_sizes(
79
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
80
+ ; CHECK-NEXT: [[ENTRY:.*:]]
81
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
82
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
83
+ ; CHECK: [[VECTOR_MEMCHECK]]:
84
+ ; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[N]], 2
85
+ ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP0]]
86
+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[N]], 1
87
+ ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP1]]
88
+ ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[B]], [[SCEVGEP1]]
89
+ ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[A]], [[SCEVGEP]]
86
90
; CHECK-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
87
- ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], label %scalar.ph, label %vector.ph
91
+ ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
88
92
;
89
93
entry:
90
94
br label %loop
@@ -106,17 +110,18 @@ exit:
106
110
}
107
111
108
112
define void @steps_match_but_different_access_sizes_1 (ptr %a , ptr %b , i64 %n ) {
109
- ; CHECK-LABEL: @steps_match_but_different_access_sizes_1(
110
- ; CHECK-NEXT: entry:
111
- ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A:%.*]] to i64
112
- ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B:%.*]] to i64
113
- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
114
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
115
- ; CHECK: vector.memcheck:
113
+ ; CHECK-LABEL: define void @steps_match_but_different_access_sizes_1(
114
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
115
+ ; CHECK-NEXT: [[ENTRY:.*:]]
116
+ ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A]] to i64
117
+ ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B]] to i64
118
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
119
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
120
+ ; CHECK: [[VECTOR_MEMCHECK]]:
116
121
; CHECK-NEXT: [[TMP0:%.*]] = add i64 [[B1]], -2
117
122
; CHECK-NEXT: [[TMP1:%.*]] = sub i64 [[TMP0]], [[A2]]
118
123
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP1]], 16
119
- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
124
+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
120
125
;
121
126
entry:
122
127
br label %loop
@@ -140,17 +145,18 @@ exit:
140
145
; Same as @steps_match_but_different_access_sizes_1, but with source and sink
141
146
; accesses flipped.
142
147
define void @steps_match_but_different_access_sizes_2 (ptr %a , ptr %b , i64 %n ) {
143
- ; CHECK-LABEL: @steps_match_but_different_access_sizes_2(
144
- ; CHECK-NEXT: entry:
145
- ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B:%.*]] to i64
146
- ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A:%.*]] to i64
147
- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
148
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
149
- ; CHECK: vector.memcheck:
148
+ ; CHECK-LABEL: define void @steps_match_but_different_access_sizes_2(
149
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
150
+ ; CHECK-NEXT: [[ENTRY:.*:]]
151
+ ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B]] to i64
152
+ ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A]] to i64
153
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
154
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
155
+ ; CHECK: [[VECTOR_MEMCHECK]]:
150
156
; CHECK-NEXT: [[TMP0:%.*]] = add i64 [[A1]], 2
151
157
; CHECK-NEXT: [[TMP1:%.*]] = sub i64 [[TMP0]], [[B2]]
152
158
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP1]], 16
153
- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
159
+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
154
160
;
155
161
entry:
156
162
br label %loop
@@ -175,26 +181,29 @@ exit:
175
181
; one of the add-recs used is invariant in the inner loop.
176
182
; Test case for PR57315.
177
183
define void @nested_loop_outer_iv_addrec_invariant_in_inner1 (ptr %a , ptr %b , i64 %n ) {
178
- ; CHECK-LABEL: @nested_loop_outer_iv_addrec_invariant_in_inner1(
179
- ; CHECK: entry:
180
- ; CHECK-NEXT: [[N_SHL_2:%.]] = shl i64 %n, 2
181
- ; CHECK-NEXT: [[B_GEP_UPPER:%.*]] = getelementptr i8, ptr %b, i64 [[N_SHL_2]]
182
- ; CHECK-NEXT: br label %outer
183
-
184
- ; CHECK: outer.header:
185
- ; CHECK: [[OUTER_IV_SHL_2:%.]] = shl i64 %outer.iv, 2
186
- ; CHECK-NEXT: [[A_GEP_UPPER:%.*]] = getelementptr nuw i8, ptr %a, i64 [[OUTER_IV_SHL_2]]
187
- ; CHECK-NEXT: [[OUTER_IV_4:%.]] = add i64 [[OUTER_IV_SHL_2]], 4
188
- ; CHECK-NEXT: [[A_GEP_UPPER_4:%.*]] = getelementptr i8, ptr %a, i64 [[OUTER_IV_4]]
189
- ; CHECK: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
190
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
191
-
192
- ; CHECK: vector.memcheck:
193
- ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[A_GEP_UPPER]], [[B_GEP_UPPER]]
194
- ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr %b, [[A_GEP_UPPER_4]]
184
+ ; CHECK-LABEL: define void @nested_loop_outer_iv_addrec_invariant_in_inner1(
185
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
186
+ ; CHECK-NEXT: [[ENTRY:.*]]:
187
+ ; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[N]], 2
188
+ ; CHECK-NEXT: [[SCEVGEP2:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP0]]
189
+ ; CHECK-NEXT: br label %[[OUTER_HEADER:.*]]
190
+ ; CHECK: [[OUTER_HEADER]]:
191
+ ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ [[OUTER_IV_NEXT:%.*]], [[OUTER_LATCH:%.*]] ], [ 0, %[[ENTRY]] ]
192
+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[OUTER_IV]], 2
193
+ ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr nuw i8, ptr [[A]], i64 [[TMP1]]
194
+ ; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[TMP1]], 4
195
+ ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP2]]
196
+ ; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[OUTER_IV]]
197
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
198
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
199
+ ; CHECK: [[VECTOR_MEMCHECK]]:
200
+ ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[SCEVGEP]], [[SCEVGEP2]]
201
+ ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[B]], [[SCEVGEP1]]
195
202
; CHECK-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
196
- ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], label %scalar.ph, label %vector.ph
203
+ ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
197
204
;
205
+
206
+
198
207
entry:
199
208
br label %outer.header
200
209
@@ -225,26 +234,29 @@ exit:
225
234
; Same as @nested_loop_outer_iv_addrec_invariant_in_inner1 but with dependence
226
235
; sink and source swapped.
227
236
define void @nested_loop_outer_iv_addrec_invariant_in_inner2 (ptr %a , ptr %b , i64 %n ) {
228
- ; CHECK-LABEL: @nested_loop_outer_iv_addrec_invariant_in_inner2(
229
- ; CHECK: entry:
230
- ; CHECK-NEXT: [[N_SHL_2:%.]] = shl i64 %n, 2
231
- ; CHECK-NEXT: [[B_GEP_UPPER:%.*]] = getelementptr i8, ptr %b, i64 [[N_SHL_2]]
232
- ; CHECK-NEXT: br label %outer
233
-
234
- ; CHECK: outer.header:
235
- ; CHECK: [[OUTER_IV_SHL_2:%.]] = shl i64 %outer.iv, 2
236
- ; CHECK-NEXT: [[A_GEP_UPPER:%.*]] = getelementptr nuw i8, ptr %a, i64 [[OUTER_IV_SHL_2]]
237
- ; CHECK-NEXT: [[OUTER_IV_4:%.]] = add i64 [[OUTER_IV_SHL_2]], 4
238
- ; CHECK-NEXT: [[A_GEP_UPPER_4:%.*]] = getelementptr i8, ptr %a, i64 [[OUTER_IV_4]]
239
- ; CHECK: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
240
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
241
-
242
- ; CHECK: vector.memcheck:
243
- ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr %b, [[A_GEP_UPPER_4]]
244
- ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[A_GEP_UPPER]], [[B_GEP_UPPER]]
237
+ ; CHECK-LABEL: define void @nested_loop_outer_iv_addrec_invariant_in_inner2(
238
+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
239
+ ; CHECK-NEXT: [[ENTRY:.*]]:
240
+ ; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[N]], 2
241
+ ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP0]]
242
+ ; CHECK-NEXT: br label %[[OUTER_HEADER:.*]]
243
+ ; CHECK: [[OUTER_HEADER]]:
244
+ ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ [[OUTER_IV_NEXT:%.*]], [[OUTER_LATCH:%.*]] ], [ 0, %[[ENTRY]] ]
245
+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[OUTER_IV]], 2
246
+ ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr nuw i8, ptr [[A]], i64 [[TMP1]]
247
+ ; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[TMP1]], 4
248
+ ; CHECK-NEXT: [[SCEVGEP2:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP2]]
249
+ ; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[OUTER_IV]]
250
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
251
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
252
+ ; CHECK: [[VECTOR_MEMCHECK]]:
253
+ ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[B]], [[SCEVGEP2]]
254
+ ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[SCEVGEP1]], [[SCEVGEP]]
245
255
; CHECK-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
246
- ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], label %scalar.ph, label %vector.ph
256
+ ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
247
257
;
258
+
259
+
248
260
entry:
249
261
br label %outer.header
250
262
@@ -276,20 +288,21 @@ exit:
276
288
; of the outer loop as start value. It is sufficient to subtract the start
277
289
; values (%dst, %src) of the outer AddRecs.
278
290
define void @nested_loop_start_of_inner_ptr_addrec_is_same_outer_addrec (ptr nocapture noundef %dst , ptr nocapture noundef readonly %src , i64 noundef %m , i64 noundef %n ) {
279
- ; CHECK-LABEL: @nested_loop_start_of_inner_ptr_addrec_is_same_outer_addrec(
280
- ; CHECK-NEXT: entry:
281
- ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr [[SRC:%.*]] to i64
282
- ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr [[DST:%.*]] to i64
291
+ ; CHECK-LABEL: define void @nested_loop_start_of_inner_ptr_addrec_is_same_outer_addrec(
292
+ ; CHECK-SAME: ptr noundef captures(none) [[DST:%.*]], ptr noundef readonly captures(none) [[SRC:%.*]], i64 noundef [[M:%.*]], i64 noundef [[N:%.*]]) {
293
+ ; CHECK-NEXT: [[ENTRY:.*]]:
294
+ ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr [[SRC]] to i64
295
+ ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr [[DST]] to i64
283
296
; CHECK-NEXT: [[SUB:%.*]] = sub i64 [[DST1]], [[SRC2]]
284
- ; CHECK-NEXT: br label [[OUTER_LOOP:%.*]]
285
- ; CHECK: outer.loop:
286
- ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ 0, [[ENTRY:%.*]] ], [ [[OUTER_IV_NEXT:%.*]], [[INNER_EXIT:%.*]] ]
297
+ ; CHECK-NEXT: br label %[[OUTER_LOOP:.*]]
298
+ ; CHECK: [[OUTER_LOOP]]:
299
+ ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[OUTER_IV_NEXT:%.*]], [[INNER_EXIT:%.*]] ]
287
300
; CHECK-NEXT: [[MUL:%.*]] = mul nsw i64 [[OUTER_IV]], [[N]]
288
301
; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
289
- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[SCALAR_PH:%.*]], label [[VECTOR_MEMCHECK:%.*]]
290
- ; CHECK: vector.memcheck:
302
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
303
+ ; CHECK: [[VECTOR_MEMCHECK]]:
291
304
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[SUB]], 16
292
- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
305
+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
293
306
;
294
307
entry:
295
308
br label %outer.loop
@@ -321,15 +334,16 @@ outer.exit:
321
334
}
322
335
323
336
define void @use_diff_checks_when_retrying_with_rt_checks (i64 %off , ptr %dst , ptr %src ) {
324
- ; CHECK-LABEL: @use_diff_checks_when_retrying_with_rt_checks(
325
- ; CHECK-NEXT: entry:
326
- ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr %src to i64
327
- ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr %dst to i64
328
- ; CHECK-NEXT: br i1 false, label %scalar.ph, label %vector.memcheck
329
- ; CHECK: vector.memcheck:
330
- ; CHECK-NEXT: [[TMP0:%.*]] = mul i64 %off, -8
337
+ ; CHECK-LABEL: define void @use_diff_checks_when_retrying_with_rt_checks(
338
+ ; CHECK-SAME: i64 [[OFF:%.*]], ptr [[DST:%.*]], ptr [[SRC:%.*]]) {
339
+ ; CHECK-NEXT: [[ENTRY:.*:]]
340
+ ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr [[SRC]] to i64
341
+ ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr [[DST]] to i64
342
+ ; CHECK-NEXT: br i1 false, [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
343
+ ; CHECK: [[VECTOR_MEMCHECK]]:
344
+ ; CHECK-NEXT: [[TMP0:%.*]] = mul i64 [[OFF]], -8
331
345
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 32
332
- ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 %off, 3
346
+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[OFF]], 3
333
347
; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[DST1]], [[TMP1]]
334
348
; CHECK-NEXT: [[TMP3:%.*]] = sub i64 [[TMP2]], [[SRC2]]
335
349
; CHECK-NEXT: [[DIFF_CHECK3:%.*]] = icmp ult i64 [[TMP3]], 32
@@ -346,9 +360,7 @@ define void @use_diff_checks_when_retrying_with_rt_checks(i64 %off, ptr %dst, pt
346
360
; CHECK-NEXT: [[TMP9:%.*]] = sub i64 [[TMP8]], [[SRC2]]
347
361
; CHECK-NEXT: [[DIFF_CHECK8:%.*]] = icmp ult i64 [[TMP9]], 32
348
362
; CHECK-NEXT: [[CONFLICT_RDX9:%.*]] = or i1 [[CONFLICT_RDX7]], [[DIFF_CHECK8]]
349
- ; CHECK-NEXT: br i1 [[CONFLICT_RDX9]], label %scalar.ph, label %vector.ph
350
- ; CHECK: vector.ph:
351
- ; CHECK-NEXT: br label %vector.body
363
+ ; CHECK-NEXT: br i1 [[CONFLICT_RDX9]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
352
364
;
353
365
entry:
354
366
br label %loop
0 commit comments