1+ ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --filter-out-after "vector.ph" --version 5
12; RUN: opt %s -passes=loop-vectorize -hoist-runtime-checks=false -force-vector-width=4 -force-vector-interleave=1 -S | FileCheck %s
23
34target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
45
56define void @same_step_and_size (ptr %a , ptr %b , i64 %n ) {
6- ; CHECK-LABEL: @same_step_and_size(
7- ; CHECK-NEXT: entry:
8- ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A:%.*]] to i64
9- ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B:%.*]] to i64
10- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
11- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
12- ; CHECK: vector.memcheck:
7+ ; CHECK-LABEL: define void @same_step_and_size(
8+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
9+ ; CHECK-NEXT: [[ENTRY:.*:]]
10+ ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A]] to i64
11+ ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B]] to i64
12+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
13+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
14+ ; CHECK: [[VECTOR_MEMCHECK]]:
1315; CHECK-NEXT: [[TMP0:%.*]] = sub i64 [[B1]], [[A2]]
1416; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 16
15- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
17+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
1618;
1719entry:
1820 br label %loop
@@ -33,16 +35,17 @@ exit:
3335}
3436
3537define void @same_step_and_size_no_dominance_between_accesses (ptr %a , ptr %b , i64 %n , i64 %x ) {
36- ; CHECK-LABEL: @same_step_and_size_no_dominance_between_accesses(
37- ; CHECK-NEXT: entry:
38- ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B:%.*]] to i64
39- ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A:%.*]] to i64
40- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
41- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
42- ; CHECK: vector.memcheck:
38+ ; CHECK-LABEL: define void @same_step_and_size_no_dominance_between_accesses(
39+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]], i64 [[X:%.*]]) {
40+ ; CHECK-NEXT: [[ENTRY:.*:]]
41+ ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B]] to i64
42+ ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A]] to i64
43+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
44+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
45+ ; CHECK: [[VECTOR_MEMCHECK]]:
4346; CHECK-NEXT: [[TMP0:%.*]] = sub i64 [[A1]], [[B2]]
4447; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 16
45- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
48+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
4649;
4750entry:
4851 br label %loop
@@ -72,19 +75,20 @@ exit:
7275}
7376
7477define void @different_steps_and_different_access_sizes (ptr %a , ptr %b , i64 %n ) {
75- ; CHECK-LABEL: @different_steps_and_different_access_sizes(
76- ; CHECK-NEXT: entry:
77- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
78- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
79- ; CHECK: vector.memcheck:
80- ; CHECK-NEXT: [[N_SHL_2:%.]] = shl i64 %n, 2
81- ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr %b, i64 [[N_SHL_2]]
82- ; CHECK-NEXT: [[N_SHL_1:%.]] = shl i64 %n, 1
83- ; CHECK-NEXT: [[SCEVGEP4:%.*]] = getelementptr i8, ptr %a, i64 [[N_SHL_1]]
84- ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr %b, [[SCEVGEP4]]
85- ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr %a, [[SCEVGEP]]
78+ ; CHECK-LABEL: define void @different_steps_and_different_access_sizes(
79+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
80+ ; CHECK-NEXT: [[ENTRY:.*:]]
81+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
82+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
83+ ; CHECK: [[VECTOR_MEMCHECK]]:
84+ ; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[N]], 2
85+ ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP0]]
86+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[N]], 1
87+ ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP1]]
88+ ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[B]], [[SCEVGEP1]]
89+ ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[A]], [[SCEVGEP]]
8690; CHECK-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
87- ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], label %scalar.ph, label %vector.ph
91+ ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
8892;
8993entry:
9094 br label %loop
@@ -106,17 +110,18 @@ exit:
106110}
107111
108112define void @steps_match_but_different_access_sizes_1 (ptr %a , ptr %b , i64 %n ) {
109- ; CHECK-LABEL: @steps_match_but_different_access_sizes_1(
110- ; CHECK-NEXT: entry:
111- ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A:%.*]] to i64
112- ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B:%.*]] to i64
113- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
114- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
115- ; CHECK: vector.memcheck:
113+ ; CHECK-LABEL: define void @steps_match_but_different_access_sizes_1(
114+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
115+ ; CHECK-NEXT: [[ENTRY:.*:]]
116+ ; CHECK-NEXT: [[A2:%.*]] = ptrtoint ptr [[A]] to i64
117+ ; CHECK-NEXT: [[B1:%.*]] = ptrtoint ptr [[B]] to i64
118+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
119+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
120+ ; CHECK: [[VECTOR_MEMCHECK]]:
116121; CHECK-NEXT: [[TMP0:%.*]] = add i64 [[B1]], -2
117122; CHECK-NEXT: [[TMP1:%.*]] = sub i64 [[TMP0]], [[A2]]
118123; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP1]], 16
119- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
124+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
120125;
121126entry:
122127 br label %loop
@@ -140,17 +145,18 @@ exit:
; Same as @steps_match_but_different_access_sizes_1, but with source and sink
; accesses flipped.
142147define void @steps_match_but_different_access_sizes_2 (ptr %a , ptr %b , i64 %n ) {
143- ; CHECK-LABEL: @steps_match_but_different_access_sizes_2(
144- ; CHECK-NEXT: entry:
145- ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B:%.*]] to i64
146- ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A:%.*]] to i64
147- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
148- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
149- ; CHECK: vector.memcheck:
148+ ; CHECK-LABEL: define void @steps_match_but_different_access_sizes_2(
149+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
150+ ; CHECK-NEXT: [[ENTRY:.*:]]
151+ ; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B]] to i64
152+ ; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A]] to i64
153+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
154+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
155+ ; CHECK: [[VECTOR_MEMCHECK]]:
150156; CHECK-NEXT: [[TMP0:%.*]] = add i64 [[A1]], 2
151157; CHECK-NEXT: [[TMP1:%.*]] = sub i64 [[TMP0]], [[B2]]
152158; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP1]], 16
153- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label %scalar.ph, label %vector.ph
159+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
154160;
155161entry:
156162 br label %loop
@@ -175,26 +181,29 @@ exit:
; one of the add-recs used is invariant in the inner loop.
; Test case for PR57315.
177183define void @nested_loop_outer_iv_addrec_invariant_in_inner1 (ptr %a , ptr %b , i64 %n ) {
178- ; CHECK-LABEL: @nested_loop_outer_iv_addrec_invariant_in_inner1(
179- ; CHECK: entry:
180- ; CHECK-NEXT: [[N_SHL_2:%.]] = shl i64 %n, 2
181- ; CHECK-NEXT: [[B_GEP_UPPER:%.*]] = getelementptr i8, ptr %b, i64 [[N_SHL_2]]
182- ; CHECK-NEXT: br label %outer
183-
184- ; CHECK: outer.header:
185- ; CHECK: [[OUTER_IV_SHL_2:%.]] = shl i64 %outer.iv, 2
186- ; CHECK-NEXT: [[A_GEP_UPPER:%.*]] = getelementptr nuw i8, ptr %a, i64 [[OUTER_IV_SHL_2]]
187- ; CHECK-NEXT: [[OUTER_IV_4:%.]] = add i64 [[OUTER_IV_SHL_2]], 4
188- ; CHECK-NEXT: [[A_GEP_UPPER_4:%.*]] = getelementptr i8, ptr %a, i64 [[OUTER_IV_4]]
189- ; CHECK: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
190- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
191-
192- ; CHECK: vector.memcheck:
193- ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[A_GEP_UPPER]], [[B_GEP_UPPER]]
194- ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr %b, [[A_GEP_UPPER_4]]
184+ ; CHECK-LABEL: define void @nested_loop_outer_iv_addrec_invariant_in_inner1(
185+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
186+ ; CHECK-NEXT: [[ENTRY:.*]]:
187+ ; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[N]], 2
188+ ; CHECK-NEXT: [[SCEVGEP2:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP0]]
189+ ; CHECK-NEXT: br label %[[OUTER_HEADER:.*]]
190+ ; CHECK: [[OUTER_HEADER]]:
191+ ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ [[OUTER_IV_NEXT:%.*]], [[OUTER_LATCH:%.*]] ], [ 0, %[[ENTRY]] ]
192+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[OUTER_IV]], 2
193+ ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr nuw i8, ptr [[A]], i64 [[TMP1]]
194+ ; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[TMP1]], 4
195+ ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP2]]
196+ ; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[OUTER_IV]]
197+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
198+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
199+ ; CHECK: [[VECTOR_MEMCHECK]]:
200+ ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[SCEVGEP]], [[SCEVGEP2]]
201+ ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[B]], [[SCEVGEP1]]
195202; CHECK-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
196- ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], label %scalar.ph, label %vector.ph
203+ ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
197204;
205+
206+
198207entry:
199208 br label %outer.header
200209
@@ -225,26 +234,29 @@ exit:
; Same as @nested_loop_outer_iv_addrec_invariant_in_inner1 but with dependence
; sink and source swapped.
227236define void @nested_loop_outer_iv_addrec_invariant_in_inner2 (ptr %a , ptr %b , i64 %n ) {
228- ; CHECK-LABEL: @nested_loop_outer_iv_addrec_invariant_in_inner2(
229- ; CHECK: entry:
230- ; CHECK-NEXT: [[N_SHL_2:%.]] = shl i64 %n, 2
231- ; CHECK-NEXT: [[B_GEP_UPPER:%.*]] = getelementptr i8, ptr %b, i64 [[N_SHL_2]]
232- ; CHECK-NEXT: br label %outer
233-
234- ; CHECK: outer.header:
235- ; CHECK: [[OUTER_IV_SHL_2:%.]] = shl i64 %outer.iv, 2
236- ; CHECK-NEXT: [[A_GEP_UPPER:%.*]] = getelementptr nuw i8, ptr %a, i64 [[OUTER_IV_SHL_2]]
237- ; CHECK-NEXT: [[OUTER_IV_4:%.]] = add i64 [[OUTER_IV_SHL_2]], 4
238- ; CHECK-NEXT: [[A_GEP_UPPER_4:%.*]] = getelementptr i8, ptr %a, i64 [[OUTER_IV_4]]
239- ; CHECK: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N:%.*]], 4
240- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %scalar.ph, label %vector.memcheck
241-
242- ; CHECK: vector.memcheck:
243- ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr %b, [[A_GEP_UPPER_4]]
244- ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[A_GEP_UPPER]], [[B_GEP_UPPER]]
237+ ; CHECK-LABEL: define void @nested_loop_outer_iv_addrec_invariant_in_inner2(
238+ ; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], i64 [[N:%.*]]) {
239+ ; CHECK-NEXT: [[ENTRY:.*]]:
240+ ; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[N]], 2
241+ ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP0]]
242+ ; CHECK-NEXT: br label %[[OUTER_HEADER:.*]]
243+ ; CHECK: [[OUTER_HEADER]]:
244+ ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ [[OUTER_IV_NEXT:%.*]], [[OUTER_LATCH:%.*]] ], [ 0, %[[ENTRY]] ]
245+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[OUTER_IV]], 2
246+ ; CHECK-NEXT: [[SCEVGEP1:%.*]] = getelementptr nuw i8, ptr [[A]], i64 [[TMP1]]
247+ ; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[TMP1]], 4
248+ ; CHECK-NEXT: [[SCEVGEP2:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP2]]
249+ ; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[OUTER_IV]]
250+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
251+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
252+ ; CHECK: [[VECTOR_MEMCHECK]]:
253+ ; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[B]], [[SCEVGEP2]]
254+ ; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[SCEVGEP1]], [[SCEVGEP]]
245255; CHECK-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
246- ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], label %scalar.ph, label %vector.ph
256+ ; CHECK-NEXT: br i1 [[FOUND_CONFLICT]], [[SCALAR_PH]], [[VECTOR_PH: label %.*]]
247257;
258+
259+
248260entry:
249261 br label %outer.header
250262
@@ -276,20 +288,21 @@ exit:
; of the outer loop as start value. It is sufficient to subtract the start
; values (%dst, %src) of the outer AddRecs.
278290define void @nested_loop_start_of_inner_ptr_addrec_is_same_outer_addrec (ptr nocapture noundef %dst , ptr nocapture noundef readonly %src , i64 noundef %m , i64 noundef %n ) {
279- ; CHECK-LABEL: @nested_loop_start_of_inner_ptr_addrec_is_same_outer_addrec(
280- ; CHECK-NEXT: entry:
281- ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr [[SRC:%.*]] to i64
282- ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr [[DST:%.*]] to i64
291+ ; CHECK-LABEL: define void @nested_loop_start_of_inner_ptr_addrec_is_same_outer_addrec(
292+ ; CHECK-SAME: ptr noundef captures(none) [[DST:%.*]], ptr noundef readonly captures(none) [[SRC:%.*]], i64 noundef [[M:%.*]], i64 noundef [[N:%.*]]) {
293+ ; CHECK-NEXT: [[ENTRY:.*]]:
294+ ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr [[SRC]] to i64
295+ ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr [[DST]] to i64
283296; CHECK-NEXT: [[SUB:%.*]] = sub i64 [[DST1]], [[SRC2]]
284- ; CHECK-NEXT: br label [[OUTER_LOOP:% .*]]
285- ; CHECK: outer.loop :
286- ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ 0, [[ENTRY:%.* ]] ], [ [[OUTER_IV_NEXT:%.*]], [[INNER_EXIT:%.*]] ]
297+ ; CHECK-NEXT: br label % [[OUTER_LOOP:.*]]
298+ ; CHECK: [[OUTER_LOOP]] :
299+ ; CHECK-NEXT: [[OUTER_IV:%.*]] = phi i64 [ 0, % [[ENTRY]] ], [ [[OUTER_IV_NEXT:%.*]], [[INNER_EXIT:%.*]] ]
287300; CHECK-NEXT: [[MUL:%.*]] = mul nsw i64 [[OUTER_IV]], [[N]]
288301; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 4
289- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[SCALAR_PH:%.*]], label [[VECTOR_MEMCHECK:% .*]]
290- ; CHECK: vector.memcheck :
302+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], [[SCALAR_PH:label %.*]], label % [[VECTOR_MEMCHECK:.*]]
303+ ; CHECK: [[VECTOR_MEMCHECK]] :
291304; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[SUB]], 16
292- ; CHECK-NEXT: br i1 [[DIFF_CHECK]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
305+ ; CHECK-NEXT: br i1 [[DIFF_CHECK]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
293306;
294307entry:
295308 br label %outer.loop
@@ -321,15 +334,16 @@ outer.exit:
321334}
322335
323336define void @use_diff_checks_when_retrying_with_rt_checks (i64 %off , ptr %dst , ptr %src ) {
324- ; CHECK-LABEL: @use_diff_checks_when_retrying_with_rt_checks(
325- ; CHECK-NEXT: entry:
326- ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr %src to i64
327- ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr %dst to i64
328- ; CHECK-NEXT: br i1 false, label %scalar.ph, label %vector.memcheck
329- ; CHECK: vector.memcheck:
330- ; CHECK-NEXT: [[TMP0:%.*]] = mul i64 %off, -8
337+ ; CHECK-LABEL: define void @use_diff_checks_when_retrying_with_rt_checks(
338+ ; CHECK-SAME: i64 [[OFF:%.*]], ptr [[DST:%.*]], ptr [[SRC:%.*]]) {
339+ ; CHECK-NEXT: [[ENTRY:.*:]]
340+ ; CHECK-NEXT: [[SRC2:%.*]] = ptrtoint ptr [[SRC]] to i64
341+ ; CHECK-NEXT: [[DST1:%.*]] = ptrtoint ptr [[DST]] to i64
342+ ; CHECK-NEXT: br i1 false, [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
343+ ; CHECK: [[VECTOR_MEMCHECK]]:
344+ ; CHECK-NEXT: [[TMP0:%.*]] = mul i64 [[OFF]], -8
331345; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 32
332- ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 %off , 3
346+ ; CHECK-NEXT: [[TMP1:%.*]] = shl i64 [[OFF]] , 3
333347; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[DST1]], [[TMP1]]
334348; CHECK-NEXT: [[TMP3:%.*]] = sub i64 [[TMP2]], [[SRC2]]
335349; CHECK-NEXT: [[DIFF_CHECK3:%.*]] = icmp ult i64 [[TMP3]], 32
@@ -346,9 +360,7 @@ define void @use_diff_checks_when_retrying_with_rt_checks(i64 %off, ptr %dst, pt
346360; CHECK-NEXT: [[TMP9:%.*]] = sub i64 [[TMP8]], [[SRC2]]
347361; CHECK-NEXT: [[DIFF_CHECK8:%.*]] = icmp ult i64 [[TMP9]], 32
348362; CHECK-NEXT: [[CONFLICT_RDX9:%.*]] = or i1 [[CONFLICT_RDX7]], [[DIFF_CHECK8]]
349- ; CHECK-NEXT: br i1 [[CONFLICT_RDX9]], label %scalar.ph, label %vector.ph
350- ; CHECK: vector.ph:
351- ; CHECK-NEXT: br label %vector.body
363+ ; CHECK-NEXT: br i1 [[CONFLICT_RDX9]], [[SCALAR_PH]], [[VECTOR_PH:label %.*]]
352364;
353365entry:
354366 br label %loop
0 commit comments