|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
2 | | -; RUN: opt -passes=loop-idiom -S %s | FileCheck %s |
| 2 | +; RUN: opt -passes=loop-idiom -enable-loop-idiom-version=0 -S %s | FileCheck %s --check-prefix=CHECK-NO-VERSION |
| 3 | +; RUN: opt -passes=loop-idiom -S %s | FileCheck %s --check-prefix=CHECK-VERSION |
3 | 4 |
|
4 | 5 | ; Make sure we do not delete instructions not inserted during expansion, e.g. |
5 | | -; because the expande re-used existing instructions. |
| 6 | +; because the expander re-used existing instructions. |
6 | 7 |
|
7 | 8 | define void @test(i64 %init, ptr %ptr) { |
8 | | -; CHECK-LABEL: @test( |
9 | | -; CHECK-NEXT: entry: |
10 | | -; CHECK-NEXT: br label [[OUTER_HEADER:%.*]] |
11 | | -; CHECK: outer.header: |
12 | | -; CHECK-NEXT: [[J_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[OUTER_LATCH:%.*]] ] |
13 | | -; CHECK-NEXT: [[I_0:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[ADD:%.*]], [[OUTER_LATCH]] ] |
14 | | -; CHECK-NEXT: [[ADD_PTR:%.*]] = getelementptr inbounds float, ptr [[PTR:%.*]], i32 [[I_0]] |
15 | | -; CHECK-NEXT: br label [[INNER:%.*]] |
16 | | -; CHECK: inner: |
17 | | -; CHECK-NEXT: [[INNER_IV:%.*]] = phi i64 [ [[INNER_IV_NEXT:%.*]], [[INNER]] ], [ [[INIT:%.*]], [[OUTER_HEADER]] ] |
18 | | -; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds float, ptr [[PTR]], i64 [[INNER_IV]] |
19 | | -; CHECK-NEXT: [[TMP1:%.*]] = load i32, ptr [[ARRAYIDX]], align 4 |
20 | | -; CHECK-NEXT: [[ARRAYIDX3:%.*]] = getelementptr inbounds float, ptr [[ADD_PTR]], i64 [[INNER_IV]] |
21 | | -; CHECK-NEXT: store i32 [[TMP1]], ptr [[ARRAYIDX3]], align 4 |
22 | | -; CHECK-NEXT: [[INNER_IV_NEXT]] = add nsw i64 [[INNER_IV]], 1 |
23 | | -; CHECK-NEXT: [[EC_1:%.*]] = icmp eq i64 [[INNER_IV_NEXT]], 0 |
24 | | -; CHECK-NEXT: br i1 [[EC_1]], label [[OUTER_LATCH]], label [[INNER]] |
25 | | -; CHECK: outer.latch: |
26 | | -; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[J_0]], 1 |
27 | | -; CHECK-NEXT: [[ADD]] = add nuw nsw i32 [[I_0]], [[INC]] |
28 | | -; CHECK-NEXT: [[EC_2:%.*]] = icmp eq i32 [[ADD]], 4000 |
29 | | -; CHECK-NEXT: br i1 [[EC_2]], label [[EXIT:%.*]], label [[OUTER_HEADER]] |
30 | | -; CHECK: exit: |
31 | | -; CHECK-NEXT: ret void |
| 9 | +; CHECK-NO-VERSION-LABEL: @test( |
| 10 | +; CHECK-NO-VERSION-NEXT: entry: |
| 11 | +; CHECK-NO-VERSION-NEXT: br label [[OUTER_HEADER:%.*]] |
| 12 | +; CHECK-NO-VERSION: outer.header: |
| 13 | +; CHECK-NO-VERSION-NEXT: [[J_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[OUTER_LATCH:%.*]] ] |
| 14 | +; CHECK-NO-VERSION-NEXT: [[I_0:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[ADD:%.*]], [[OUTER_LATCH]] ] |
| 15 | +; CHECK-NO-VERSION-NEXT: [[ADD_PTR:%.*]] = getelementptr inbounds float, ptr [[PTR:%.*]], i32 [[I_0]] |
| 16 | +; CHECK-NO-VERSION-NEXT: br label [[INNER:%.*]] |
| 17 | +; CHECK-NO-VERSION: inner: |
| 18 | +; CHECK-NO-VERSION-NEXT: [[INNER_IV:%.*]] = phi i64 [ [[INNER_IV_NEXT:%.*]], [[INNER]] ], [ [[INIT:%.*]], [[OUTER_HEADER]] ] |
| 19 | +; CHECK-NO-VERSION-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds float, ptr [[PTR]], i64 [[INNER_IV]] |
| 20 | +; CHECK-NO-VERSION-NEXT: [[TMP0:%.*]] = load i32, ptr [[ARRAYIDX]], align 4 |
| 21 | +; CHECK-NO-VERSION-NEXT: [[ARRAYIDX3:%.*]] = getelementptr inbounds float, ptr [[ADD_PTR]], i64 [[INNER_IV]] |
| 22 | +; CHECK-NO-VERSION-NEXT: store i32 [[TMP0]], ptr [[ARRAYIDX3]], align 4 |
| 23 | +; CHECK-NO-VERSION-NEXT: [[INNER_IV_NEXT]] = add nsw i64 [[INNER_IV]], 1 |
| 24 | +; CHECK-NO-VERSION-NEXT: [[EC_1:%.*]] = icmp eq i64 [[INNER_IV_NEXT]], 0 |
| 25 | +; CHECK-NO-VERSION-NEXT: br i1 [[EC_1]], label [[OUTER_LATCH]], label [[INNER]] |
| 26 | +; CHECK-NO-VERSION: outer.latch: |
| 27 | +; CHECK-NO-VERSION-NEXT: [[INC]] = add nuw nsw i32 [[J_0]], 1 |
| 28 | +; CHECK-NO-VERSION-NEXT: [[ADD]] = add nuw nsw i32 [[I_0]], [[INC]] |
| 29 | +; CHECK-NO-VERSION-NEXT: [[EC_2:%.*]] = icmp eq i32 [[ADD]], 4000 |
| 30 | +; CHECK-NO-VERSION-NEXT: br i1 [[EC_2]], label [[EXIT:%.*]], label [[OUTER_HEADER]] |
| 31 | +; CHECK-NO-VERSION: exit: |
| 32 | +; CHECK-NO-VERSION-NEXT: ret void |
| 33 | +; |
| 34 | +; CHECK-VERSION-LABEL: @test( |
| 35 | +; CHECK-VERSION-NEXT: entry: |
| 36 | +; CHECK-VERSION-NEXT: [[TMP0:%.*]] = shl i64 [[INIT:%.*]], 2 |
| 37 | +; CHECK-VERSION-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[PTR:%.*]], i64 [[TMP0]] |
| 38 | +; CHECK-VERSION-NEXT: [[SCEVGEP2:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[TMP0]] |
| 39 | +; CHECK-VERSION-NEXT: [[TMP9:%.*]] = sub i64 -1, [[INIT]] |
| 40 | +; CHECK-VERSION-NEXT: [[TMP1:%.*]] = mul i64 [[INIT]], -4 |
| 41 | +; CHECK-VERSION-NEXT: br label [[INNER_LVER_CHECK:%.*]] |
| 42 | +; CHECK-VERSION: inner.lver.check: |
| 43 | +; CHECK-VERSION-NEXT: [[J_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[OUTER_LATCH:%.*]] ] |
| 44 | +; CHECK-VERSION-NEXT: [[I_0:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[ADD:%.*]], [[OUTER_LATCH]] ] |
| 45 | +; CHECK-VERSION-NEXT: [[TMP2:%.*]] = sext i32 [[I_0]] to i64 |
| 46 | +; CHECK-VERSION-NEXT: [[TMP3:%.*]] = shl nsw i64 [[TMP2]], 2 |
| 47 | +; CHECK-VERSION-NEXT: [[SCEVGEP3:%.*]] = getelementptr i8, ptr [[SCEVGEP2]], i64 [[TMP3]] |
| 48 | +; CHECK-VERSION-NEXT: [[SCEVGEP4:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[TMP3]] |
| 49 | +; CHECK-VERSION-NEXT: [[TMP4:%.*]] = sext i32 [[I_0]] to i64 |
| 50 | +; CHECK-VERSION-NEXT: [[TMP5:%.*]] = shl nsw i64 [[TMP4]], 2 |
| 51 | +; CHECK-VERSION-NEXT: [[SCEVGEP1:%.*]] = getelementptr i8, ptr [[SCEVGEP]], i64 [[TMP5]] |
| 52 | +; CHECK-VERSION-NEXT: [[ADD_PTR:%.*]] = getelementptr inbounds float, ptr [[PTR]], i32 [[I_0]] |
| 53 | +; CHECK-VERSION-NEXT: [[BOUND0:%.*]] = icmp ult ptr [[SCEVGEP3]], [[PTR]] |
| 54 | +; CHECK-VERSION-NEXT: [[BOUND1:%.*]] = icmp ult ptr [[SCEVGEP2]], [[SCEVGEP4]] |
| 55 | +; CHECK-VERSION-NEXT: [[FOUND_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]] |
| 56 | +; CHECK-VERSION-NEXT: [[TMP10:%.*]] = icmp slt i64 [[TMP9]], 12 |
| 57 | +; CHECK-VERSION-NEXT: [[TMP8:%.*]] = or i1 [[FOUND_CONFLICT]], [[TMP10]] |
| 58 | +; CHECK-VERSION-NEXT: br i1 [[TMP8]], label [[INNER_PH_LVER_ORIG:%.*]], label [[INNER_PH:%.*]] |
| 59 | +; CHECK-VERSION: inner.ph.lver.orig: |
| 60 | +; CHECK-VERSION-NEXT: br label [[INNER_LVER_ORIG:%.*]] |
| 61 | +; CHECK-VERSION: inner.lver.orig: |
| 62 | +; CHECK-VERSION-NEXT: [[INNER_IV_LVER_ORIG:%.*]] = phi i64 [ [[INNER_IV_NEXT_LVER_ORIG:%.*]], [[INNER_LVER_ORIG]] ], [ [[INIT]], [[INNER_PH_LVER_ORIG]] ] |
| 63 | +; CHECK-VERSION-NEXT: [[ARRAYIDX_LVER_ORIG:%.*]] = getelementptr inbounds float, ptr [[PTR]], i64 [[INNER_IV_LVER_ORIG]] |
| 64 | +; CHECK-VERSION-NEXT: [[TMP6:%.*]] = load i32, ptr [[ARRAYIDX_LVER_ORIG]], align 4 |
| 65 | +; CHECK-VERSION-NEXT: [[ARRAYIDX3_LVER_ORIG:%.*]] = getelementptr inbounds float, ptr [[ADD_PTR]], i64 [[INNER_IV_LVER_ORIG]] |
| 66 | +; CHECK-VERSION-NEXT: store i32 [[TMP6]], ptr [[ARRAYIDX3_LVER_ORIG]], align 4 |
| 67 | +; CHECK-VERSION-NEXT: [[INNER_IV_NEXT_LVER_ORIG]] = add nsw i64 [[INNER_IV_LVER_ORIG]], 1 |
| 68 | +; CHECK-VERSION-NEXT: [[EC_1_LVER_ORIG:%.*]] = icmp eq i64 [[INNER_IV_NEXT_LVER_ORIG]], 0 |
| 69 | +; CHECK-VERSION-NEXT: br i1 [[EC_1_LVER_ORIG]], label [[OUTER_LATCH_LOOPEXIT:%.*]], label [[INNER_LVER_ORIG]] |
| 70 | +; CHECK-VERSION: inner.ph: |
| 71 | +; CHECK-VERSION-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr align 4 [[SCEVGEP1]], ptr align 4 [[SCEVGEP]], i64 [[TMP1]], i1 false) |
| 72 | +; CHECK-VERSION-NEXT: br label [[INNER:%.*]] |
| 73 | +; CHECK-VERSION: inner: |
| 74 | +; CHECK-VERSION-NEXT: [[INNER_IV:%.*]] = phi i64 [ [[INNER_IV_NEXT:%.*]], [[INNER]] ], [ [[INIT]], [[INNER_PH]] ] |
| 75 | +; CHECK-VERSION-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds float, ptr [[PTR]], i64 [[INNER_IV]] |
| 76 | +; CHECK-VERSION-NEXT: [[TMP7:%.*]] = load i32, ptr [[ARRAYIDX]], align 4 |
| 77 | +; CHECK-VERSION-NEXT: [[ARRAYIDX3:%.*]] = getelementptr inbounds float, ptr [[ADD_PTR]], i64 [[INNER_IV]] |
| 78 | +; CHECK-VERSION-NEXT: [[INNER_IV_NEXT]] = add nsw i64 [[INNER_IV]], 1 |
| 79 | +; CHECK-VERSION-NEXT: [[EC_1:%.*]] = icmp eq i64 [[INNER_IV_NEXT]], 0 |
| 80 | +; CHECK-VERSION-NEXT: br i1 [[EC_1]], label [[OUTER_LATCH_LOOPEXIT5:%.*]], label [[INNER]] |
| 81 | +; CHECK-VERSION: outer.latch.loopexit: |
| 82 | +; CHECK-VERSION-NEXT: br label [[OUTER_LATCH]] |
| 83 | +; CHECK-VERSION: outer.latch.loopexit5: |
| 84 | +; CHECK-VERSION-NEXT: br label [[OUTER_LATCH]] |
| 85 | +; CHECK-VERSION: outer.latch: |
| 86 | +; CHECK-VERSION-NEXT: [[INC]] = add nuw nsw i32 [[J_0]], 1 |
| 87 | +; CHECK-VERSION-NEXT: [[ADD]] = add nuw nsw i32 [[I_0]], [[INC]] |
| 88 | +; CHECK-VERSION-NEXT: [[EC_2:%.*]] = icmp eq i32 [[ADD]], 4000 |
| 89 | +; CHECK-VERSION-NEXT: br i1 [[EC_2]], label [[EXIT:%.*]], label [[INNER_LVER_CHECK]] |
| 90 | +; CHECK-VERSION: exit: |
| 91 | +; CHECK-VERSION-NEXT: ret void |
32 | 92 | ; |
33 | 93 | entry: |
34 | 94 | br label %outer.header |
|
0 commit comments