Skip to content

Commit 7629e01

Browse files
committed
[InstCombine,PhaseOrder] Add additional tests with align assumptions.
1 parent 48d0ef1 commit 7629e01

File tree

2 files changed

+202
-0
lines changed

2 files changed

+202
-0
lines changed

llvm/test/Transforms/InstCombine/assume-align.ll

Lines changed: 82 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -171,3 +171,85 @@ define ptr @dont_fold_assume_align_zero_of_loaded_pointer_into_align_metadata(pt
171171
call void @llvm.assume(i1 true) [ "align"(ptr %p2, i64 0) ]
172172
ret ptr %p2
173173
}
174+
175+
define ptr @redundant_assume_align_1(ptr %p) {
176+
; CHECK-LABEL: @redundant_assume_align_1(
177+
; CHECK-NEXT: [[P2:%.*]] = load ptr, ptr [[P:%.*]], align 8
178+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P2]], i32 1) ]
179+
; CHECK-NEXT: call void @foo(ptr [[P2]])
180+
; CHECK-NEXT: ret ptr [[P2]]
181+
;
182+
%p2 = load ptr, ptr %p
183+
call void @llvm.assume(i1 true) [ "align"(ptr %p2, i32 1) ]
184+
call void @foo(ptr %p2)
185+
ret ptr %p2
186+
}
187+
188+
189+
define ptr @redundant_assume_align_8_via_align_metadata(ptr %p) {
190+
; CHECK-LABEL: @redundant_assume_align_8_via_align_metadata(
191+
; CHECK-NEXT: [[P2:%.*]] = load ptr, ptr [[P:%.*]], align 8, !align [[META0:![0-9]+]]
192+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P2]], i32 8) ]
193+
; CHECK-NEXT: call void @foo(ptr [[P2]])
194+
; CHECK-NEXT: ret ptr [[P2]]
195+
;
196+
%p2 = load ptr, ptr %p, !align !{i64 8}
197+
call void @llvm.assume(i1 true) [ "align"(ptr %p2, i32 8) ]
198+
call void @foo(ptr %p2)
199+
ret ptr %p2
200+
}
201+
202+
define ptr @assume_align_16_via_align_metadata(ptr %p) {
203+
; CHECK-LABEL: @assume_align_16_via_align_metadata(
204+
; CHECK-NEXT: [[P2:%.*]] = load ptr, ptr [[P:%.*]], align 8, !align [[META0]]
205+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P2]], i32 16) ]
206+
; CHECK-NEXT: call void @foo(ptr [[P2]])
207+
; CHECK-NEXT: ret ptr [[P2]]
208+
;
209+
%p2 = load ptr, ptr %p, !align !{i64 8}
210+
call void @llvm.assume(i1 true) [ "align"(ptr %p2, i32 16) ]
211+
call void @foo(ptr %p2)
212+
ret ptr %p2
213+
}
214+
215+
define ptr @redundant_assume_align_8_via_align_attribute(ptr align 8 %p) {
216+
; CHECK-LABEL: @redundant_assume_align_8_via_align_attribute(
217+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P:%.*]], i32 8) ]
218+
; CHECK-NEXT: call void @foo(ptr [[P]])
219+
; CHECK-NEXT: ret ptr [[P]]
220+
;
221+
call void @llvm.assume(i1 true) [ "align"(ptr %p, i32 8) ]
222+
call void @foo(ptr %p)
223+
ret ptr %p
224+
}
225+
226+
define ptr @assume_align_16_via_align_attribute(ptr align 8 %p) {
227+
; CHECK-LABEL: @assume_align_16_via_align_attribute(
228+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P:%.*]], i32 16) ]
229+
; CHECK-NEXT: call void @foo(ptr [[P]])
230+
; CHECK-NEXT: ret ptr [[P]]
231+
;
232+
call void @llvm.assume(i1 true) [ "align"(ptr %p, i32 16) ]
233+
call void @foo(ptr %p)
234+
ret ptr %p
235+
}
236+
237+
define ptr @redundant_assume_align_8_via_asume(ptr %p) {
238+
; CHECK-LABEL: @redundant_assume_align_8_via_asume(
239+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P:%.*]], i32 16) ]
240+
; CHECK-NEXT: call void @foo(ptr [[P]])
241+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P]], i32 8) ]
242+
; CHECK-NEXT: call void @foo(ptr [[P]])
243+
; CHECK-NEXT: ret ptr [[P]]
244+
;
245+
call void @llvm.assume(i1 true) [ "align"(ptr %p, i32 16) ]
246+
call void @foo(ptr %p)
247+
call void @llvm.assume(i1 true) [ "align"(ptr %p, i32 8) ]
248+
call void @foo(ptr %p)
249+
ret ptr %p
250+
}
251+
252+
declare void @foo(ptr)
253+
;.
254+
; CHECK: [[META0]] = !{i64 8}
255+
;.
Lines changed: 120 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,120 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt -passes='default<O3>' -S %s | FileCheck %s
3+
4+
target triple = "arm64-apple-macosx"
5+
6+
declare void @llvm.assume(i1 noundef)
7+
8+
define i32 @earlycse_entry(ptr %p) {
9+
; CHECK-LABEL: define i32 @earlycse_entry(
10+
; CHECK-SAME: ptr nocapture [[P:%.*]]) local_unnamed_addr {
11+
; CHECK-NEXT: [[L_I:%.*]] = load ptr, ptr [[P]], align 8
12+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[L_I]], i64 4) ]
13+
; CHECK-NEXT: [[L_ASSUME_ALIGNED_I_I:%.*]] = load i32, ptr [[L_I]], align 4
14+
; CHECK-NEXT: [[R_I_I:%.*]] = tail call i32 @swap(i32 [[L_ASSUME_ALIGNED_I_I]])
15+
; CHECK-NEXT: [[L_2_I:%.*]] = load ptr, ptr [[P]], align 8
16+
; CHECK-NEXT: [[GEP_I:%.*]] = getelementptr i8, ptr [[L_2_I]], i64 4
17+
; CHECK-NEXT: store ptr [[GEP_I]], ptr [[P]], align 8
18+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[GEP_I]], i64 4) ]
19+
; CHECK-NEXT: [[L_ASSUME_ALIGNED_I_I2:%.*]] = load i32, ptr [[GEP_I]], align 4
20+
; CHECK-NEXT: [[R_I_I3:%.*]] = tail call i32 @swap(i32 [[L_ASSUME_ALIGNED_I_I2]])
21+
; CHECK-NEXT: [[L_2_I4:%.*]] = load ptr, ptr [[P]], align 8
22+
; CHECK-NEXT: [[GEP_I5:%.*]] = getelementptr i8, ptr [[L_2_I4]], i64 4
23+
; CHECK-NEXT: store ptr [[GEP_I5]], ptr [[P]], align 8
24+
; CHECK-NEXT: ret i32 [[R_I_I3]]
25+
;
26+
%r.1 = call i32 @earlycse_fn1(ptr %p)
27+
%r.2 = call i32 @earlycse_fn1(ptr %p)
28+
ret i32 %r.2
29+
}
30+
31+
define i32 @earlycse_fn1(ptr %p) {
32+
; CHECK-LABEL: define i32 @earlycse_fn1(
33+
; CHECK-SAME: ptr nocapture [[P:%.*]]) local_unnamed_addr {
34+
; CHECK-NEXT: [[L:%.*]] = load ptr, ptr [[P]], align 8
35+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[L]], i64 4) ]
36+
; CHECK-NEXT: [[L_ASSUME_ALIGNED_I:%.*]] = load i32, ptr [[L]], align 4
37+
; CHECK-NEXT: [[R_I:%.*]] = tail call i32 @swap(i32 [[L_ASSUME_ALIGNED_I]])
38+
; CHECK-NEXT: [[L_2:%.*]] = load ptr, ptr [[P]], align 8
39+
; CHECK-NEXT: [[GEP:%.*]] = getelementptr i8, ptr [[L_2]], i64 4
40+
; CHECK-NEXT: store ptr [[GEP]], ptr [[P]], align 8
41+
; CHECK-NEXT: ret i32 [[R_I]]
42+
;
43+
%l = load ptr, ptr %p, align 8
44+
%r = call i32 @load_assume_aligned(ptr %l)
45+
%l.2 = load ptr, ptr %p, align 8
46+
%gep = getelementptr i8, ptr %l.2, i64 4
47+
store ptr %gep, ptr %p, align 8
48+
ret i32 %r
49+
}
50+
51+
define i32 @load_assume_aligned(ptr %p) {
52+
; CHECK-LABEL: define i32 @load_assume_aligned(
53+
; CHECK-SAME: ptr [[P:%.*]]) local_unnamed_addr {
54+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P]], i64 4) ]
55+
; CHECK-NEXT: [[DOT0_COPYLOAD:%.*]] = load i32, ptr [[P]], align 4
56+
; CHECK-NEXT: [[TMP2:%.*]] = tail call i32 @swap(i32 [[DOT0_COPYLOAD]])
57+
; CHECK-NEXT: ret i32 [[TMP2]]
58+
;
59+
call void @llvm.assume(i1 true) [ "align"(ptr %p, i64 4) ]
60+
%l.assume_aligned = load i32, ptr %p, align 1
61+
%r = call i32 @swap(i32 %l.assume_aligned)
62+
ret i32 %r
63+
}
64+
65+
declare i32 @swap(i32)
66+
67+
define void @sroa_align_entry(ptr %p) {
68+
; CHECK-LABEL: define void @sroa_align_entry(
69+
; CHECK-SAME: ptr [[P:%.*]]) local_unnamed_addr #[[ATTR1:[0-9]+]] {
70+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P]], i64 8) ]
71+
; CHECK-NEXT: [[DOT0_COPYLOAD_I_I_I:%.*]] = load i64, ptr [[P]], align 8
72+
; CHECK-NEXT: [[TMP2:%.*]] = inttoptr i64 [[DOT0_COPYLOAD_I_I_I]] to ptr
73+
; CHECK-NEXT: store i32 0, ptr [[TMP2]], align 4
74+
; CHECK-NEXT: ret void
75+
;
76+
%a = alloca ptr, align 8
77+
store ptr %p, ptr %a, align 8
78+
%r = call ptr @sroa_fn1(ptr %a)
79+
store i32 0, ptr %r, align 4
80+
ret void
81+
}
82+
83+
define ptr @sroa_fn1(ptr %p) {
84+
; CHECK-LABEL: define ptr @sroa_fn1(
85+
; CHECK-SAME: ptr nocapture readonly [[P:%.*]]) local_unnamed_addr #[[ATTR2:[0-9]+]] {
86+
; CHECK-NEXT: [[L:%.*]] = load ptr, ptr [[P]], align 8
87+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[L]], i64 8) ]
88+
; CHECK-NEXT: [[L_FN3_I_I:%.*]] = load i64, ptr [[L]], align 8
89+
; CHECK-NEXT: [[I_I:%.*]] = inttoptr i64 [[L_FN3_I_I]] to ptr
90+
; CHECK-NEXT: ret ptr [[I_I]]
91+
;
92+
%l = load ptr, ptr %p, align 8
93+
%r = call ptr @sroa_fn2(ptr %l)
94+
ret ptr %r
95+
}
96+
97+
define ptr @sroa_fn2(ptr %p) {
98+
; CHECK-LABEL: define ptr @sroa_fn2(
99+
; CHECK-SAME: ptr [[P:%.*]]) local_unnamed_addr #[[ATTR3:[0-9]+]] {
100+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[P]], i64 8) ]
101+
; CHECK-NEXT: [[DOT0_COPYLOAD_I_I:%.*]] = load i64, ptr [[P]], align 8
102+
; CHECK-NEXT: [[TMP3:%.*]] = inttoptr i64 [[DOT0_COPYLOAD_I_I]] to ptr
103+
; CHECK-NEXT: ret ptr [[TMP3]]
104+
;
105+
%r = call i64 @sroa_fn3(ptr %p)
106+
%i = inttoptr i64 %r to ptr
107+
ret ptr %i
108+
}
109+
110+
define i64 @sroa_fn3(ptr %0) {
111+
; CHECK-LABEL: define i64 @sroa_fn3(
112+
; CHECK-SAME: ptr [[TMP0:%.*]]) local_unnamed_addr #[[ATTR3]] {
113+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[TMP0]], i64 8) ]
114+
; CHECK-NEXT: [[DOT0_COPYLOAD_I:%.*]] = load i64, ptr [[TMP0]], align 8
115+
; CHECK-NEXT: ret i64 [[DOT0_COPYLOAD_I]]
116+
;
117+
call void @llvm.assume(i1 true) [ "align"(ptr %0, i64 8) ]
118+
%l.fn3 = load i64, ptr %0, align 1
119+
ret i64 %l.fn3
120+
}

0 commit comments

Comments
 (0)