Skip to content

Commit 8cef004

Browse files
sparker-armmemfrob
authored andcommitted
[TypePromotion] Avoid some unnecessary truncs
Check for legal zext 'sinks' before inserting a trunc. Differential Revision: https://reviews.llvm.org/D115451
1 parent c51a37c commit 8cef004

File tree

3 files changed

+60
-0
lines changed

3 files changed

+60
-0
lines changed

llvm/lib/CodeGen/TypePromotion.cpp

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -550,6 +550,11 @@ void IRPromoter::TruncateSinks() {
550550
continue;
551551
}
552552

553+
// Don't insert a trunc for a zext which can still legally promote.
554+
if (auto ZExt = dyn_cast<ZExtInst>(I))
555+
if (ZExt->getType()->getScalarSizeInBits() > PromotedWidth)
556+
continue;
557+
553558
// Now handle the others.
554559
for (unsigned i = 0; i < I->getNumOperands(); ++i) {
555560
Type *Ty = TruncTysMap[I][i];
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
if not 'AArch64' in config.root.targets:
2+
config.unsupported = True
Lines changed: 53 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,53 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2+
; RUN: opt -mtriple=aarch64 -type-promotion -verify -S %s -o - | FileCheck %s
3+
4+
target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"
5+
6+
define dso_local i32 @avoid_trunc_gep(i8* nocapture readonly %ip) {
7+
; CHECK-LABEL: @avoid_trunc_gep(
8+
; CHECK-NEXT: entry:
9+
; CHECK-NEXT: [[TAG_0_IN8:%.*]] = load i8, i8* [[IP:%.*]], align 1
10+
; CHECK-NEXT: [[TMP0:%.*]] = zext i8 [[TAG_0_IN8]] to i32
11+
; CHECK-NEXT: [[CMP9:%.*]] = icmp ult i32 [[TMP0]], 100
12+
; CHECK-NEXT: br i1 [[CMP9]], label [[FOR_BODY_PREHEADER:%.*]], label [[FOR_END:%.*]]
13+
; CHECK: for.body.preheader:
14+
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
15+
; CHECK: for.body:
16+
; CHECK-NEXT: [[TAG_0_IN10:%.*]] = phi i32 [ [[TMP1:%.*]], [[FOR_BODY]] ], [ [[TMP0]], [[FOR_BODY_PREHEADER]] ]
17+
; CHECK-NEXT: [[TAG_0:%.*]] = zext i32 [[TAG_0_IN10]] to i64
18+
; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i8, i8* [[IP]], i64 [[TAG_0]]
19+
; CHECK-NEXT: [[TAG_0_IN:%.*]] = load i8, i8* [[ARRAYIDX]], align 1
20+
; CHECK-NEXT: [[TMP1]] = zext i8 [[TAG_0_IN]] to i32
21+
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[TMP1]], 100
22+
; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_END_LOOPEXIT:%.*]]
23+
; CHECK: for.end.loopexit:
24+
; CHECK-NEXT: br label [[FOR_END]]
25+
; CHECK: for.end:
26+
; CHECK-NEXT: [[TAG_0_IN_LCSSA:%.*]] = phi i32 [ [[TMP0]], [[ENTRY:%.*]] ], [ [[TMP1]], [[FOR_END_LOOPEXIT]] ]
27+
; CHECK-NEXT: [[TMP2:%.*]] = trunc i32 [[TAG_0_IN_LCSSA]] to i8
28+
; CHECK-NEXT: ret i32 [[TAG_0_IN_LCSSA]]
29+
;
30+
entry:
31+
%tag.0.in8 = load i8, i8* %ip, align 1
32+
%cmp9 = icmp ult i8 %tag.0.in8, 100
33+
br i1 %cmp9, label %for.body.preheader, label %for.end
34+
35+
for.body.preheader: ; preds = %entry
36+
br label %for.body
37+
38+
for.body: ; preds = %for.body.preheader, %for.body
39+
%tag.0.in10 = phi i8 [ %tag.0.in, %for.body ], [ %tag.0.in8, %for.body.preheader ]
40+
%tag.0 = zext i8 %tag.0.in10 to i64
41+
%arrayidx = getelementptr inbounds i8, i8* %ip, i64 %tag.0
42+
%tag.0.in = load i8, i8* %arrayidx, align 1
43+
%cmp = icmp ult i8 %tag.0.in, 100
44+
br i1 %cmp, label %for.body, label %for.end.loopexit
45+
46+
for.end.loopexit: ; preds = %for.body
47+
br label %for.end
48+
49+
for.end: ; preds = %for.end.loopexit, %entry
50+
%tag.0.in.lcssa = phi i8 [ %tag.0.in8, %entry ], [ %tag.0.in, %for.end.loopexit ]
51+
%conv3 = zext i8 %tag.0.in.lcssa to i32
52+
ret i32 %conv3
53+
}

0 commit comments

Comments
 (0)