Skip to content

Commit 7f6098e

Browse files
authored
[X86] Fix expand-fp on optnone functions (#156900)
As observed by @mikaelholmen, PR #130988 "[AMDGPU] Implement IR expansion for frem instruction" introduced a regression on x86. Its changes led to the pass being skipped on functions with the optnone attribute. @bjope also noted that a check concerning the optnone handling is wrong. This patch fixes both issues which together fixes the regression. During the review it was observed that, even before PR #130988, the pass would not run on optnone functions with the new pass manager. This is also fixed.
1 parent 94b164c commit 7f6098e

File tree

4 files changed

+353
-5
lines changed

4 files changed

+353
-5
lines changed

llvm/include/llvm/CodeGen/ExpandFp.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@ class ExpandFpPass : public PassInfoMixin<ExpandFpPass> {
2525
explicit ExpandFpPass(const TargetMachine *TM, CodeGenOptLevel OptLevel);
2626

2727
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
28-
28+
static bool isRequired() { return true; }
2929
void printPipeline(raw_ostream &OS,
3030
function_ref<StringRef(StringRef)> MapClassName2PassName);
3131
};

llvm/lib/CodeGen/ExpandFp.cpp

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1108,14 +1108,11 @@ class ExpandFpLegacyPass : public FunctionPass {
11081108
ExpandFpLegacyPass() : ExpandFpLegacyPass(CodeGenOptLevel::None) {};
11091109

11101110
bool runOnFunction(Function &F) override {
1111-
if (skipFunction(F))
1112-
return false;
1113-
11141111
auto *TM = &getAnalysis<TargetPassConfig>().getTM<TargetMachine>();
11151112
auto *TLI = TM->getSubtargetImpl(F)->getTargetLowering();
11161113
AssumptionCache *AC = nullptr;
11171114

1118-
if (OptLevel != CodeGenOptLevel::None || F.hasOptNone())
1115+
if (OptLevel != CodeGenOptLevel::None && !F.hasOptNone())
11191116
AC = &getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
11201117
return runImpl(F, *TLI, AC);
11211118
}
Lines changed: 252 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,252 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
2+
; RUN: llc -mtriple=x86_64-- < %s | FileCheck %s
3+
4+
; expand-fp must also run with optnone
5+
6+
; Function Attrs: noinline optnone
7+
define double @main(i224 %0) #0 {
8+
; CHECK-LABEL: main:
9+
; CHECK: # %bb.0: # %entryitofp-entry
10+
; CHECK-NEXT: pushq %rbp
11+
; CHECK-NEXT: .cfi_def_cfa_offset 16
12+
; CHECK-NEXT: pushq %r15
13+
; CHECK-NEXT: .cfi_def_cfa_offset 24
14+
; CHECK-NEXT: pushq %r14
15+
; CHECK-NEXT: .cfi_def_cfa_offset 32
16+
; CHECK-NEXT: pushq %r13
17+
; CHECK-NEXT: .cfi_def_cfa_offset 40
18+
; CHECK-NEXT: pushq %r12
19+
; CHECK-NEXT: .cfi_def_cfa_offset 48
20+
; CHECK-NEXT: pushq %rbx
21+
; CHECK-NEXT: .cfi_def_cfa_offset 56
22+
; CHECK-NEXT: subq $88, %rsp
23+
; CHECK-NEXT: .cfi_def_cfa_offset 144
24+
; CHECK-NEXT: .cfi_offset %rbx, -56
25+
; CHECK-NEXT: .cfi_offset %r12, -48
26+
; CHECK-NEXT: .cfi_offset %r13, -40
27+
; CHECK-NEXT: .cfi_offset %r14, -32
28+
; CHECK-NEXT: .cfi_offset %r15, -24
29+
; CHECK-NEXT: .cfi_offset %rbp, -16
30+
; CHECK-NEXT: movq %rdi, %rax
31+
; CHECK-NEXT: orq %rdx, %rax
32+
; CHECK-NEXT: movl %ecx, %r8d
33+
; CHECK-NEXT: movq %rsi, %r9
34+
; CHECK-NEXT: orq %r8, %r9
35+
; CHECK-NEXT: xorps %xmm0, %xmm0
36+
; CHECK-NEXT: orq %r9, %rax
37+
; CHECK-NEXT: je .LBB0_10
38+
; CHECK-NEXT: jmp .LBB0_1
39+
; CHECK-NEXT: .LBB0_1: # %itofp-if-end
40+
; CHECK-NEXT: movslq %ecx, %rax
41+
; CHECK-NEXT: movq %rax, %r9
42+
; CHECK-NEXT: sarq $31, %r9
43+
; CHECK-NEXT: sarq $63, %rax
44+
; CHECK-NEXT: xorq %rax, %rcx
45+
; CHECK-NEXT: xorq %rax, %rdx
46+
; CHECK-NEXT: xorq %rax, %rsi
47+
; CHECK-NEXT: xorq %r9, %rdi
48+
; CHECK-NEXT: subq %r9, %rdi
49+
; CHECK-NEXT: sbbq %rax, %rsi
50+
; CHECK-NEXT: sbbq %rax, %rdx
51+
; CHECK-NEXT: sbbq %rax, %rcx
52+
; CHECK-NEXT: movq %rcx, %r8
53+
; CHECK-NEXT: shldq $32, %rdx, %r8
54+
; CHECK-NEXT: bsrq %r8, %rax
55+
; CHECK-NEXT: xorl $63, %eax
56+
; CHECK-NEXT: movq %rdx, %r10
57+
; CHECK-NEXT: shldq $32, %rsi, %r10
58+
; CHECK-NEXT: bsrq %r10, %r11
59+
; CHECK-NEXT: xorl $63, %r11d
60+
; CHECK-NEXT: orl $64, %r11d
61+
; CHECK-NEXT: testq %r8, %r8
62+
; CHECK-NEXT: cmovnel %eax, %r11d
63+
; CHECK-NEXT: movq %rsi, %rbx
64+
; CHECK-NEXT: shldq $32, %rdi, %rbx
65+
; CHECK-NEXT: bsrq %rbx, %r14
66+
; CHECK-NEXT: xorl $63, %r14d
67+
; CHECK-NEXT: movq %rdi, %rax
68+
; CHECK-NEXT: shlq $32, %rax
69+
; CHECK-NEXT: bsrq %rax, %rax
70+
; CHECK-NEXT: xorl $63, %eax
71+
; CHECK-NEXT: orl $64, %eax
72+
; CHECK-NEXT: testq %rbx, %rbx
73+
; CHECK-NEXT: cmovnel %r14d, %eax
74+
; CHECK-NEXT: subl $-128, %eax
75+
; CHECK-NEXT: orq %r8, %r10
76+
; CHECK-NEXT: cmovnel %r11d, %eax
77+
; CHECK-NEXT: movl $224, %r11d
78+
; CHECK-NEXT: subl %eax, %r11d
79+
; CHECK-NEXT: movl $223, %r10d
80+
; CHECK-NEXT: subl %eax, %r10d
81+
; CHECK-NEXT: cmpl $53, %r11d
82+
; CHECK-NEXT: jle .LBB0_8
83+
; CHECK-NEXT: # %bb.2: # %itofp-if-then4
84+
; CHECK-NEXT: movl %r11d, %r8d
85+
; CHECK-NEXT: subl $54, %r8d
86+
; CHECK-NEXT: je .LBB0_4
87+
; CHECK-NEXT: jmp .LBB0_3
88+
; CHECK-NEXT: .LBB0_3: # %itofp-if-then4
89+
; CHECK-NEXT: movl %r11d, %r8d
90+
; CHECK-NEXT: subl $55, %r8d
91+
; CHECK-NEXT: jne .LBB0_5
92+
; CHECK-NEXT: # %bb.11:
93+
; CHECK-NEXT: jmp .LBB0_6
94+
; CHECK-NEXT: .LBB0_4: # %itofp-sw-bb
95+
; CHECK-NEXT: movq %rsi, %rax
96+
; CHECK-NEXT: shldq $1, %rdi, %rax
97+
; CHECK-NEXT: movq %rdx, %r8
98+
; CHECK-NEXT: shldq $1, %rsi, %r8
99+
; CHECK-NEXT: shldq $1, %rdx, %rcx
100+
; CHECK-NEXT: addq %rdi, %rdi
101+
; CHECK-NEXT: movq %rax, %rsi
102+
; CHECK-NEXT: movq %r8, %rdx
103+
; CHECK-NEXT: jmp .LBB0_6
104+
; CHECK-NEXT: .LBB0_5: # %itofp-sw-default
105+
; CHECK-NEXT: movq %rdi, -{{[0-9]+}}(%rsp)
106+
; CHECK-NEXT: movq %rsi, -{{[0-9]+}}(%rsp)
107+
; CHECK-NEXT: movq %rdx, -{{[0-9]+}}(%rsp)
108+
; CHECK-NEXT: movl %ecx, %r8d
109+
; CHECK-NEXT: movq %r8, -{{[0-9]+}}(%rsp)
110+
; CHECK-NEXT: movb $-87, %r8b
111+
; CHECK-NEXT: subb %al, %r8b
112+
; CHECK-NEXT: movb %r8b, %bl
113+
; CHECK-NEXT: shrb $6, %bl
114+
; CHECK-NEXT: movzbl %bl, %r12d
115+
; CHECK-NEXT: movq $0, {{[0-9]+}}(%rsp)
116+
; CHECK-NEXT: movq $0, (%rsp)
117+
; CHECK-NEXT: movq $0, -{{[0-9]+}}(%rsp)
118+
; CHECK-NEXT: movq $0, -{{[0-9]+}}(%rsp)
119+
; CHECK-NEXT: movq -24(%rsp,%r12,8), %rbx
120+
; CHECK-NEXT: movq -32(%rsp,%r12,8), %r13
121+
; CHECK-NEXT: movq %rcx, %rbp
122+
; CHECK-NEXT: movb %r8b, %cl
123+
; CHECK-NEXT: movq %r13, %r14
124+
; CHECK-NEXT: shrdq %cl, %rbx, %r14
125+
; CHECK-NEXT: movq %r14, {{[-0-9]+}}(%r{{[sb]}}p) # 8-byte Spill
126+
; CHECK-NEXT: movq -48(%rsp,%r12,8), %r15
127+
; CHECK-NEXT: movq -40(%rsp,%r12,8), %r12
128+
; CHECK-NEXT: movb %r8b, %cl
129+
; CHECK-NEXT: movq %r12, %r14
130+
; CHECK-NEXT: shrdq %cl, %r13, %r14
131+
; CHECK-NEXT: movb %r8b, %cl
132+
; CHECK-NEXT: shrq %cl, %rbx
133+
; CHECK-NEXT: movb %r8b, %cl
134+
; CHECK-NEXT: shrdq %cl, %r12, %r15
135+
; CHECK-NEXT: addb $55, %al
136+
; CHECK-NEXT: movq %rdi, -{{[0-9]+}}(%rsp)
137+
; CHECK-NEXT: movq %rsi, -{{[0-9]+}}(%rsp)
138+
; CHECK-NEXT: movq %rdx, -{{[0-9]+}}(%rsp)
139+
; CHECK-NEXT: movq %rbp, -{{[0-9]+}}(%rsp)
140+
; CHECK-NEXT: movq $0, -{{[0-9]+}}(%rsp)
141+
; CHECK-NEXT: movq $0, -{{[0-9]+}}(%rsp)
142+
; CHECK-NEXT: movq $0, -{{[0-9]+}}(%rsp)
143+
; CHECK-NEXT: movq $0, -{{[0-9]+}}(%rsp)
144+
; CHECK-NEXT: movb %al, %cl
145+
; CHECK-NEXT: shrb $3, %cl
146+
; CHECK-NEXT: andb $24, %cl
147+
; CHECK-NEXT: negb %cl
148+
; CHECK-NEXT: movsbq %cl, %rdx
149+
; CHECK-NEXT: movq -80(%rsp,%rdx), %rsi
150+
; CHECK-NEXT: movq -72(%rsp,%rdx), %rdi
151+
; CHECK-NEXT: movq -64(%rsp,%rdx), %r8
152+
; CHECK-NEXT: movb %al, %cl
153+
; CHECK-NEXT: movq %r8, %r12
154+
; CHECK-NEXT: shldq %cl, %rdi, %r12
155+
; CHECK-NEXT: movb %al, %cl
156+
; CHECK-NEXT: movq %rsi, %r13
157+
; CHECK-NEXT: shlq %cl, %r13
158+
; CHECK-NEXT: orq %r12, %r13
159+
; CHECK-NEXT: movq -56(%rsp,%rdx), %rdx
160+
; CHECK-NEXT: movb %al, %cl
161+
; CHECK-NEXT: shldq %cl, %r8, %rdx
162+
; CHECK-NEXT: movl %edx, %edx
163+
; CHECK-NEXT: movb %al, %cl
164+
; CHECK-NEXT: shldq %cl, %rsi, %rdi
165+
; CHECK-NEXT: orq %rdx, %rdi
166+
; CHECK-NEXT: xorl %eax, %eax
167+
; CHECK-NEXT: orq %rdi, %r13
168+
; CHECK-NEXT: setne %al
169+
; CHECK-NEXT: orq %rax, %r15
170+
; CHECK-NEXT: movq %r15, %rdi
171+
; CHECK-NEXT: movq %r14, %rsi
172+
; CHECK-NEXT: movq {{[-0-9]+}}(%r{{[sb]}}p), %rdx # 8-byte Reload
173+
; CHECK-NEXT: movq %rbx, %rcx
174+
; CHECK-NEXT: jmp .LBB0_6
175+
; CHECK-NEXT: .LBB0_6: # %itofp-sw-epilog
176+
; CHECK-NEXT: movl %edi, %eax
177+
; CHECK-NEXT: shrl $2, %eax
178+
; CHECK-NEXT: andl $1, %eax
179+
; CHECK-NEXT: orq %rax, %rdi
180+
; CHECK-NEXT: addq $1, %rdi
181+
; CHECK-NEXT: adcq $0, %rsi
182+
; CHECK-NEXT: adcq $0, %rdx
183+
; CHECK-NEXT: adcq $0, %rcx
184+
; CHECK-NEXT: movq %rsi, %rdx
185+
; CHECK-NEXT: shldq $62, %rdi, %rdx
186+
; CHECK-NEXT: movq %rdx, %rax
187+
; CHECK-NEXT: shrq $32, %rax
188+
; CHECK-NEXT: btq $55, %rdi
189+
; CHECK-NEXT: jae .LBB0_9
190+
; CHECK-NEXT: jmp .LBB0_7
191+
; CHECK-NEXT: .LBB0_7: # %itofp-if-then20
192+
; CHECK-NEXT: shldq $61, %rdi, %rsi
193+
; CHECK-NEXT: movq %rsi, %rax
194+
; CHECK-NEXT: shrq $32, %rax
195+
; CHECK-NEXT: movq %rsi, %rdx
196+
; CHECK-NEXT: movl %r11d, %r10d
197+
; CHECK-NEXT: jmp .LBB0_9
198+
; CHECK-NEXT: .LBB0_8: # %itofp-if-else
199+
; CHECK-NEXT: movq %rdi, {{[0-9]+}}(%rsp)
200+
; CHECK-NEXT: movq %rsi, {{[0-9]+}}(%rsp)
201+
; CHECK-NEXT: movq %rdx, {{[0-9]+}}(%rsp)
202+
; CHECK-NEXT: movq %rcx, {{[0-9]+}}(%rsp)
203+
; CHECK-NEXT: movq $0, {{[0-9]+}}(%rsp)
204+
; CHECK-NEXT: movq $0, {{[0-9]+}}(%rsp)
205+
; CHECK-NEXT: movq $0, {{[0-9]+}}(%rsp)
206+
; CHECK-NEXT: movq $0, {{[0-9]+}}(%rsp)
207+
; CHECK-NEXT: addb $85, %al
208+
; CHECK-NEXT: movb %al, %cl
209+
; CHECK-NEXT: shrb $3, %cl
210+
; CHECK-NEXT: andb $24, %cl
211+
; CHECK-NEXT: negb %cl
212+
; CHECK-NEXT: movsbq %cl, %rcx
213+
; CHECK-NEXT: movq 48(%rsp,%rcx), %rdx
214+
; CHECK-NEXT: movb %al, %cl
215+
; CHECK-NEXT: shlq %cl, %rdx
216+
; CHECK-NEXT: movq %rdx, %rax
217+
; CHECK-NEXT: shrq $32, %rax
218+
; CHECK-NEXT: .LBB0_9: # %itofp-if-end26
219+
; CHECK-NEXT: andl $-2147483648, %r9d # imm = 0x80000000
220+
; CHECK-NEXT: shll $20, %r10d
221+
; CHECK-NEXT: addl $1072693248, %r10d # imm = 0x3FF00000
222+
; CHECK-NEXT: andl $1048575, %eax # imm = 0xFFFFF
223+
; CHECK-NEXT: orl %r9d, %eax
224+
; CHECK-NEXT: orl %r10d, %eax
225+
; CHECK-NEXT: movl %eax, %eax
226+
; CHECK-NEXT: shlq $32, %rax
227+
; CHECK-NEXT: movabsq $4294967295, %rcx # imm = 0xFFFFFFFF
228+
; CHECK-NEXT: andq %rcx, %rdx
229+
; CHECK-NEXT: orq %rdx, %rax
230+
; CHECK-NEXT: movq %rax, %xmm0
231+
; CHECK-NEXT: .LBB0_10: # %itofp-return
232+
; CHECK-NEXT: addq $88, %rsp
233+
; CHECK-NEXT: .cfi_def_cfa_offset 56
234+
; CHECK-NEXT: popq %rbx
235+
; CHECK-NEXT: .cfi_def_cfa_offset 48
236+
; CHECK-NEXT: popq %r12
237+
; CHECK-NEXT: .cfi_def_cfa_offset 40
238+
; CHECK-NEXT: popq %r13
239+
; CHECK-NEXT: .cfi_def_cfa_offset 32
240+
; CHECK-NEXT: popq %r14
241+
; CHECK-NEXT: .cfi_def_cfa_offset 24
242+
; CHECK-NEXT: popq %r15
243+
; CHECK-NEXT: .cfi_def_cfa_offset 16
244+
; CHECK-NEXT: popq %rbp
245+
; CHECK-NEXT: .cfi_def_cfa_offset 8
246+
; CHECK-NEXT: retq
247+
entry:
248+
%x = sitofp i224 %0 to double
249+
ret double %x
250+
}
251+
252+
attributes #0 = { noinline optnone }
Lines changed: 99 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,99 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt -S -mtriple=x86_64-- --expand-fp < %s | FileCheck %s
3+
; RUN: opt -S -mtriple=x86_64-- -passes=expand-fp < %s | FileCheck %s
4+
5+
; expand-fp must also run with optnone
6+
7+
; Function Attrs: noinline optnone
8+
define double @main(i224 %0) #0 {
9+
; CHECK-LABEL: define double @main(
10+
; CHECK-SAME: i224 [[TMP0:%.*]]) #[[ATTR0:[0-9]+]] {
11+
; CHECK-NEXT: [[ENTRYITOFP_ENTRY:.*]]:
12+
; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i224 [[TMP0]], 0
13+
; CHECK-NEXT: br i1 [[TMP1]], label %[[ITOFP_RETURN:.*]], label %[[ITOFP_IF_END:.*]]
14+
; CHECK: [[ITOFP_IF_END]]:
15+
; CHECK-NEXT: [[TMP2:%.*]] = ashr i224 [[TMP0]], 223
16+
; CHECK-NEXT: [[TMP3:%.*]] = xor i224 [[TMP2]], [[TMP0]]
17+
; CHECK-NEXT: [[TMP4:%.*]] = sub i224 [[TMP3]], [[TMP2]]
18+
; CHECK-NEXT: [[TMP5:%.*]] = call i224 @llvm.ctlz.i224(i224 [[TMP4]], i1 true)
19+
; CHECK-NEXT: [[TMP6:%.*]] = trunc i224 [[TMP5]] to i32
20+
; CHECK-NEXT: [[TMP7:%.*]] = sub i32 224, [[TMP6]]
21+
; CHECK-NEXT: [[TMP8:%.*]] = sub i32 223, [[TMP6]]
22+
; CHECK-NEXT: [[TMP9:%.*]] = icmp sgt i32 [[TMP7]], 53
23+
; CHECK-NEXT: br i1 [[TMP9]], label %[[ITOFP_IF_THEN4:.*]], label %[[ITOFP_IF_ELSE:.*]]
24+
; CHECK: [[ITOFP_IF_THEN4]]:
25+
; CHECK-NEXT: switch i32 [[TMP7]], label %[[ITOFP_SW_DEFAULT:.*]] [
26+
; CHECK-NEXT: i32 54, label %[[ITOFP_SW_BB:.*]]
27+
; CHECK-NEXT: i32 55, label %[[ITOFP_SW_EPILOG:.*]]
28+
; CHECK-NEXT: ]
29+
; CHECK: [[ITOFP_SW_BB]]:
30+
; CHECK-NEXT: [[TMP10:%.*]] = shl i224 [[TMP4]], 1
31+
; CHECK-NEXT: br label %[[ITOFP_SW_EPILOG]]
32+
; CHECK: [[ITOFP_SW_DEFAULT]]:
33+
; CHECK-NEXT: [[TMP11:%.*]] = sub i32 169, [[TMP6]]
34+
; CHECK-NEXT: [[TMP12:%.*]] = zext i32 [[TMP11]] to i224
35+
; CHECK-NEXT: [[TMP13:%.*]] = lshr i224 [[TMP4]], [[TMP12]]
36+
; CHECK-NEXT: [[TMP14:%.*]] = add i32 [[TMP6]], 55
37+
; CHECK-NEXT: [[TMP15:%.*]] = zext i32 [[TMP14]] to i224
38+
; CHECK-NEXT: [[TMP16:%.*]] = lshr i224 -1, [[TMP15]]
39+
; CHECK-NEXT: [[TMP17:%.*]] = and i224 [[TMP16]], [[TMP4]]
40+
; CHECK-NEXT: [[TMP18:%.*]] = icmp ne i224 [[TMP17]], 0
41+
; CHECK-NEXT: [[TMP19:%.*]] = zext i1 [[TMP18]] to i224
42+
; CHECK-NEXT: [[TMP20:%.*]] = or i224 [[TMP13]], [[TMP19]]
43+
; CHECK-NEXT: br label %[[ITOFP_SW_EPILOG]]
44+
; CHECK: [[ITOFP_SW_EPILOG]]:
45+
; CHECK-NEXT: [[TMP21:%.*]] = phi i224 [ [[TMP20]], %[[ITOFP_SW_DEFAULT]] ], [ [[TMP4]], %[[ITOFP_IF_THEN4]] ], [ [[TMP10]], %[[ITOFP_SW_BB]] ]
46+
; CHECK-NEXT: [[TMP22:%.*]] = trunc i224 [[TMP21]] to i32
47+
; CHECK-NEXT: [[TMP23:%.*]] = lshr i32 [[TMP22]], 2
48+
; CHECK-NEXT: [[TMP24:%.*]] = and i32 [[TMP23]], 1
49+
; CHECK-NEXT: [[TMP25:%.*]] = zext i32 [[TMP24]] to i224
50+
; CHECK-NEXT: [[TMP26:%.*]] = or i224 [[TMP21]], [[TMP25]]
51+
; CHECK-NEXT: [[TMP27:%.*]] = add i224 [[TMP26]], 1
52+
; CHECK-NEXT: [[TMP28:%.*]] = ashr i224 [[TMP27]], 2
53+
; CHECK-NEXT: [[A3:%.*]] = and i224 [[TMP27]], 36028797018963968
54+
; CHECK-NEXT: [[TMP29:%.*]] = icmp eq i224 [[A3]], 0
55+
; CHECK-NEXT: [[TMP30:%.*]] = trunc i224 [[TMP28]] to i64
56+
; CHECK-NEXT: [[TMP31:%.*]] = lshr i224 [[TMP28]], 32
57+
; CHECK-NEXT: [[TMP32:%.*]] = trunc i224 [[TMP31]] to i32
58+
; CHECK-NEXT: br i1 [[TMP29]], label %[[ITOFP_IF_END26:.*]], label %[[ITOFP_IF_THEN20:.*]]
59+
; CHECK: [[ITOFP_IF_THEN20]]:
60+
; CHECK-NEXT: [[TMP33:%.*]] = ashr i224 [[TMP27]], 3
61+
; CHECK-NEXT: [[TMP34:%.*]] = trunc i224 [[TMP33]] to i64
62+
; CHECK-NEXT: [[TMP35:%.*]] = lshr i224 [[TMP33]], 32
63+
; CHECK-NEXT: [[TMP36:%.*]] = trunc i224 [[TMP35]] to i32
64+
; CHECK-NEXT: br label %[[ITOFP_IF_END26]]
65+
; CHECK: [[ITOFP_IF_ELSE]]:
66+
; CHECK-NEXT: [[TMP37:%.*]] = add i32 [[TMP6]], -171
67+
; CHECK-NEXT: [[TMP38:%.*]] = zext i32 [[TMP37]] to i224
68+
; CHECK-NEXT: [[TMP39:%.*]] = shl i224 [[TMP4]], [[TMP38]]
69+
; CHECK-NEXT: [[TMP40:%.*]] = trunc i224 [[TMP39]] to i64
70+
; CHECK-NEXT: [[TMP41:%.*]] = lshr i224 [[TMP39]], 32
71+
; CHECK-NEXT: [[TMP42:%.*]] = trunc i224 [[TMP41]] to i32
72+
; CHECK-NEXT: br label %[[ITOFP_IF_END26]]
73+
; CHECK: [[ITOFP_IF_END26]]:
74+
; CHECK-NEXT: [[TMP43:%.*]] = phi i64 [ [[TMP34]], %[[ITOFP_IF_THEN20]] ], [ [[TMP30]], %[[ITOFP_SW_EPILOG]] ], [ [[TMP40]], %[[ITOFP_IF_ELSE]] ]
75+
; CHECK-NEXT: [[TMP44:%.*]] = phi i32 [ [[TMP36]], %[[ITOFP_IF_THEN20]] ], [ [[TMP32]], %[[ITOFP_SW_EPILOG]] ], [ [[TMP42]], %[[ITOFP_IF_ELSE]] ]
76+
; CHECK-NEXT: [[TMP45:%.*]] = phi i32 [ [[TMP7]], %[[ITOFP_IF_THEN20]] ], [ [[TMP8]], %[[ITOFP_SW_EPILOG]] ], [ [[TMP8]], %[[ITOFP_IF_ELSE]] ]
77+
; CHECK-NEXT: [[TMP46:%.*]] = trunc i224 [[TMP2]] to i32
78+
; CHECK-NEXT: [[TMP47:%.*]] = and i32 [[TMP46]], -2147483648
79+
; CHECK-NEXT: [[TMP48:%.*]] = shl i32 [[TMP45]], 20
80+
; CHECK-NEXT: [[TMP49:%.*]] = add i32 [[TMP48]], 1072693248
81+
; CHECK-NEXT: [[TMP50:%.*]] = and i32 [[TMP44]], 1048575
82+
; CHECK-NEXT: [[TMP51:%.*]] = or i32 [[TMP50]], [[TMP47]]
83+
; CHECK-NEXT: [[TMP52:%.*]] = or i32 [[TMP51]], [[TMP49]]
84+
; CHECK-NEXT: [[TMP53:%.*]] = zext i32 [[TMP52]] to i64
85+
; CHECK-NEXT: [[TMP54:%.*]] = shl i64 [[TMP53]], 32
86+
; CHECK-NEXT: [[TMP55:%.*]] = and i64 [[TMP43]], 4294967295
87+
; CHECK-NEXT: [[TMP56:%.*]] = or i64 [[TMP54]], [[TMP55]]
88+
; CHECK-NEXT: [[TMP57:%.*]] = bitcast i64 [[TMP56]] to double
89+
; CHECK-NEXT: br label %[[ITOFP_RETURN]]
90+
; CHECK: [[ITOFP_RETURN]]:
91+
; CHECK-NEXT: [[TMP58:%.*]] = phi double [ [[TMP57]], %[[ITOFP_IF_END26]] ], [ 0.000000e+00, %[[ENTRYITOFP_ENTRY]] ]
92+
; CHECK-NEXT: ret double [[TMP58]]
93+
;
94+
entry:
95+
%x = sitofp i224 %0 to double
96+
ret double %x
97+
}
98+
99+
attributes #0 = { noinline optnone }

0 commit comments

Comments
 (0)