Skip to content

Commit 027b647

Browse files
authored
[X86] Add additional test coverage for #160111 (#162838)
1 parent 1d3ad74 commit 027b647

File tree

1 file changed

+240
-0
lines changed

1 file changed

+240
-0
lines changed
Lines changed: 240 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,240 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=x86-64 | FileCheck %s --check-prefixes=SSE
3+
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=x86-64-v2 | FileCheck %s --check-prefixes=SSE
4+
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=x86-64-v3 | FileCheck %s --check-prefixes=AVX,AVX2
5+
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=x86-64-v4 | FileCheck %s --check-prefixes=AVX,AVX512,AVX512-VL
6+
; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=x86-64-v4 -mattr=-avx512vl | FileCheck %s --check-prefixes=AVX,AVX512,AVX512-NOVL
7+
8+
;
9+
; fptosi -> sitofp
10+
;
11+
12+
define double @scvtf64_i32(double %a0) {
13+
; SSE-LABEL: scvtf64_i32:
14+
; SSE: # %bb.0:
15+
; SSE-NEXT: cvttpd2dq %xmm0, %xmm0
16+
; SSE-NEXT: cvtdq2pd %xmm0, %xmm0
17+
; SSE-NEXT: retq
18+
;
19+
; AVX-LABEL: scvtf64_i32:
20+
; AVX: # %bb.0:
21+
; AVX-NEXT: vcvttpd2dq %xmm0, %xmm0
22+
; AVX-NEXT: vcvtdq2pd %xmm0, %xmm0
23+
; AVX-NEXT: retq
24+
%ii = fptosi double %a0 to i32
25+
%ff = sitofp i32 %ii to double
26+
ret double %ff
27+
}
28+
29+
define double @scvtf64_i64(double %a0) {
30+
; SSE-LABEL: scvtf64_i64:
31+
; SSE: # %bb.0:
32+
; SSE-NEXT: cvttsd2si %xmm0, %rax
33+
; SSE-NEXT: xorps %xmm0, %xmm0
34+
; SSE-NEXT: cvtsi2sd %rax, %xmm0
35+
; SSE-NEXT: retq
36+
;
37+
; AVX-LABEL: scvtf64_i64:
38+
; AVX: # %bb.0:
39+
; AVX-NEXT: vcvttsd2si %xmm0, %rax
40+
; AVX-NEXT: vcvtsi2sd %rax, %xmm15, %xmm0
41+
; AVX-NEXT: retq
42+
%ii = fptosi double %a0 to i64
43+
%ff = sitofp i64 %ii to double
44+
ret double %ff
45+
}
46+
47+
define float @scvtf32_i32(float %a0) {
48+
; SSE-LABEL: scvtf32_i32:
49+
; SSE: # %bb.0:
50+
; SSE-NEXT: cvttps2dq %xmm0, %xmm0
51+
; SSE-NEXT: cvtdq2ps %xmm0, %xmm0
52+
; SSE-NEXT: retq
53+
;
54+
; AVX-LABEL: scvtf32_i32:
55+
; AVX: # %bb.0:
56+
; AVX-NEXT: vcvttps2dq %xmm0, %xmm0
57+
; AVX-NEXT: vcvtdq2ps %xmm0, %xmm0
58+
; AVX-NEXT: retq
59+
%ii = fptosi float %a0 to i32
60+
%ff = sitofp i32 %ii to float
61+
ret float %ff
62+
}
63+
64+
define float @scvtf32_i64(float %a0) {
65+
; SSE-LABEL: scvtf32_i64:
66+
; SSE: # %bb.0:
67+
; SSE-NEXT: cvttss2si %xmm0, %rax
68+
; SSE-NEXT: xorps %xmm0, %xmm0
69+
; SSE-NEXT: cvtsi2ss %rax, %xmm0
70+
; SSE-NEXT: retq
71+
;
72+
; AVX-LABEL: scvtf32_i64:
73+
; AVX: # %bb.0:
74+
; AVX-NEXT: vcvttss2si %xmm0, %rax
75+
; AVX-NEXT: vcvtsi2ss %rax, %xmm15, %xmm0
76+
; AVX-NEXT: retq
77+
%ii = fptosi float %a0 to i64
78+
%ff = sitofp i64 %ii to float
79+
ret float %ff
80+
}
81+
82+
;
83+
; fptoui -> uitofp
84+
;
85+
86+
define double @ucvtf64_i32(double %a0) {
87+
; SSE-LABEL: ucvtf64_i32:
88+
; SSE: # %bb.0:
89+
; SSE-NEXT: cvttsd2si %xmm0, %rax
90+
; SSE-NEXT: movl %eax, %eax
91+
; SSE-NEXT: xorps %xmm0, %xmm0
92+
; SSE-NEXT: cvtsi2sd %rax, %xmm0
93+
; SSE-NEXT: retq
94+
;
95+
; AVX2-LABEL: ucvtf64_i32:
96+
; AVX2: # %bb.0:
97+
; AVX2-NEXT: vcvttsd2si %xmm0, %rax
98+
; AVX2-NEXT: movl %eax, %eax
99+
; AVX2-NEXT: vcvtsi2sd %rax, %xmm15, %xmm0
100+
; AVX2-NEXT: retq
101+
;
102+
; AVX512-LABEL: ucvtf64_i32:
103+
; AVX512: # %bb.0:
104+
; AVX512-NEXT: vcvttsd2usi %xmm0, %eax
105+
; AVX512-NEXT: vcvtusi2sd %eax, %xmm15, %xmm0
106+
; AVX512-NEXT: retq
107+
%ii = fptoui double %a0 to i32
108+
%ff = uitofp i32 %ii to double
109+
ret double %ff
110+
}
111+
112+
define double @ucvtf64_i64(double %a0) {
113+
; SSE-LABEL: ucvtf64_i64:
114+
; SSE: # %bb.0:
115+
; SSE-NEXT: cvttsd2si %xmm0, %rax
116+
; SSE-NEXT: movq %rax, %rcx
117+
; SSE-NEXT: subsd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
118+
; SSE-NEXT: cvttsd2si %xmm0, %rdx
119+
; SSE-NEXT: sarq $63, %rcx
120+
; SSE-NEXT: andq %rcx, %rdx
121+
; SSE-NEXT: orq %rax, %rdx
122+
; SSE-NEXT: movq %rdx, %xmm1
123+
; SSE-NEXT: punpckldq {{.*#+}} xmm1 = xmm1[0],mem[0],xmm1[1],mem[1]
124+
; SSE-NEXT: subpd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm1
125+
; SSE-NEXT: movapd %xmm1, %xmm0
126+
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
127+
; SSE-NEXT: addsd %xmm1, %xmm0
128+
; SSE-NEXT: retq
129+
;
130+
; AVX2-LABEL: ucvtf64_i64:
131+
; AVX2: # %bb.0:
132+
; AVX2-NEXT: vcvttsd2si %xmm0, %rax
133+
; AVX2-NEXT: movq %rax, %rcx
134+
; AVX2-NEXT: vsubsd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
135+
; AVX2-NEXT: sarq $63, %rcx
136+
; AVX2-NEXT: vcvttsd2si %xmm0, %rdx
137+
; AVX2-NEXT: andq %rcx, %rdx
138+
; AVX2-NEXT: orq %rax, %rdx
139+
; AVX2-NEXT: vmovq %rdx, %xmm0
140+
; AVX2-NEXT: vpunpckldq {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[1],mem[1]
141+
; AVX2-NEXT: vsubpd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
142+
; AVX2-NEXT: vshufpd {{.*#+}} xmm1 = xmm0[1,0]
143+
; AVX2-NEXT: vaddsd %xmm0, %xmm1, %xmm0
144+
; AVX2-NEXT: retq
145+
;
146+
; AVX512-LABEL: ucvtf64_i64:
147+
; AVX512: # %bb.0:
148+
; AVX512-NEXT: vcvttsd2usi %xmm0, %rax
149+
; AVX512-NEXT: vcvtusi2sd %rax, %xmm15, %xmm0
150+
; AVX512-NEXT: retq
151+
%ii = fptoui double %a0 to i64
152+
%ff = uitofp i64 %ii to double
153+
ret double %ff
154+
}
155+
156+
define float @ucvtf32_i32(float %a0) {
157+
; SSE-LABEL: ucvtf32_i32:
158+
; SSE: # %bb.0:
159+
; SSE-NEXT: cvttss2si %xmm0, %rax
160+
; SSE-NEXT: movl %eax, %eax
161+
; SSE-NEXT: xorps %xmm0, %xmm0
162+
; SSE-NEXT: cvtsi2ss %rax, %xmm0
163+
; SSE-NEXT: retq
164+
;
165+
; AVX2-LABEL: ucvtf32_i32:
166+
; AVX2: # %bb.0:
167+
; AVX2-NEXT: vcvttss2si %xmm0, %rax
168+
; AVX2-NEXT: movl %eax, %eax
169+
; AVX2-NEXT: vcvtsi2ss %rax, %xmm15, %xmm0
170+
; AVX2-NEXT: retq
171+
;
172+
; AVX512-LABEL: ucvtf32_i32:
173+
; AVX512: # %bb.0:
174+
; AVX512-NEXT: vcvttss2usi %xmm0, %eax
175+
; AVX512-NEXT: vcvtusi2ss %eax, %xmm15, %xmm0
176+
; AVX512-NEXT: retq
177+
%ii = fptoui float %a0 to i32
178+
%ff = uitofp i32 %ii to float
179+
ret float %ff
180+
}
181+
182+
define float @ucvtf32_i64(float %a0) {
183+
; SSE-LABEL: ucvtf32_i64:
184+
; SSE: # %bb.0:
185+
; SSE-NEXT: cvttss2si %xmm0, %rcx
186+
; SSE-NEXT: movq %rcx, %rdx
187+
; SSE-NEXT: sarq $63, %rdx
188+
; SSE-NEXT: subss {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
189+
; SSE-NEXT: cvttss2si %xmm0, %rax
190+
; SSE-NEXT: andq %rdx, %rax
191+
; SSE-NEXT: orq %rcx, %rax
192+
; SSE-NEXT: js .LBB7_1
193+
; SSE-NEXT: # %bb.2:
194+
; SSE-NEXT: xorps %xmm0, %xmm0
195+
; SSE-NEXT: cvtsi2ss %rax, %xmm0
196+
; SSE-NEXT: retq
197+
; SSE-NEXT: .LBB7_1:
198+
; SSE-NEXT: movq %rax, %rcx
199+
; SSE-NEXT: shrq %rcx
200+
; SSE-NEXT: andl $1, %eax
201+
; SSE-NEXT: orq %rcx, %rax
202+
; SSE-NEXT: xorps %xmm0, %xmm0
203+
; SSE-NEXT: cvtsi2ss %rax, %xmm0
204+
; SSE-NEXT: addss %xmm0, %xmm0
205+
; SSE-NEXT: retq
206+
;
207+
; AVX2-LABEL: ucvtf32_i64:
208+
; AVX2: # %bb.0:
209+
; AVX2-NEXT: vcvttss2si %xmm0, %rcx
210+
; AVX2-NEXT: movq %rcx, %rdx
211+
; AVX2-NEXT: sarq $63, %rdx
212+
; AVX2-NEXT: vsubss {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
213+
; AVX2-NEXT: vcvttss2si %xmm0, %rax
214+
; AVX2-NEXT: andq %rdx, %rax
215+
; AVX2-NEXT: orq %rcx, %rax
216+
; AVX2-NEXT: js .LBB7_1
217+
; AVX2-NEXT: # %bb.2:
218+
; AVX2-NEXT: vcvtsi2ss %rax, %xmm15, %xmm0
219+
; AVX2-NEXT: retq
220+
; AVX2-NEXT: .LBB7_1:
221+
; AVX2-NEXT: movq %rax, %rcx
222+
; AVX2-NEXT: shrq %rcx
223+
; AVX2-NEXT: andl $1, %eax
224+
; AVX2-NEXT: orq %rcx, %rax
225+
; AVX2-NEXT: vcvtsi2ss %rax, %xmm15, %xmm0
226+
; AVX2-NEXT: vaddss %xmm0, %xmm0, %xmm0
227+
; AVX2-NEXT: retq
228+
;
229+
; AVX512-LABEL: ucvtf32_i64:
230+
; AVX512: # %bb.0:
231+
; AVX512-NEXT: vcvttss2usi %xmm0, %rax
232+
; AVX512-NEXT: vcvtusi2ss %rax, %xmm15, %xmm0
233+
; AVX512-NEXT: retq
234+
%ii = fptoui float %a0 to i64
235+
%ff = uitofp i64 %ii to float
236+
ret float %ff
237+
}
238+
;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
239+
; AVX512-NOVL: {{.*}}
240+
; AVX512-VL: {{.*}}

0 commit comments

Comments
 (0)