|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
2 | | -; RUN: llc < %s -mtriple=i386-apple-darwin -mcpu=yonah -regalloc=basic | FileCheck %s --check-prefix=X32 |
| 2 | +; RUN: llc < %s -mtriple=i386-apple-darwin -mcpu=yonah -regalloc=basic | FileCheck %s --check-prefix=X86 |
3 | 3 | ; RUN: llc < %s -mtriple=x86_64-apple-darwin -regalloc=basic | FileCheck %s --check-prefix=X64 |
4 | 4 |
|
5 | 5 | ; This testcase should need to spill the -1 value on both x86-32 and x86-64, |
|
15 | 15 | %struct._image2d_t = type <{ ptr, %struct._cl_image_format_t, i32, i32, i32, i32, i32, i32 }> |
16 | 16 |
|
17 | 17 | define void @program_1(ptr %dest, ptr %t0, <4 x float> %p0, <4 x float> %p1, <4 x float> %p4, <4 x float> %p5, <4 x float> %p6) nounwind { |
18 | | -; X32-LABEL: program_1: |
19 | | -; X32: ## %bb.0: ## %entry |
20 | | -; X32-NEXT: cmpl $0, 0 |
21 | | -; X32-NEXT: jle LBB0_2 |
22 | | -; X32-NEXT: ## %bb.1: ## %forcond |
23 | | -; X32-NEXT: cmpl $0, 0 |
24 | | -; X32-NEXT: jg LBB0_3 |
25 | | -; X32-NEXT: LBB0_2: ## %ifthen |
26 | | -; X32-NEXT: retl |
27 | | -; X32-NEXT: LBB0_3: ## %forbody |
28 | | -; X32-NEXT: pushl %esi |
29 | | -; X32-NEXT: subl $88, %esp |
30 | | -; X32-NEXT: movaps {{.*#+}} xmm1 = [1.28E+2,1.28E+2,1.28E+2,1.28E+2] |
31 | | -; X32-NEXT: minps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm1 |
32 | | -; X32-NEXT: cvttps2dq %xmm1, %xmm0 |
33 | | -; X32-NEXT: cvtdq2ps %xmm0, %xmm0 |
34 | | -; X32-NEXT: subps %xmm0, %xmm1 |
35 | | -; X32-NEXT: movaps %xmm1, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
36 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
37 | | -; X32-NEXT: mulps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
38 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
39 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
40 | | -; X32-NEXT: addps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
41 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
42 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
43 | | -; X32-NEXT: mulps %xmm1, %xmm0 |
44 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
45 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
46 | | -; X32-NEXT: addps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
47 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
48 | | -; X32-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
49 | | -; X32-NEXT: psubd {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
50 | | -; X32-NEXT: movdqa %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
51 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
52 | | -; X32-NEXT: mulps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
53 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
54 | | -; X32-NEXT: xorps %xmm0, %xmm0 |
55 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
56 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
57 | | -; X32-NEXT: mulps %xmm0, %xmm0 |
58 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
59 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
60 | | -; X32-NEXT: mulps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
61 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
62 | | -; X32-NEXT: xorps %xmm0, %xmm0 |
63 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
64 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
65 | | -; X32-NEXT: cmpunordps %xmm0, %xmm0 |
66 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
67 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
68 | | -; X32-NEXT: minps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
69 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
70 | | -; X32-NEXT: xorps %xmm0, %xmm0 |
71 | | -; X32-NEXT: movaps %xmm0, {{[0-9]+}}(%esp) |
72 | | -; X32-NEXT: movl $0, (%esp) |
73 | | -; X32-NEXT: xorl %esi, %esi |
74 | | -; X32-NEXT: xorps %xmm3, %xmm3 |
75 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
76 | | -; X32-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm1 ## 16-byte Reload |
77 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm2 ## 16-byte Reload |
78 | | -; X32-NEXT: calll *%esi |
79 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
80 | | -; X32-NEXT: minps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
81 | | -; X32-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
82 | | -; X32-NEXT: pxor %xmm1, %xmm1 |
83 | | -; X32-NEXT: psubd {{[-0-9]+}}(%e{{[sb]}}p), %xmm1 ## 16-byte Folded Reload |
84 | | -; X32-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
85 | | -; X32-NEXT: psubd {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
86 | | -; X32-NEXT: movdqa %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
87 | | -; X32-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
88 | | -; X32-NEXT: por %xmm1, %xmm0 |
89 | | -; X32-NEXT: movdqa %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
90 | | -; X32-NEXT: pxor %xmm0, %xmm0 |
91 | | -; X32-NEXT: movdqa %xmm0, {{[0-9]+}}(%esp) |
92 | | -; X32-NEXT: movl $0, (%esp) |
93 | | -; X32-NEXT: xorps %xmm3, %xmm3 |
94 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
95 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm1 ## 16-byte Reload |
96 | | -; X32-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm2 ## 16-byte Reload |
97 | | -; X32-NEXT: calll *%esi |
98 | | -; X32-NEXT: ud2 |
| 18 | +; X86-LABEL: program_1: |
| 19 | +; X86: ## %bb.0: ## %entry |
| 20 | +; X86-NEXT: cmpl $0, 0 |
| 21 | +; X86-NEXT: jle LBB0_2 |
| 22 | +; X86-NEXT: ## %bb.1: ## %forcond |
| 23 | +; X86-NEXT: cmpl $0, 0 |
| 24 | +; X86-NEXT: jg LBB0_3 |
| 25 | +; X86-NEXT: LBB0_2: ## %ifthen |
| 26 | +; X86-NEXT: retl |
| 27 | +; X86-NEXT: LBB0_3: ## %forbody |
| 28 | +; X86-NEXT: pushl %esi |
| 29 | +; X86-NEXT: subl $88, %esp |
| 30 | +; X86-NEXT: movaps {{.*#+}} xmm1 = [1.28E+2,1.28E+2,1.28E+2,1.28E+2] |
| 31 | +; X86-NEXT: minps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm1 |
| 32 | +; X86-NEXT: cvttps2dq %xmm1, %xmm0 |
| 33 | +; X86-NEXT: cvtdq2ps %xmm0, %xmm0 |
| 34 | +; X86-NEXT: subps %xmm0, %xmm1 |
| 35 | +; X86-NEXT: movaps %xmm1, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 36 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 37 | +; X86-NEXT: mulps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 38 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 39 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 40 | +; X86-NEXT: addps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 41 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 42 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 43 | +; X86-NEXT: mulps %xmm1, %xmm0 |
| 44 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 45 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 46 | +; X86-NEXT: addps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 47 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 48 | +; X86-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 49 | +; X86-NEXT: psubd {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 50 | +; X86-NEXT: movdqa %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 51 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 52 | +; X86-NEXT: mulps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 53 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 54 | +; X86-NEXT: xorps %xmm0, %xmm0 |
| 55 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 56 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 57 | +; X86-NEXT: mulps %xmm0, %xmm0 |
| 58 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 59 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 60 | +; X86-NEXT: mulps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 61 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 62 | +; X86-NEXT: xorps %xmm0, %xmm0 |
| 63 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 64 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 65 | +; X86-NEXT: cmpunordps %xmm0, %xmm0 |
| 66 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 67 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 68 | +; X86-NEXT: minps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 69 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 70 | +; X86-NEXT: xorps %xmm0, %xmm0 |
| 71 | +; X86-NEXT: movaps %xmm0, {{[0-9]+}}(%esp) |
| 72 | +; X86-NEXT: movl $0, (%esp) |
| 73 | +; X86-NEXT: xorl %esi, %esi |
| 74 | +; X86-NEXT: xorps %xmm3, %xmm3 |
| 75 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 76 | +; X86-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm1 ## 16-byte Reload |
| 77 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm2 ## 16-byte Reload |
| 78 | +; X86-NEXT: calll *%esi |
| 79 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 80 | +; X86-NEXT: minps {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 81 | +; X86-NEXT: movaps %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 82 | +; X86-NEXT: pxor %xmm1, %xmm1 |
| 83 | +; X86-NEXT: psubd {{[-0-9]+}}(%e{{[sb]}}p), %xmm1 ## 16-byte Folded Reload |
| 84 | +; X86-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 85 | +; X86-NEXT: psubd {{\.?LCPI[0-9]+_[0-9]+}}, %xmm0 |
| 86 | +; X86-NEXT: movdqa %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 87 | +; X86-NEXT: movdqa {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 88 | +; X86-NEXT: por %xmm1, %xmm0 |
| 89 | +; X86-NEXT: movdqa %xmm0, {{[-0-9]+}}(%e{{[sb]}}p) ## 16-byte Spill |
| 90 | +; X86-NEXT: pxor %xmm0, %xmm0 |
| 91 | +; X86-NEXT: movdqa %xmm0, {{[0-9]+}}(%esp) |
| 92 | +; X86-NEXT: movl $0, (%esp) |
| 93 | +; X86-NEXT: xorps %xmm3, %xmm3 |
| 94 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm0 ## 16-byte Reload |
| 95 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm1 ## 16-byte Reload |
| 96 | +; X86-NEXT: movaps {{[-0-9]+}}(%e{{[sb]}}p), %xmm2 ## 16-byte Reload |
| 97 | +; X86-NEXT: calll *%esi |
| 98 | +; X86-NEXT: ud2 |
99 | 99 | ; |
100 | 100 | ; X64-LABEL: program_1: |
101 | 101 | ; X64: ## %bb.0: ## %entry |
|
0 commit comments