|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| 2 | +; RUN: llc %s -o - -mtriple=x86_64-unknown-linux -enable-spill2reg -mattr=+sse4.1 | FileCheck %s |
| 3 | + |
| 4 | +; End-to-end check that Spill2Reg works with 16-bit registers. |
| 5 | + |
| 6 | +target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" |
| 7 | +target triple = "x86_64-unknown-linux-gnu" |
| 8 | + |
| 9 | +@D0 = dso_local local_unnamed_addr global i16 0, align 4 |
| 10 | +@D1 = dso_local local_unnamed_addr global i16 0, align 4 |
| 11 | +@D2 = dso_local local_unnamed_addr global i16 0, align 4 |
| 12 | +@D3 = dso_local local_unnamed_addr global i16 0, align 4 |
| 13 | +@D4 = dso_local local_unnamed_addr global i16 0, align 4 |
| 14 | +@D5 = dso_local local_unnamed_addr global i16 0, align 4 |
| 15 | +@D6 = dso_local local_unnamed_addr global i16 0, align 4 |
| 16 | +@D7 = dso_local local_unnamed_addr global i16 0, align 4 |
| 17 | +@D8 = dso_local local_unnamed_addr global i16 0, align 4 |
| 18 | +@D9 = dso_local local_unnamed_addr global i16 0, align 4 |
| 19 | +@D10 = dso_local local_unnamed_addr global i16 0, align 4 |
| 20 | +@D11 = dso_local local_unnamed_addr global i16 0, align 4 |
| 21 | +@D12 = dso_local local_unnamed_addr global i16 0, align 4 |
| 22 | +@D13 = dso_local local_unnamed_addr global i16 0, align 4 |
| 23 | +@D14 = dso_local local_unnamed_addr global i16 0, align 4 |
| 24 | +@D15 = dso_local local_unnamed_addr global i16 0, align 4 |
| 25 | +@D16 = dso_local local_unnamed_addr global i16 0, align 4 |
| 26 | +@D17 = dso_local local_unnamed_addr global i16 0, align 4 |
| 27 | +@D18 = dso_local local_unnamed_addr global i16 0, align 4 |
| 28 | +@U0 = dso_local local_unnamed_addr global i16 0, align 4 |
| 29 | +@U1 = dso_local local_unnamed_addr global i16 0, align 4 |
| 30 | +@U2 = dso_local local_unnamed_addr global i16 0, align 4 |
| 31 | +@U3 = dso_local local_unnamed_addr global i16 0, align 4 |
| 32 | +@U4 = dso_local local_unnamed_addr global i16 0, align 4 |
| 33 | +@U5 = dso_local local_unnamed_addr global i16 0, align 4 |
| 34 | +@U6 = dso_local local_unnamed_addr global i16 0, align 4 |
| 35 | +@U7 = dso_local local_unnamed_addr global i16 0, align 4 |
| 36 | +@U8 = dso_local local_unnamed_addr global i16 0, align 4 |
| 37 | +@U9 = dso_local local_unnamed_addr global i16 0, align 4 |
| 38 | +@U10 = dso_local local_unnamed_addr global i16 0, align 4 |
| 39 | +@U11 = dso_local local_unnamed_addr global i16 0, align 4 |
| 40 | +@U12 = dso_local local_unnamed_addr global i16 0, align 4 |
| 41 | +@U13 = dso_local local_unnamed_addr global i16 0, align 4 |
| 42 | +@U14 = dso_local local_unnamed_addr global i16 0, align 4 |
| 43 | +@U15 = dso_local local_unnamed_addr global i16 0, align 4 |
| 44 | +@U16 = dso_local local_unnamed_addr global i16 0, align 4 |
| 45 | +@U17 = dso_local local_unnamed_addr global i16 0, align 4 |
| 46 | +@U18 = dso_local local_unnamed_addr global i16 0, align 4 |
| 47 | + |
| 48 | +; Function Attrs: mustprogress noinline nounwind uwtable |
| 49 | +define dso_local void @_Z5spillv() local_unnamed_addr #0 { |
| 50 | +; CHECK-LABEL: _Z5spillv: |
| 51 | +; CHECK: # %bb.0: # %entry |
| 52 | +; CHECK-NEXT: pushq %rbp |
| 53 | +; CHECK-NEXT: .cfi_def_cfa_offset 16 |
| 54 | +; CHECK-NEXT: pushq %r15 |
| 55 | +; CHECK-NEXT: .cfi_def_cfa_offset 24 |
| 56 | +; CHECK-NEXT: pushq %r14 |
| 57 | +; CHECK-NEXT: .cfi_def_cfa_offset 32 |
| 58 | +; CHECK-NEXT: pushq %r13 |
| 59 | +; CHECK-NEXT: .cfi_def_cfa_offset 40 |
| 60 | +; CHECK-NEXT: pushq %r12 |
| 61 | +; CHECK-NEXT: .cfi_def_cfa_offset 48 |
| 62 | +; CHECK-NEXT: pushq %rbx |
| 63 | +; CHECK-NEXT: .cfi_def_cfa_offset 56 |
| 64 | +; CHECK-NEXT: .cfi_offset %rbx, -56 |
| 65 | +; CHECK-NEXT: .cfi_offset %r12, -48 |
| 66 | +; CHECK-NEXT: .cfi_offset %r13, -40 |
| 67 | +; CHECK-NEXT: .cfi_offset %r14, -32 |
| 68 | +; CHECK-NEXT: .cfi_offset %r15, -24 |
| 69 | +; CHECK-NEXT: .cfi_offset %rbp, -16 |
| 70 | +; CHECK-NEXT: movzwl D0(%rip), %eax |
| 71 | +; CHECK-NEXT: movw %ax, {{[-0-9]+}}(%r{{[sb]}}p) # 2-byte Spill |
| 72 | +; CHECK-NEXT: movzwl D1(%rip), %ecx |
| 73 | +; CHECK-NEXT: movzwl D2(%rip), %edx |
| 74 | +; CHECK-NEXT: movzwl D3(%rip), %esi |
| 75 | +; CHECK-NEXT: movzwl D4(%rip), %edi |
| 76 | +; CHECK-NEXT: movzwl D5(%rip), %r8d |
| 77 | +; CHECK-NEXT: movzwl D6(%rip), %r9d |
| 78 | +; CHECK-NEXT: movzwl D7(%rip), %r10d |
| 79 | +; CHECK-NEXT: movzwl D8(%rip), %r11d |
| 80 | +; CHECK-NEXT: movzwl D9(%rip), %ebx |
| 81 | +; CHECK-NEXT: movzwl D10(%rip), %ebp |
| 82 | +; CHECK-NEXT: movzwl D11(%rip), %r14d |
| 83 | +; CHECK-NEXT: movzwl D12(%rip), %r15d |
| 84 | +; CHECK-NEXT: movzwl D13(%rip), %r12d |
| 85 | +; CHECK-NEXT: movzwl D14(%rip), %r13d |
| 86 | +; CHECK-NEXT: movzwl D15(%rip), %eax |
| 87 | +; CHECK-NEXT: movw %ax, {{[-0-9]+}}(%r{{[sb]}}p) # 2-byte Spill |
| 88 | +; CHECK-NEXT: movzwl D16(%rip), %eax |
| 89 | +; CHECK-NEXT: movw %ax, {{[-0-9]+}}(%r{{[sb]}}p) # 2-byte Spill |
| 90 | +; CHECK-NEXT: movzwl D17(%rip), %eax |
| 91 | +; CHECK-NEXT: movw %ax, {{[-0-9]+}}(%r{{[sb]}}p) # 2-byte Spill |
| 92 | +; CHECK-NEXT: movzwl D18(%rip), %eax |
| 93 | +; CHECK-NEXT: movw %ax, {{[-0-9]+}}(%r{{[sb]}}p) # 2-byte Spill |
| 94 | +; CHECK-NEXT: #APP |
| 95 | +; CHECK-NEXT: #NO_APP |
| 96 | +; CHECK-NEXT: movzwl {{[-0-9]+}}(%r{{[sb]}}p), %eax # 2-byte Folded Reload |
| 97 | +; CHECK-NEXT: movw %ax, U0(%rip) |
| 98 | +; CHECK-NEXT: movw %cx, U1(%rip) |
| 99 | +; CHECK-NEXT: movw %dx, U2(%rip) |
| 100 | +; CHECK-NEXT: movw %si, U3(%rip) |
| 101 | +; CHECK-NEXT: movw %di, U4(%rip) |
| 102 | +; CHECK-NEXT: movw %r8w, U5(%rip) |
| 103 | +; CHECK-NEXT: movw %r9w, U6(%rip) |
| 104 | +; CHECK-NEXT: movw %r10w, U7(%rip) |
| 105 | +; CHECK-NEXT: movw %r11w, U8(%rip) |
| 106 | +; CHECK-NEXT: movw %bx, U9(%rip) |
| 107 | +; CHECK-NEXT: movw %bp, U10(%rip) |
| 108 | +; CHECK-NEXT: movw %r14w, U11(%rip) |
| 109 | +; CHECK-NEXT: movw %r15w, U12(%rip) |
| 110 | +; CHECK-NEXT: movw %r12w, U13(%rip) |
| 111 | +; CHECK-NEXT: movw %r13w, U14(%rip) |
| 112 | +; CHECK-NEXT: movzwl {{[-0-9]+}}(%r{{[sb]}}p), %eax # 2-byte Folded Reload |
| 113 | +; CHECK-NEXT: movw %ax, U15(%rip) |
| 114 | +; CHECK-NEXT: movzwl {{[-0-9]+}}(%r{{[sb]}}p), %eax # 2-byte Folded Reload |
| 115 | +; CHECK-NEXT: movw %ax, U16(%rip) |
| 116 | +; CHECK-NEXT: movzwl {{[-0-9]+}}(%r{{[sb]}}p), %eax # 2-byte Folded Reload |
| 117 | +; CHECK-NEXT: movw %ax, U17(%rip) |
| 118 | +; CHECK-NEXT: movzwl {{[-0-9]+}}(%r{{[sb]}}p), %eax # 2-byte Folded Reload |
| 119 | +; CHECK-NEXT: movw %ax, U18(%rip) |
| 120 | +; CHECK-NEXT: popq %rbx |
| 121 | +; CHECK-NEXT: .cfi_def_cfa_offset 48 |
| 122 | +; CHECK-NEXT: popq %r12 |
| 123 | +; CHECK-NEXT: .cfi_def_cfa_offset 40 |
| 124 | +; CHECK-NEXT: popq %r13 |
| 125 | +; CHECK-NEXT: .cfi_def_cfa_offset 32 |
| 126 | +; CHECK-NEXT: popq %r14 |
| 127 | +; CHECK-NEXT: .cfi_def_cfa_offset 24 |
| 128 | +; CHECK-NEXT: popq %r15 |
| 129 | +; CHECK-NEXT: .cfi_def_cfa_offset 16 |
| 130 | +; CHECK-NEXT: popq %rbp |
| 131 | +; CHECK-NEXT: .cfi_def_cfa_offset 8 |
| 132 | +; CHECK-NEXT: retq |
| 133 | +entry: |
| 134 | + %0 = load i16, i16* @D0 |
| 135 | + %1 = load i16, i16* @D1 |
| 136 | + %2 = load i16, i16* @D2 |
| 137 | + %3 = load i16, i16* @D3 |
| 138 | + %4 = load i16, i16* @D4 |
| 139 | + %5 = load i16, i16* @D5 |
| 140 | + %6 = load i16, i16* @D6 |
| 141 | + %7 = load i16, i16* @D7 |
| 142 | + %8 = load i16, i16* @D8 |
| 143 | + %9 = load i16, i16* @D9 |
| 144 | + %10 = load i16, i16* @D10 |
| 145 | + %11 = load i16, i16* @D11 |
| 146 | + %12 = load i16, i16* @D12 |
| 147 | + %13 = load i16, i16* @D13 |
| 148 | + %14 = load i16, i16* @D14 |
| 149 | + %15 = load i16, i16* @D15 |
| 150 | + %16 = load i16, i16* @D16 |
| 151 | + %17 = load i16, i16* @D17 |
| 152 | + %18 = load i16, i16* @D18 |
| 153 | + call void asm sideeffect "", "~{memory}"() #1 |
| 154 | + store i16 %0, i16* @U0 |
| 155 | + store i16 %1, i16* @U1 |
| 156 | + store i16 %2, i16* @U2 |
| 157 | + store i16 %3, i16* @U3 |
| 158 | + store i16 %4, i16* @U4 |
| 159 | + store i16 %5, i16* @U5 |
| 160 | + store i16 %6, i16* @U6 |
| 161 | + store i16 %7, i16* @U7 |
| 162 | + store i16 %8, i16* @U8 |
| 163 | + store i16 %9, i16* @U9 |
| 164 | + store i16 %10, i16* @U10 |
| 165 | + store i16 %11, i16* @U11 |
| 166 | + store i16 %12, i16* @U12 |
| 167 | + store i16 %13, i16* @U13 |
| 168 | + store i16 %14, i16* @U14 |
| 169 | + store i16 %15, i16* @U15 |
| 170 | + store i16 %16, i16* @U16 |
| 171 | + store i16 %17, i16* @U17 |
| 172 | + store i16 %18, i16* @U18 |
| 173 | + ret void |
| 174 | +} |
| 175 | + |
| 176 | +attributes #0 = { mustprogress noinline nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" } |
| 177 | +attributes #1 = { nounwind } |
0 commit comments