|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
2 | 2 | ; RUN: llc -mtriple=riscv32 -relocation-model=pic -verify-machineinstrs < %s \ |
3 | | -; RUN: | FileCheck -check-prefixes=RV32I %s |
| 3 | +; RUN: | FileCheck -check-prefixes=RV32I,RV32NOFUSION %s |
4 | 4 | ; RUN: llc -mtriple=riscv64 -relocation-model=pic -verify-machineinstrs < %s \ |
5 | | -; RUN: | FileCheck -check-prefixes=RV64I %s |
| 5 | +; RUN: | FileCheck -check-prefixes=RV64I,RV64NOFUSION %s |
| 6 | +; RUN: llc -mtriple=riscv32 -relocation-model=pic -verify-machineinstrs < %s \ |
| 7 | +; RUN: -mattr=+auipc-addi-fusion | FileCheck -check-prefixes=RV32I,RV32FUSION %s |
| 8 | +; RUN: llc -mtriple=riscv64 -relocation-model=pic -verify-machineinstrs < %s \ |
| 9 | +; RUN: -mattr=+auipc-addi-fusion | FileCheck -check-prefixes=RV64I,RV64FUSION %s |
6 | 10 |
|
7 | 11 | ; Verifies that MachineLICM can hoist address generation pseudos out of loops, both with and without the auipc-addi-fusion feature enabled. |
8 | 12 |
|
@@ -141,59 +145,113 @@ ret: |
141 | 145 | @gd = external thread_local global i32 |
142 | 146 |
|
143 | 147 | define void @test_la_tls_gd(i32 signext %n) nounwind { |
144 | | -; RV32I-LABEL: test_la_tls_gd: |
145 | | -; RV32I: # %bb.0: # %entry |
146 | | -; RV32I-NEXT: addi sp, sp, -16 |
147 | | -; RV32I-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
148 | | -; RV32I-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
149 | | -; RV32I-NEXT: sw s1, 4(sp) # 4-byte Folded Spill |
150 | | -; RV32I-NEXT: sw s2, 0(sp) # 4-byte Folded Spill |
151 | | -; RV32I-NEXT: mv s0, a0 |
152 | | -; RV32I-NEXT: li s2, 0 |
153 | | -; RV32I-NEXT: .Lpcrel_hi3: |
154 | | -; RV32I-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
155 | | -; RV32I-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
156 | | -; RV32I-NEXT: .LBB3_1: # %loop |
157 | | -; RV32I-NEXT: # =>This Inner Loop Header: Depth=1 |
158 | | -; RV32I-NEXT: mv a0, s1 |
159 | | -; RV32I-NEXT: call __tls_get_addr |
160 | | -; RV32I-NEXT: lw zero, 0(a0) |
161 | | -; RV32I-NEXT: addi s2, s2, 1 |
162 | | -; RV32I-NEXT: blt s2, s0, .LBB3_1 |
163 | | -; RV32I-NEXT: # %bb.2: # %ret |
164 | | -; RV32I-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
165 | | -; RV32I-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
166 | | -; RV32I-NEXT: lw s1, 4(sp) # 4-byte Folded Reload |
167 | | -; RV32I-NEXT: lw s2, 0(sp) # 4-byte Folded Reload |
168 | | -; RV32I-NEXT: addi sp, sp, 16 |
169 | | -; RV32I-NEXT: ret |
| 148 | +; RV32NOFUSION-LABEL: test_la_tls_gd: |
| 149 | +; RV32NOFUSION: # %bb.0: # %entry |
| 150 | +; RV32NOFUSION-NEXT: addi sp, sp, -16 |
| 151 | +; RV32NOFUSION-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
| 152 | +; RV32NOFUSION-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
| 153 | +; RV32NOFUSION-NEXT: sw s1, 4(sp) # 4-byte Folded Spill |
| 154 | +; RV32NOFUSION-NEXT: sw s2, 0(sp) # 4-byte Folded Spill |
| 155 | +; RV32NOFUSION-NEXT: mv s0, a0 |
| 156 | +; RV32NOFUSION-NEXT: li s2, 0 |
| 157 | +; RV32NOFUSION-NEXT: .Lpcrel_hi3: |
| 158 | +; RV32NOFUSION-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
| 159 | +; RV32NOFUSION-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
| 160 | +; RV32NOFUSION-NEXT: .LBB3_1: # %loop |
| 161 | +; RV32NOFUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 162 | +; RV32NOFUSION-NEXT: mv a0, s1 |
| 163 | +; RV32NOFUSION-NEXT: call __tls_get_addr |
| 164 | +; RV32NOFUSION-NEXT: lw zero, 0(a0) |
| 165 | +; RV32NOFUSION-NEXT: addi s2, s2, 1 |
| 166 | +; RV32NOFUSION-NEXT: blt s2, s0, .LBB3_1 |
| 167 | +; RV32NOFUSION-NEXT: # %bb.2: # %ret |
| 168 | +; RV32NOFUSION-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
| 169 | +; RV32NOFUSION-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
| 170 | +; RV32NOFUSION-NEXT: lw s1, 4(sp) # 4-byte Folded Reload |
| 171 | +; RV32NOFUSION-NEXT: lw s2, 0(sp) # 4-byte Folded Reload |
| 172 | +; RV32NOFUSION-NEXT: addi sp, sp, 16 |
| 173 | +; RV32NOFUSION-NEXT: ret |
170 | 174 | ; |
171 | | -; RV64I-LABEL: test_la_tls_gd: |
172 | | -; RV64I: # %bb.0: # %entry |
173 | | -; RV64I-NEXT: addi sp, sp, -32 |
174 | | -; RV64I-NEXT: sd ra, 24(sp) # 8-byte Folded Spill |
175 | | -; RV64I-NEXT: sd s0, 16(sp) # 8-byte Folded Spill |
176 | | -; RV64I-NEXT: sd s1, 8(sp) # 8-byte Folded Spill |
177 | | -; RV64I-NEXT: sd s2, 0(sp) # 8-byte Folded Spill |
178 | | -; RV64I-NEXT: mv s0, a0 |
179 | | -; RV64I-NEXT: li s2, 0 |
180 | | -; RV64I-NEXT: .Lpcrel_hi3: |
181 | | -; RV64I-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
182 | | -; RV64I-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
183 | | -; RV64I-NEXT: .LBB3_1: # %loop |
184 | | -; RV64I-NEXT: # =>This Inner Loop Header: Depth=1 |
185 | | -; RV64I-NEXT: mv a0, s1 |
186 | | -; RV64I-NEXT: call __tls_get_addr |
187 | | -; RV64I-NEXT: lw zero, 0(a0) |
188 | | -; RV64I-NEXT: addiw s2, s2, 1 |
189 | | -; RV64I-NEXT: blt s2, s0, .LBB3_1 |
190 | | -; RV64I-NEXT: # %bb.2: # %ret |
191 | | -; RV64I-NEXT: ld ra, 24(sp) # 8-byte Folded Reload |
192 | | -; RV64I-NEXT: ld s0, 16(sp) # 8-byte Folded Reload |
193 | | -; RV64I-NEXT: ld s1, 8(sp) # 8-byte Folded Reload |
194 | | -; RV64I-NEXT: ld s2, 0(sp) # 8-byte Folded Reload |
195 | | -; RV64I-NEXT: addi sp, sp, 32 |
196 | | -; RV64I-NEXT: ret |
| 175 | +; RV64NOFUSION-LABEL: test_la_tls_gd: |
| 176 | +; RV64NOFUSION: # %bb.0: # %entry |
| 177 | +; RV64NOFUSION-NEXT: addi sp, sp, -32 |
| 178 | +; RV64NOFUSION-NEXT: sd ra, 24(sp) # 8-byte Folded Spill |
| 179 | +; RV64NOFUSION-NEXT: sd s0, 16(sp) # 8-byte Folded Spill |
| 180 | +; RV64NOFUSION-NEXT: sd s1, 8(sp) # 8-byte Folded Spill |
| 181 | +; RV64NOFUSION-NEXT: sd s2, 0(sp) # 8-byte Folded Spill |
| 182 | +; RV64NOFUSION-NEXT: mv s0, a0 |
| 183 | +; RV64NOFUSION-NEXT: li s2, 0 |
| 184 | +; RV64NOFUSION-NEXT: .Lpcrel_hi3: |
| 185 | +; RV64NOFUSION-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
| 186 | +; RV64NOFUSION-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
| 187 | +; RV64NOFUSION-NEXT: .LBB3_1: # %loop |
| 188 | +; RV64NOFUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 189 | +; RV64NOFUSION-NEXT: mv a0, s1 |
| 190 | +; RV64NOFUSION-NEXT: call __tls_get_addr |
| 191 | +; RV64NOFUSION-NEXT: lw zero, 0(a0) |
| 192 | +; RV64NOFUSION-NEXT: addiw s2, s2, 1 |
| 193 | +; RV64NOFUSION-NEXT: blt s2, s0, .LBB3_1 |
| 194 | +; RV64NOFUSION-NEXT: # %bb.2: # %ret |
| 195 | +; RV64NOFUSION-NEXT: ld ra, 24(sp) # 8-byte Folded Reload |
| 196 | +; RV64NOFUSION-NEXT: ld s0, 16(sp) # 8-byte Folded Reload |
| 197 | +; RV64NOFUSION-NEXT: ld s1, 8(sp) # 8-byte Folded Reload |
| 198 | +; RV64NOFUSION-NEXT: ld s2, 0(sp) # 8-byte Folded Reload |
| 199 | +; RV64NOFUSION-NEXT: addi sp, sp, 32 |
| 200 | +; RV64NOFUSION-NEXT: ret |
| 201 | +; |
| 202 | +; RV32FUSION-LABEL: test_la_tls_gd: |
| 203 | +; RV32FUSION: # %bb.0: # %entry |
| 204 | +; RV32FUSION-NEXT: addi sp, sp, -16 |
| 205 | +; RV32FUSION-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
| 206 | +; RV32FUSION-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
| 207 | +; RV32FUSION-NEXT: sw s1, 4(sp) # 4-byte Folded Spill |
| 208 | +; RV32FUSION-NEXT: sw s2, 0(sp) # 4-byte Folded Spill |
| 209 | +; RV32FUSION-NEXT: mv s0, a0 |
| 210 | +; RV32FUSION-NEXT: li s2, 0 |
| 211 | +; RV32FUSION-NEXT: .Lpcrel_hi3: |
| 212 | +; RV32FUSION-NEXT: auipc s1, %tls_gd_pcrel_hi(gd) |
| 213 | +; RV32FUSION-NEXT: addi s1, s1, %pcrel_lo(.Lpcrel_hi3) |
| 214 | +; RV32FUSION-NEXT: .LBB3_1: # %loop |
| 215 | +; RV32FUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 216 | +; RV32FUSION-NEXT: mv a0, s1 |
| 217 | +; RV32FUSION-NEXT: call __tls_get_addr |
| 218 | +; RV32FUSION-NEXT: lw zero, 0(a0) |
| 219 | +; RV32FUSION-NEXT: addi s2, s2, 1 |
| 220 | +; RV32FUSION-NEXT: blt s2, s0, .LBB3_1 |
| 221 | +; RV32FUSION-NEXT: # %bb.2: # %ret |
| 222 | +; RV32FUSION-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
| 223 | +; RV32FUSION-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
| 224 | +; RV32FUSION-NEXT: lw s1, 4(sp) # 4-byte Folded Reload |
| 225 | +; RV32FUSION-NEXT: lw s2, 0(sp) # 4-byte Folded Reload |
| 226 | +; RV32FUSION-NEXT: addi sp, sp, 16 |
| 227 | +; RV32FUSION-NEXT: ret |
| 228 | +; |
| 229 | +; RV64FUSION-LABEL: test_la_tls_gd: |
| 230 | +; RV64FUSION: # %bb.0: # %entry |
| 231 | +; RV64FUSION-NEXT: addi sp, sp, -32 |
| 232 | +; RV64FUSION-NEXT: sd ra, 24(sp) # 8-byte Folded Spill |
| 233 | +; RV64FUSION-NEXT: sd s0, 16(sp) # 8-byte Folded Spill |
| 234 | +; RV64FUSION-NEXT: sd s1, 8(sp) # 8-byte Folded Spill |
| 235 | +; RV64FUSION-NEXT: sd s2, 0(sp) # 8-byte Folded Spill |
| 236 | +; RV64FUSION-NEXT: mv s0, a0 |
| 237 | +; RV64FUSION-NEXT: li s2, 0 |
| 238 | +; RV64FUSION-NEXT: .Lpcrel_hi3: |
| 239 | +; RV64FUSION-NEXT: auipc s1, %tls_gd_pcrel_hi(gd) |
| 240 | +; RV64FUSION-NEXT: addi s1, s1, %pcrel_lo(.Lpcrel_hi3) |
| 241 | +; RV64FUSION-NEXT: .LBB3_1: # %loop |
| 242 | +; RV64FUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 243 | +; RV64FUSION-NEXT: mv a0, s1 |
| 244 | +; RV64FUSION-NEXT: call __tls_get_addr |
| 245 | +; RV64FUSION-NEXT: lw zero, 0(a0) |
| 246 | +; RV64FUSION-NEXT: addiw s2, s2, 1 |
| 247 | +; RV64FUSION-NEXT: blt s2, s0, .LBB3_1 |
| 248 | +; RV64FUSION-NEXT: # %bb.2: # %ret |
| 249 | +; RV64FUSION-NEXT: ld ra, 24(sp) # 8-byte Folded Reload |
| 250 | +; RV64FUSION-NEXT: ld s0, 16(sp) # 8-byte Folded Reload |
| 251 | +; RV64FUSION-NEXT: ld s1, 8(sp) # 8-byte Folded Reload |
| 252 | +; RV64FUSION-NEXT: ld s2, 0(sp) # 8-byte Folded Reload |
| 253 | +; RV64FUSION-NEXT: addi sp, sp, 32 |
| 254 | +; RV64FUSION-NEXT: ret |
197 | 255 | entry: |
198 | 256 | br label %loop |
199 | 257 |
|
|
0 commit comments