|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
| 2 | +; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -O1 %s -o - | FileCheck %s |
| 3 | + |
| 4 | +define amdgpu_ps <4 x float> @caller(ptr %1) { |
| 5 | +; CHECK-LABEL: caller: |
| 6 | +; CHECK: ; %bb.0: |
| 7 | +; CHECK-NEXT: flat_load_dword v1, v[0:1] |
| 8 | +; CHECK-NEXT: s_getpc_b64 s[0:1] |
| 9 | +; CHECK-NEXT: s_add_u32 s0, s0, fn@gotpcrel32@lo+4 |
| 10 | +; CHECK-NEXT: s_addc_u32 s1, s1, fn@gotpcrel32@hi+12 |
| 11 | +; CHECK-NEXT: s_load_dwordx2 s[4:5], s[0:1], 0x0 |
| 12 | +; CHECK-NEXT: s_mov_b32 s0, 0 |
| 13 | +; CHECK-NEXT: s_mov_b32 s1, 0 |
| 14 | +; CHECK-NEXT: s_mov_b32 s2, 0 |
| 15 | +; CHECK-NEXT: s_mov_b64 s[8:9], 36 |
| 16 | +; CHECK-NEXT: v_mov_b32_e32 v0, 0 |
| 17 | +; CHECK-NEXT: s_mov_b32 s3, 0 |
| 18 | +; CHECK-NEXT: v_mov_b32_e32 v2, 0 |
| 19 | +; CHECK-NEXT: s_mov_b32 s32, 0 |
| 20 | +; CHECK-NEXT: s_waitcnt lgkmcnt(0) |
| 21 | +; CHECK-NEXT: s_swappc_b64 s[30:31], s[4:5] |
| 22 | +; CHECK-NEXT: ; return to shader part epilog |
| 23 | + %L = load i32, ptr %1, align 4 |
| 24 | + %R = call <4 x float> @fn(<4 x i32> zeroinitializer, i32 0, i32 %L, i32 0) |
| 25 | + ret <4 x float> %R |
| 26 | +} |
| 27 | + |
| 28 | +declare <4 x float> @fn(<4 x i32> inreg, i32, i32, i32) |
0 commit comments