11; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
22; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -O1 %s -o - | FileCheck %s
33
4- define amdgpu_ps <4 x float > @caller (ptr %1 ) {
4+ define amdgpu_ps <4 x float > @caller (ptr %ptr ) {
55; CHECK-LABEL: caller:
66; CHECK: ; %bb.0:
77; CHECK-NEXT: flat_load_dword v1, v[0:1]
8- ; CHECK-NEXT: s_getpc_b64 s[0:1]
9- ; CHECK-NEXT: s_add_u32 s0, s0, fn@gotpcrel32@lo+4
10- ; CHECK-NEXT: s_addc_u32 s1, s1, fn@gotpcrel32@hi+12
11- ; CHECK-NEXT: s_load_dwordx2 s[4:5], s[0:1], 0x0
128; CHECK-NEXT: s_mov_b32 s0, 0
139; CHECK-NEXT: s_mov_b32 s1, 0
1410; CHECK-NEXT: s_mov_b32 s2, 0
@@ -17,12 +13,14 @@ define amdgpu_ps <4 x float> @caller(ptr %1) {
1713; CHECK-NEXT: s_mov_b32 s3, 0
1814; CHECK-NEXT: v_mov_b32_e32 v2, 0
1915; CHECK-NEXT: s_mov_b32 s32, 0
20- ; CHECK-NEXT: s_waitcnt lgkmcnt(0)
16+ ; CHECK-NEXT: s_getpc_b64 s[4:5]
17+ ; CHECK-NEXT: s_add_u32 s4, s4, fn@rel32@lo+4
18+ ; CHECK-NEXT: s_addc_u32 s5, s5, fn@rel32@hi+12
2119; CHECK-NEXT: s_swappc_b64 s[30:31], s[4:5]
2220; CHECK-NEXT: ; return to shader part epilog
23- %L = load i32 , ptr %1 , align 4
21+ %L = load i32 , ptr %ptr , align 4
2422 %R = call <4 x float > @fn (<4 x i32 > zeroinitializer , i32 0 , i32 %L , i32 0 )
2523 ret <4 x float > %R
2624}
2725
28- declare <4 x float > @fn (<4 x i32 > inreg , i32 , i32 , i32 )
26+ declare hidden <4 x float > @fn (<4 x i32 > inreg , i32 , i32 , i32 )
0 commit comments