@@ -148,23 +148,35 @@ define amdgpu_ps <2 x half> @test_fmaximum_v2f16_ss(<2 x half> inreg %a, <2 x ha
148148}
149149
; test_fmaximum_v3f16_vv: amdgpu_ps function that passes its two <3 x half>
; arguments to @llvm.maximum.v3f16 and returns the result.
;
; In this diff hunk the shared GCN check lines (marked '-') are replaced by
; separate GFX12-SDAG and GFX12-GISEL check lines (marked '+'). The two new
; prefixes differ only in the second instruction:
;   GFX12-SDAG  expects v_pk_maximum_f16 v1, v1, v3
;   GFX12-GISEL expects v_maximum_f16 v1, v1, v3 (same as the old GCN lines)
; Both still expect v_pk_maximum_f16 v0, v0, v2 as the first instruction.
;
; NOTE(review): the footer removed at the end of this diff calls the prefix
; list autogenerated; presumably these check lines are produced by a script
; and should be regenerated rather than hand-edited - confirm against the
; file header, which is not visible here.
150150define amdgpu_ps <3 x half > @test_fmaximum_v3f16_vv (<3 x half > %a , <3 x half > %b ) {
151- ; GCN-LABEL: test_fmaximum_v3f16_vv:
152- ; GCN: ; %bb.0:
153- ; GCN-NEXT: v_pk_maximum_f16 v0, v0, v2
154- ; GCN-NEXT: v_maximum_f16 v1, v1, v3
155- ; GCN-NEXT: ; return to shader part epilog
151+ ; GFX12-SDAG-LABEL: test_fmaximum_v3f16_vv:
152+ ; GFX12-SDAG: ; %bb.0:
153+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v0, v0, v2
154+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v1, v1, v3
155+ ; GFX12-SDAG-NEXT: ; return to shader part epilog
156+ ;
157+ ; GFX12-GISEL-LABEL: test_fmaximum_v3f16_vv:
158+ ; GFX12-GISEL: ; %bb.0:
159+ ; GFX12-GISEL-NEXT: v_pk_maximum_f16 v0, v0, v2
160+ ; GFX12-GISEL-NEXT: v_maximum_f16 v1, v1, v3
161+ ; GFX12-GISEL-NEXT: ; return to shader part epilog
156162 %val = call <3 x half > @llvm.maximum.v3f16 (<3 x half > %a , <3 x half > %b )
157163 ret <3 x half > %val
158164}
159165
; test_fmaximum_v3f16_ss: amdgpu_ps function whose two <3 x half> arguments
; are both marked inreg; it passes them to @llvm.maximum.v3f16 and returns
; the result.
;
; In this diff hunk the shared GCN check lines (marked '-') are replaced by
; separate GFX12-SDAG and GFX12-GISEL check lines (marked '+'):
;   GFX12-SDAG  expects two packed ops reading the s-registers directly:
;               v_pk_maximum_f16 v0, s0, s2 and v_pk_maximum_f16 v1, s1, s3.
;   GFX12-GISEL keeps the sequence the old GCN lines had:
;               v_pk_maximum_f16 v0, s0, s2, then s_maximum_f16 s0, s1, s3,
;               an s_delay_alu, and v_mov_b32_e32 v1, s0.
;
; NOTE(review): the footer removed at the end of this diff calls the prefix
; list autogenerated; presumably these check lines are produced by a script
; and should be regenerated rather than hand-edited - confirm against the
; file header, which is not visible here.
160166define amdgpu_ps <3 x half > @test_fmaximum_v3f16_ss (<3 x half > inreg %a , <3 x half > inreg %b ) {
161- ; GCN-LABEL: test_fmaximum_v3f16_ss:
162- ; GCN: ; %bb.0:
163- ; GCN-NEXT: v_pk_maximum_f16 v0, s0, s2
164- ; GCN-NEXT: s_maximum_f16 s0, s1, s3
165- ; GCN-NEXT: s_delay_alu instid0(SALU_CYCLE_3)
166- ; GCN-NEXT: v_mov_b32_e32 v1, s0
167- ; GCN-NEXT: ; return to shader part epilog
167+ ; GFX12-SDAG-LABEL: test_fmaximum_v3f16_ss:
168+ ; GFX12-SDAG: ; %bb.0:
169+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v0, s0, s2
170+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v1, s1, s3
171+ ; GFX12-SDAG-NEXT: ; return to shader part epilog
172+ ;
173+ ; GFX12-GISEL-LABEL: test_fmaximum_v3f16_ss:
174+ ; GFX12-GISEL: ; %bb.0:
175+ ; GFX12-GISEL-NEXT: v_pk_maximum_f16 v0, s0, s2
176+ ; GFX12-GISEL-NEXT: s_maximum_f16 s0, s1, s3
177+ ; GFX12-GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_3)
178+ ; GFX12-GISEL-NEXT: v_mov_b32_e32 v1, s0
179+ ; GFX12-GISEL-NEXT: ; return to shader part epilog
168180 %val = call <3 x half > @llvm.maximum.v3f16 (<3 x half > %a , <3 x half > %b )
169181 ret <3 x half > %val
170182}
@@ -306,6 +318,3 @@ declare <4 x half> @llvm.maximum.v4f16(<4 x half>, <4 x half>)
306318declare double @llvm.maximum.f64 (double , double )
307319declare <2 x double > @llvm.maximum.v2f64 (<2 x double >, <2 x double >)
308320declare <4 x double > @llvm.maximum.v4f64 (<4 x double >, <4 x double >)
309- ;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
310- ; GFX12-GISEL: {{.*}}
311- ; GFX12-SDAG: {{.*}}
0 commit comments