@@ -148,23 +148,35 @@ define amdgpu_ps <2 x half> @test_fmaximum_v2f16_ss(<2 x half> inreg %a, <2 x ha
148
148
}
149
149
150
150
define amdgpu_ps <3 x half > @test_fmaximum_v3f16_vv (<3 x half > %a , <3 x half > %b ) {
151
- ; GCN-LABEL: test_fmaximum_v3f16_vv:
152
- ; GCN: ; %bb.0:
153
- ; GCN-NEXT: v_pk_maximum_f16 v0, v0, v2
154
- ; GCN-NEXT: v_maximum_f16 v1, v1, v3
155
- ; GCN-NEXT: ; return to shader part epilog
151
+ ; GFX12-SDAG-LABEL: test_fmaximum_v3f16_vv:
152
+ ; GFX12-SDAG: ; %bb.0:
153
+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v0, v0, v2
154
+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v1, v1, v3
155
+ ; GFX12-SDAG-NEXT: ; return to shader part epilog
156
+ ;
157
+ ; GFX12-GISEL-LABEL: test_fmaximum_v3f16_vv:
158
+ ; GFX12-GISEL: ; %bb.0:
159
+ ; GFX12-GISEL-NEXT: v_pk_maximum_f16 v0, v0, v2
160
+ ; GFX12-GISEL-NEXT: v_maximum_f16 v1, v1, v3
161
+ ; GFX12-GISEL-NEXT: ; return to shader part epilog
156
162
%val = call <3 x half > @llvm.maximum.v3f16 (<3 x half > %a , <3 x half > %b )
157
163
ret <3 x half > %val
158
164
}
159
165
160
166
define amdgpu_ps <3 x half > @test_fmaximum_v3f16_ss (<3 x half > inreg %a , <3 x half > inreg %b ) {
161
- ; GCN-LABEL: test_fmaximum_v3f16_ss:
162
- ; GCN: ; %bb.0:
163
- ; GCN-NEXT: v_pk_maximum_f16 v0, s0, s2
164
- ; GCN-NEXT: s_maximum_f16 s0, s1, s3
165
- ; GCN-NEXT: s_delay_alu instid0(SALU_CYCLE_3)
166
- ; GCN-NEXT: v_mov_b32_e32 v1, s0
167
- ; GCN-NEXT: ; return to shader part epilog
167
+ ; GFX12-SDAG-LABEL: test_fmaximum_v3f16_ss:
168
+ ; GFX12-SDAG: ; %bb.0:
169
+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v0, s0, s2
170
+ ; GFX12-SDAG-NEXT: v_pk_maximum_f16 v1, s1, s3
171
+ ; GFX12-SDAG-NEXT: ; return to shader part epilog
172
+ ;
173
+ ; GFX12-GISEL-LABEL: test_fmaximum_v3f16_ss:
174
+ ; GFX12-GISEL: ; %bb.0:
175
+ ; GFX12-GISEL-NEXT: v_pk_maximum_f16 v0, s0, s2
176
+ ; GFX12-GISEL-NEXT: s_maximum_f16 s0, s1, s3
177
+ ; GFX12-GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_3)
178
+ ; GFX12-GISEL-NEXT: v_mov_b32_e32 v1, s0
179
+ ; GFX12-GISEL-NEXT: ; return to shader part epilog
168
180
%val = call <3 x half > @llvm.maximum.v3f16 (<3 x half > %a , <3 x half > %b )
169
181
ret <3 x half > %val
170
182
}
@@ -306,6 +318,3 @@ declare <4 x half> @llvm.maximum.v4f16(<4 x half>, <4 x half>)
306
318
declare double @llvm.maximum.f64 (double , double )
307
319
declare <2 x double > @llvm.maximum.v2f64 (<2 x double >, <2 x double >)
308
320
declare <4 x double > @llvm.maximum.v4f64 (<4 x double >, <4 x double >)
309
- ;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
310
- ; GFX12-GISEL: {{.*}}
311
- ; GFX12-SDAG: {{.*}}
0 commit comments