Skip to content

Commit cf67fcf

Browse files
AmrDeveloper authored and lanza committed
[CIR][CIRGen][Builtin][Neon] Lower vmaxv_s32 (#1533)
Lower vmaxv_s32
1 parent 7ec6a86 commit cf67fcf

File tree

2 files changed

+13
-7
lines changed

2 files changed

+13
-7
lines changed

clang/lib/CIR/CodeGen/CIRGenBuiltinAArch64.cpp

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2786,7 +2786,8 @@ static mlir::Value emitCommonNeonSISDBuiltinExpr(
27862786
return emitNeonCall(builder, {argTy}, ops, "aarch64.neon.fmaxv", resultTy,
27872787
loc);
27882788
case NEON::BI__builtin_neon_vmaxv_s32:
2789-
llvm_unreachable(" neon_vmaxv_s32 NYI ");
2789+
return emitNeonCall(builder, {argTy}, ops, "aarch64.neon.smaxv", resultTy,
2790+
loc);
27902791
case NEON::BI__builtin_neon_vmaxv_u32:
27912792
llvm_unreachable(" neon_vmaxv_u32 NYI ");
27922793
case NEON::BI__builtin_neon_vmaxvq_f32:

clang/test/CIR/CodeGen/AArch64/neon.c

Lines changed: 11 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -19221,12 +19221,17 @@ float64x1_t test_vmax_f64(float64x1_t a, float64x1_t b) {
1922119221
// return vminv_u32(a);
1922219222
// }
1922319223

19224-
// NYI-LABEL: @test_vmaxv_s32(
19225-
// NYI: [[VMAXV_S32_I:%.*]] = call i32 @llvm.aarch64.neon.smaxv.i32.v2i32(<2 x i32> %a)
19226-
// NYI: ret i32 [[VMAXV_S32_I]]
19227-
// int32_t test_vmaxv_s32(int32x2_t a) {
19228-
// return vmaxv_s32(a);
19229-
// }
19224+
int32_t test_vmaxv_s32(int32x2_t a) {
19225+
return vmaxv_s32(a);
19226+
19227+
// CIR-LABEL: vmaxv_s32
19228+
// CIR: cir.llvm.intrinsic "aarch64.neon.smaxv" {{%.*}} : (!cir.vector<!s32i x 2>) -> !s32i
19229+
19230+
// LLVM-LABEL: @test_vmaxv_s32
19231+
// LLVM-SAME: (<2 x i32> [[a:%.*]])
19232+
// LLVM: [[VMAXV_S32_I:%.*]] = call i32 @llvm.aarch64.neon.smaxv.i32.v2i32(<2 x i32> [[a]])
19233+
// LLVM: ret i32 [[VMAXV_S32_I]]
19234+
}
1923019235

1923119236
// NYI-LABEL: @test_vmaxv_u32(
1923219237
// NYI: [[VMAXV_U32_I:%.*]] = call i32 @llvm.aarch64.neon.umaxv.i32.v2i32(<2 x i32> %a)

0 commit comments

Comments
 (0)