Skip to content

Commit cb5fe84

Browse files
Automerge: [CIR] Upstream CIR codegen for vec_ext x86 builtins (#167942)
This PR upstreams the codegen for the x86 vec_ext builtins from the incubator. It is part of #167752.
2 parents 1a750ed + e02fdf0 commit cb5fe84

File tree

6 files changed

+59
-31
lines changed

6 files changed

+59
-31
lines changed

clang/lib/CIR/CodeGen/CIRGenBuilder.h

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -315,8 +315,10 @@ class CIRGenBuilderTy : public cir::CIRBaseBuilderTy {
315315
return getConstantInt(loc, getUInt32Ty(), c);
316316
}
317317
cir::ConstantOp getSInt64(uint64_t c, mlir::Location loc) {
318-
cir::IntType sInt64Ty = getSInt64Ty();
319-
return cir::ConstantOp::create(*this, loc, cir::IntAttr::get(sInt64Ty, c));
318+
return getConstantInt(loc, getSInt64Ty(), c);
319+
}
320+
cir::ConstantOp getUInt64(uint64_t c, mlir::Location loc) {
321+
return getConstantInt(loc, getUInt64Ty(), c);
320322
}
321323

322324
mlir::Value createNeg(mlir::Value value) {

clang/lib/CIR/CodeGen/CIRGenBuiltin.cpp

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -630,6 +630,22 @@ CIRGenFunction::emitTargetBuiltinExpr(unsigned builtinID, const CallExpr *e,
630630
getTarget().getTriple().getArch());
631631
}
632632

633+
mlir::Value CIRGenFunction::emitScalarOrConstFoldImmArg(
634+
const unsigned iceArguments, const unsigned idx, const Expr *argExpr) {
635+
mlir::Value arg = {};
636+
if ((iceArguments & (1 << idx)) == 0) {
637+
arg = emitScalarExpr(argExpr);
638+
} else {
639+
// If this is required to be a constant, constant fold it so that we
640+
// know that the generated intrinsic gets a ConstantInt.
641+
const std::optional<llvm::APSInt> result =
642+
argExpr->getIntegerConstantExpr(getContext());
643+
assert(result && "Expected argument to be a constant");
644+
arg = builder.getConstInt(getLoc(argExpr->getSourceRange()), *result);
645+
}
646+
return arg;
647+
}
648+
633649
/// Given a builtin id for a function like "__builtin_fabsf", return a Function*
634650
/// for "fabsf".
635651
cir::FuncOp CIRGenModule::getBuiltinLibFunction(const FunctionDecl *fd,

clang/lib/CIR/CodeGen/CIRGenBuiltinX86.cpp

Lines changed: 21 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,6 @@
1616
#include "clang/Basic/Builtins.h"
1717
#include "clang/Basic/TargetBuiltins.h"
1818
#include "clang/CIR/MissingFeatures.h"
19-
#include "llvm/IR/IntrinsicsX86.h"
2019

2120
using namespace clang;
2221
using namespace clang::CIRGen;
@@ -66,9 +65,8 @@ mlir::Value CIRGenFunction::emitX86BuiltinExpr(unsigned builtinID,
6665
getContext().GetBuiltinType(builtinID, error, &iceArguments);
6766
assert(error == ASTContext::GE_None && "Error while getting builtin type.");
6867

69-
for (auto [idx, arg] : llvm::enumerate(e->arguments())) {
68+
for (auto [idx, arg] : llvm::enumerate(e->arguments()))
7069
ops.push_back(emitScalarOrConstFoldImmArg(iceArguments, idx, arg));
71-
}
7270

7371
CIRGenBuilderTy &builder = getBuilder();
7472
mlir::Type voidTy = builder.getVoidTy();
@@ -98,6 +96,10 @@ mlir::Value CIRGenFunction::emitX86BuiltinExpr(unsigned builtinID,
9896
case X86::BI__builtin_ia32_undef128:
9997
case X86::BI__builtin_ia32_undef256:
10098
case X86::BI__builtin_ia32_undef512:
99+
cgm.errorNYI(e->getSourceRange(),
100+
std::string("unimplemented X86 builtin call: ") +
101+
getContext().BuiltinInfo.getName(builtinID));
102+
return {};
101103
case X86::BI__builtin_ia32_vec_ext_v4hi:
102104
case X86::BI__builtin_ia32_vec_ext_v16qi:
103105
case X86::BI__builtin_ia32_vec_ext_v8hi:
@@ -107,7 +109,22 @@ mlir::Value CIRGenFunction::emitX86BuiltinExpr(unsigned builtinID,
107109
case X86::BI__builtin_ia32_vec_ext_v32qi:
108110
case X86::BI__builtin_ia32_vec_ext_v16hi:
109111
case X86::BI__builtin_ia32_vec_ext_v8si:
110-
case X86::BI__builtin_ia32_vec_ext_v4di:
112+
case X86::BI__builtin_ia32_vec_ext_v4di: {
113+
unsigned numElts = cast<cir::VectorType>(ops[0].getType()).getSize();
114+
115+
uint64_t index =
116+
ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
117+
118+
index &= numElts - 1;
119+
120+
cir::ConstantOp indexVal =
121+
builder.getUInt64(index, getLoc(e->getExprLoc()));
122+
123+
// These builtins exist so we can ensure the index is an ICE and in range.
124+
// Otherwise we could just do this in the header file.
125+
return cir::VecExtractOp::create(builder, getLoc(e->getExprLoc()), ops[0],
126+
indexVal);
127+
}
111128
case X86::BI__builtin_ia32_vec_set_v4hi:
112129
case X86::BI__builtin_ia32_vec_set_v16qi:
113130
case X86::BI__builtin_ia32_vec_set_v8hi:

clang/lib/CIR/CodeGen/CIRGenExprScalar.cpp

Lines changed: 0 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -1442,28 +1442,6 @@ mlir::Value CIRGenFunction::emitPromotedScalarExpr(const Expr *e,
14421442
return ScalarExprEmitter(*this, builder).Visit(const_cast<Expr *>(e));
14431443
}
14441444

1445-
mlir::Value CIRGenFunction::emitScalarOrConstFoldImmArg(unsigned iceArguments,
1446-
unsigned index,
1447-
const Expr *arg) {
1448-
mlir::Value result{};
1449-
1450-
// The bit at the specified index indicates whether the argument is required
1451-
// to be a constant integer expression.
1452-
bool isArgRequiredToBeConstant = (iceArguments & (1 << index));
1453-
1454-
if (!isArgRequiredToBeConstant) {
1455-
result = emitScalarExpr(arg);
1456-
} else {
1457-
// If this is required to be a constant, constant fold it so that we
1458-
// know that the generated intrinsic gets a ConstantInt.
1459-
std::optional<llvm::APSInt> iceOpt =
1460-
arg->getIntegerConstantExpr(getContext());
1461-
assert(iceOpt && "Expected argument to be a constant");
1462-
result = builder.getConstInt(getLoc(arg->getSourceRange()), *iceOpt);
1463-
}
1464-
return result;
1465-
}
1466-
14671445
[[maybe_unused]] static bool mustVisitNullValue(const Expr *e) {
14681446
// If a null pointer expression's type is the C++0x nullptr_t and
14691447
// the expression is not a simple literal, it must be evaluated

clang/lib/CIR/CodeGen/CIRGenFunction.h

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1546,9 +1546,6 @@ class CIRGenFunction : public CIRGenTypeCache {
15461546
mlir::Value emitScalarExpr(const clang::Expr *e,
15471547
bool ignoreResultAssign = false);
15481548

1549-
mlir::Value emitScalarOrConstFoldImmArg(unsigned iceArguments, unsigned index,
1550-
const Expr *arg);
1551-
15521549
mlir::Value emitScalarPrePostIncDec(const UnaryOperator *e, LValue lv,
15531550
cir::UnaryOpKind kind, bool isPre);
15541551

@@ -1721,6 +1718,9 @@ class CIRGenFunction : public CIRGenTypeCache {
17211718
void emitScalarInit(const clang::Expr *init, mlir::Location loc,
17221719
LValue lvalue, bool capturedByInit = false);
17231720

1721+
mlir::Value emitScalarOrConstFoldImmArg(unsigned iceArguments, unsigned idx,
1722+
const Expr *argExpr);
1723+
17241724
void emitStaticVarDecl(const VarDecl &d, cir::GlobalLinkageKind linkage);
17251725

17261726
void emitStoreOfComplex(mlir::Location loc, mlir::Value v, LValue dest,

clang/test/CIR/CodeGen/X86/sse2-builtins.c

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,21 @@
1616

1717
#include <immintrin.h>
1818

19+
// Lowering to pextrw requires optimization.
20+
int test_mm_extract_epi16(__m128i A) {
21+
// CIR-LABEL: test_mm_extract_epi16
22+
// CIR %{{.*}} = cir.vec.extract %{{.*}}[%{{.*}} : {{!u32i|!u64i}}] : !cir.vector<!s16i x 8>
23+
// CIR %{{.*}} = cir.cast integral %{{.*}} : !u16i -> !s32i
24+
25+
// LLVM-LABEL: test_mm_extract_epi16
26+
// LLVM: extractelement <8 x i16> %{{.*}}, {{i32|i64}} 1
27+
// LLVM: zext i16 %{{.*}} to i32
28+
29+
// OGCG-LABEL: test_mm_extract_epi16
30+
// OGCG: extractelement <8 x i16> %{{.*}}, {{i32|i64}} 1
31+
// OGCG: zext i16 %{{.*}} to i32
32+
return _mm_extract_epi16(A, 1);
33+
}
1934

2035
void test_mm_clflush(void* A) {
2136
// CIR-LABEL: test_mm_clflush

0 commit comments

Comments
 (0)