Skip to content

Commit 1030ef3

Browse files
committed
Review changes
1 parent 5bd7c7b commit 1030ef3

File tree

4 files changed

+11
-11
lines changed

4 files changed

+11
-11
lines changed

clang/include/clang/Basic/BuiltinsAMDGPU.def

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -63,8 +63,8 @@ BUILTIN(__builtin_amdgcn_grid_size_z, "Ui", "nc")
6363
BUILTIN(__builtin_amdgcn_mbcnt_hi, "UiUiUi", "nc")
6464
BUILTIN(__builtin_amdgcn_mbcnt_lo, "UiUiUi", "nc")
6565

66-
BUILTIN(__builtin_amdgcn_bcnt032_lo, "UiUi", "nc")
67-
BUILTIN(__builtin_amdgcn_bcnt064_lo, "UiWUi", "nc")
66+
BUILTIN(__builtin_amdgcn_bcnt32_lo, "UiUi", "nc")
67+
BUILTIN(__builtin_amdgcn_bcnt64_lo, "UiWUi", "nc")
6868

6969
TARGET_BUILTIN(__builtin_amdgcn_s_memtime, "WUi", "n", "s-memtime-inst")
7070

llvm/include/llvm/IR/IntrinsicsAMDGPU.td

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -2359,12 +2359,12 @@ def int_amdgcn_mbcnt_hi :
23592359
DefaultAttrsIntrinsic<[llvm_i32_ty], [llvm_i32_ty, llvm_i32_ty],
23602360
[IntrNoMem]>;
23612361

2362-
def int_amdgcn_bcnt032_lo :
2363-
ClangBuiltin<"__builtin_amdgcn_bcnt032_lo">,
2362+
def int_amdgcn_bcnt32_lo :
2363+
ClangBuiltin<"__builtin_amdgcn_bcnt32_lo">,
23642364
DefaultAttrsIntrinsic<[llvm_i32_ty], [llvm_i32_ty], [IntrNoMem]>;
23652365

2366-
def int_amdgcn_bcnt064_lo :
2367-
ClangBuiltin<"__builtin_amdgcn_bcnt064_lo">,
2366+
def int_amdgcn_bcnt64_lo :
2367+
ClangBuiltin<"__builtin_amdgcn_bcnt64_lo">,
23682368
DefaultAttrsIntrinsic<[llvm_i32_ty], [llvm_i64_ty], [IntrNoMem]>;
23692369

23702370
// llvm.amdgcn.ds.swizzle src offset

llvm/lib/Target/AMDGPU/AMDGPUCodeGenPrepare.cpp

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -95,7 +95,7 @@ static cl::opt<bool> DisableFDivExpand(
9595
cl::ReallyHidden,
9696
cl::init(false));
9797

98-
// Disable processing of fdiv so we can better test the backend implementations.
98+
// Disable the transformation of bitsin(typeof(x)) - popcnt(x) into s_bcnt0(x).
9999
static cl::opt<bool>
100100
DisableBcnt0("amdgpu-codegenprepare-disable-bcnt0",
101101
cl::desc("Prevent transforming bitsin(typeof(x)) - "
@@ -2005,8 +2005,8 @@ bool AMDGPUCodeGenPrepareImpl::visitCtpop(IntrinsicInst &I) {
20052005

20062006
IRBuilder<> Builder(MustBeSub);
20072007
Instruction *TransformedIns =
2008-
Builder.CreateIntrinsic(BitWidth > 32 ? Intrinsic::amdgcn_bcnt064_lo
2009-
: Intrinsic::amdgcn_bcnt032_lo,
2008+
Builder.CreateIntrinsic(BitWidth > 32 ? Intrinsic::amdgcn_bcnt64_lo
2009+
: Intrinsic::amdgcn_bcnt32_lo,
20102010
{}, {I.getArgOperand(0)});
20112011

20122012
if ((DestinationWidth = MustBeSub->getType()->getIntegerBitWidth()) !=

llvm/lib/Target/AMDGPU/SOPInstructions.td

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -265,10 +265,10 @@ def S_BREV_B64 : SOP1_64 <"s_brev_b64",
265265

266266
let Defs = [SCC] in {
267267
def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32",
268-
[(set i32:$sdst, (UniformUnaryFrag<int_amdgcn_bcnt032_lo> i32:$src0))]
268+
[(set i32:$sdst, (UniformUnaryFrag<int_amdgcn_bcnt32_lo> i32:$src0))]
269269
>;
270270
def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64",
271-
[(set i32:$sdst, (UniformUnaryFrag<int_amdgcn_bcnt064_lo> i64:$src0))]
271+
[(set i32:$sdst, (UniformUnaryFrag<int_amdgcn_bcnt64_lo> i64:$src0))]
272272
>;
273273
def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32",
274274
[(set i32:$sdst, (UniformUnaryFrag<ctpop> i32:$src0))]

0 commit comments

Comments
 (0)