Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 8 additions & 0 deletions llvm/include/llvm/CodeGen/SelectionDAGNodes.h
Original file line number Diff line number Diff line change
Expand Up @@ -1497,6 +1497,14 @@ class MemSDNode : public SDNode {
MMO->refineAlignment(NewMMO);
}

void refineRanges(const MachineMemOperand *NewMMO) {
// If this node has range metadata that is different than NewMMO, clear the
// range metadata.
// FIXME: Union the ranges instead?
if (getRanges() && getRanges() != NewMMO->getRanges())
MMO->clearRanges();
}

const SDValue &getChain() const { return getOperand(0); }

const SDValue &getBasePtr() const {
Expand Down
17 changes: 11 additions & 6 deletions llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1275,6 +1275,8 @@ SelectionDAG::AddModifiedNodeToCSEMaps(SDNode *N) {
// to replace the dead one with the existing one. This can cause
// recursive merging of other unrelated nodes down the line.
Existing->intersectFlagsWith(N->getFlags());
if (auto *MemNode = dyn_cast<MemSDNode>(Existing))
MemNode->refineRanges(cast<MemSDNode>(N)->getMemOperand());
ReplaceAllUsesWith(N, Existing);

// N is now dead. Inform the listeners and delete it.
Expand Down Expand Up @@ -9109,8 +9111,9 @@ SDValue SelectionDAG::getAtomic(unsigned Opcode, const SDLoc &dl, EVT MemVT,
ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
ID.AddInteger(MMO->getFlags());
void* IP = nullptr;
if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
cast<AtomicSDNode>(E)->refineAlignment(MMO);
if (auto *E = cast_or_null<AtomicSDNode>(FindNodeOrInsertPos(ID, dl, IP))) {
E->refineAlignment(MMO);
E->refineRanges(MMO);
return SDValue(E, 0);
}

Expand Down Expand Up @@ -9401,8 +9404,9 @@ SDValue SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
ID.AddInteger(MMO->getFlags());
void *IP = nullptr;
if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
cast<LoadSDNode>(E)->refineAlignment(MMO);
if (auto *E = cast_or_null<LoadSDNode>(FindNodeOrInsertPos(ID, dl, IP))) {
E->refineAlignment(MMO);
E->refineRanges(MMO);
return SDValue(E, 0);
}
auto *N = newSDNode<LoadSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs, AM,
Expand Down Expand Up @@ -9622,8 +9626,9 @@ SDValue SelectionDAG::getLoadVP(ISD::MemIndexedMode AM,
ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
ID.AddInteger(MMO->getFlags());
void *IP = nullptr;
if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
cast<VPLoadSDNode>(E)->refineAlignment(MMO);
if (auto *E = cast_or_null<VPLoadSDNode>(FindNodeOrInsertPos(ID, dl, IP))) {
E->refineAlignment(MMO);
E->refineRanges(MMO);
return SDValue(E, 0);
}
auto *N = newSDNode<VPLoadSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs, AM,
Expand Down
40 changes: 40 additions & 0 deletions llvm/test/CodeGen/RISCV/pr145363.ll
Original file line number Diff line number Diff line change
@@ -0,0 +1,40 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc < %s -mtriple=riscv64 | FileCheck %s

; These two loads will CSE, we need to conservatively combine the range
; metadata. The final assembly should not contain an OR.
define i32 @f(ptr %p) {
; CHECK-LABEL: f:
; CHECK: # %bb.0:
; CHECK-NEXT: lw a0, 0(a0)
; CHECK-NEXT: lui a1, 294471
; CHECK-NEXT: addi a1, a1, 1064
; CHECK-NEXT: addw a0, a0, a1
; CHECK-NEXT: ret
%load = load i32, ptr %p, align 4, !range !0
%load2 = load i32, ptr %p, align 4
%add = add i32 1206154280, %load2
ret i32 %add
}

; The mul and getelementptr will get removed in DAGCombine causing the loads
; to CSE after they are created.
define i32 @test(ptr %p, i32 %x, ptr %q) {
; CHECK-LABEL: test:
; CHECK: # %bb.0:
; CHECK-NEXT: lw a1, 0(a0)
; CHECK-NEXT: lui a0, 294471
; CHECK-NEXT: addi a0, a0, 1064
; CHECK-NEXT: addw a0, a1, a0
; CHECK-NEXT: sw a1, 0(a2)
; CHECK-NEXT: ret
%load = load i32, ptr %p, align 4, !range !0
%mul = mul i32 0, %x
%a = getelementptr i32, ptr %p, i32 %mul
%load2 = load i32, ptr %a, align 4
%add = add i32 1206154280, %load2
store i32 %load, ptr %q
ret i32 %add
}

!0 = !{i32 1, i32 2, i32 3, i32 4}