[llvm] r245172 - Revert "Add support for cross block dse. This patch enables dead stroe elimination across basicblocks."
David Majnemer via llvm-commits
llvm-commits at lists.llvm.org
Sun Aug 16 00:12:00 PDT 2015
Author: majnemer
Date: Sun Aug 16 02:11:59 2015
New Revision: 245172
URL: http://llvm.org/viewvc/llvm-project?rev=245172&view=rev
Log:
Revert "Add support for cross block dse. This patch enables dead stroe elimination across basicblocks."
This reverts commit r245025, it caused PR24469.
Removed:
llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse.ll
llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse_loop.ll
Modified:
llvm/trunk/lib/Transforms/Scalar/DeadStoreElimination.cpp
Modified: llvm/trunk/lib/Transforms/Scalar/DeadStoreElimination.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Transforms/Scalar/DeadStoreElimination.cpp?rev=245172&r1=245171&r2=245172&view=diff
==============================================================================
--- llvm/trunk/lib/Transforms/Scalar/DeadStoreElimination.cpp (original)
+++ llvm/trunk/lib/Transforms/Scalar/DeadStoreElimination.cpp Sun Aug 16 02:11:59 2015
@@ -16,16 +16,13 @@
//===----------------------------------------------------------------------===//
#include "llvm/Transforms/Scalar.h"
-#include "llvm/ADT/DenseSet.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SetVector.h"
#include "llvm/ADT/Statistic.h"
#include "llvm/Analysis/AliasAnalysis.h"
#include "llvm/Analysis/CaptureTracking.h"
-#include "llvm/Analysis/CFG.h"
#include "llvm/Analysis/MemoryBuiltins.h"
#include "llvm/Analysis/MemoryDependenceAnalysis.h"
-#include "llvm/Analysis/PostDominators.h"
#include "llvm/Analysis/TargetLibraryInfo.h"
#include "llvm/Analysis/ValueTracking.h"
#include "llvm/IR/Constants.h"
@@ -45,7 +42,6 @@ using namespace llvm;
STATISTIC(NumRedundantStores, "Number of redundant stores deleted");
STATISTIC(NumFastStores, "Number of stores deleted");
-STATISTIC(NumCrossBlockStores, "Number of cross block stores deleted");
STATISTIC(NumFastOther , "Number of other instrs removed");
namespace {
@@ -53,41 +49,12 @@ namespace {
AliasAnalysis *AA;
MemoryDependenceAnalysis *MD;
DominatorTree *DT;
- PostDominatorTree *PDT;
const TargetLibraryInfo *TLI;
- SmallVector<SmallVector<StoreInst *, 8>, 16> Candidates;
- SetVector<StoreInst *> DeadStores;
- SmallVector<std::pair<const BasicBlock *, const BasicBlock *>, 32>
- BackEdges;
- DenseSet<std::pair<const BasicBlock *, const BasicBlock *>> BackEdgesMap;
+
static char ID; // Pass identification, replacement for typeid
- DSE()
- : FunctionPass(ID), AA(nullptr), MD(nullptr), DT(nullptr),
- PDT(nullptr) {
+ DSE() : FunctionPass(ID), AA(nullptr), MD(nullptr), DT(nullptr) {
initializeDSEPass(*PassRegistry::getPassRegistry());
}
- // Return all stores in a given BasicBlock.
- SmallVector<StoreInst *, 8> getStores(BasicBlock *BB) {
- SmallVector<StoreInst *, 8> VecStores;
- for (auto &BI : *BB) {
- if (StoreInst *SI = dyn_cast<StoreInst>(&BI))
- VecStores.push_back(SI);
- }
- return VecStores;
- }
-
- // Get dfs in/out on the PDT and populate Candidates store list which
- // is used to find potential dead stores for a given block
- void populateCandidateStores(Function &F) {
- for (auto &I : F) {
- DomTreeNode *DTNode = PDT->getNode(&I);
- if (!DTNode)
- continue;
- int DFSIn = DTNode->getDFSNumIn();
- SmallVector<StoreInst *, 8> VecStores = getStores(&I);
- Candidates[DFSIn] = VecStores;
- }
- }
bool runOnFunction(Function &F) override {
if (skipOptnoneFunction(F))
@@ -97,21 +64,7 @@ namespace {
MD = &getAnalysis<MemoryDependenceAnalysis>();
DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
TLI = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI();
- PDT = &getAnalysis<PostDominatorTree>();
- if (PDT->getRootNode()) {
- int Count = PDT->getRootNode()->getDFSNumOut();
- SmallVector<StoreInst *, 8> VecStores;
- Candidates.resize(Count + 1);
- Candidates.assign(Count + 1, VecStores);
-
- // If we have more than 1 block try to populate candidate store.
- if (Count > 1) {
- populateCandidateStores(F);
- FindFunctionBackedges(F, BackEdges);
- for (auto I : BackEdges)
- BackEdgesMap.insert(I);
- }
- }
+
bool Changed = false;
for (Function::iterator I = F.begin(), E = F.end(); I != E; ++I)
// Only check non-dead blocks. Dead blocks may have strange pointer
@@ -130,23 +83,16 @@ namespace {
void RemoveAccessedObjects(const MemoryLocation &LoadedLoc,
SmallSetVector<Value *, 16> &DeadStackObjects,
const DataLayout &DL);
- void handleNonLocalStoreDeletion(StoreInst *SI);
- bool isSafeCandidateForDeletion(BasicBlock *SrcBlock, BasicBlock *SinkBlock,
- StoreInst *SI);
- void DeleteDeadInstruction(Instruction *I, MemoryDependenceAnalysis &MD,
- const TargetLibraryInfo &TLI,
- SmallSetVector<Value *, 16> *ValueSet = nullptr);
+
void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.setPreservesCFG();
AU.addRequired<DominatorTreeWrapperPass>();
AU.addRequired<AliasAnalysis>();
AU.addRequired<MemoryDependenceAnalysis>();
- AU.addRequired<PostDominatorTree>();
AU.addRequired<TargetLibraryInfoWrapperPass>();
AU.addPreserved<AliasAnalysis>();
AU.addPreserved<DominatorTreeWrapperPass>();
AU.addPreserved<MemoryDependenceAnalysis>();
- AU.addPreserved<PostDominatorTree>();
}
};
}
@@ -156,7 +102,6 @@ INITIALIZE_PASS_BEGIN(DSE, "dse", "Dead
INITIALIZE_AG_DEPENDENCY(AliasAnalysis)
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(MemoryDependenceAnalysis)
-INITIALIZE_PASS_DEPENDENCY(PostDominatorTree)
INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
INITIALIZE_PASS_END(DSE, "dse", "Dead Store Elimination", false, false)
@@ -166,6 +111,50 @@ FunctionPass *llvm::createDeadStoreElimi
// Helper functions
//===----------------------------------------------------------------------===//
+/// DeleteDeadInstruction - Delete this instruction. Before we do, go through
+/// and zero out all the operands of this instruction. If any of them become
+/// dead, delete them and the computation tree that feeds them.
+///
+/// If ValueSet is non-null, remove any deleted instructions from it as well.
+///
+static void DeleteDeadInstruction(Instruction *I,
+ MemoryDependenceAnalysis &MD,
+ const TargetLibraryInfo &TLI,
+ SmallSetVector<Value*, 16> *ValueSet = nullptr) {
+ SmallVector<Instruction*, 32> NowDeadInsts;
+
+ NowDeadInsts.push_back(I);
+ --NumFastOther;
+
+ // Before we touch this instruction, remove it from memdep!
+ do {
+ Instruction *DeadInst = NowDeadInsts.pop_back_val();
+ ++NumFastOther;
+
+ // This instruction is dead, zap it, in stages. Start by removing it from
+ // MemDep, which needs to know the operands and needs it to be in the
+ // function.
+ MD.removeInstruction(DeadInst);
+
+ for (unsigned op = 0, e = DeadInst->getNumOperands(); op != e; ++op) {
+ Value *Op = DeadInst->getOperand(op);
+ DeadInst->setOperand(op, nullptr);
+
+ // If this operand just became dead, add it to the NowDeadInsts list.
+ if (!Op->use_empty()) continue;
+
+ if (Instruction *OpI = dyn_cast<Instruction>(Op))
+ if (isInstructionTriviallyDead(OpI, &TLI))
+ NowDeadInsts.push_back(OpI);
+ }
+
+ DeadInst->eraseFromParent();
+
+ if (ValueSet) ValueSet->remove(DeadInst);
+ } while (!NowDeadInsts.empty());
+}
+
+
/// hasMemoryWrite - Does this instruction write some memory? This only returns
/// true for things that we can analyze with other helpers below.
static bool hasMemoryWrite(Instruction *I, const TargetLibraryInfo &TLI) {
@@ -538,15 +527,10 @@ bool DSE::runOnBasicBlock(BasicBlock &BB
MemDepResult InstDep = MD->getDependency(Inst);
- if (!InstDep.isDef() && !InstDep.isClobber() && !InstDep.isNonLocal())
+ // Ignore any store where we can't find a local dependence.
+ // FIXME: cross-block DSE would be fun. :)
+ if (!InstDep.isDef() && !InstDep.isClobber())
continue;
- if (InstDep.isNonLocal()) {
- if (!PDT->getRootNode())
- continue;
- if (StoreInst *SI = dyn_cast<StoreInst>(Inst))
- handleNonLocalStoreDeletion(SI);
- continue;
- }
// Figure out what location is being stored to.
MemoryLocation Loc = getLocForWrite(Inst, *AA);
@@ -720,50 +704,6 @@ static void FindUnconditionalPreds(Small
}
}
-/// DeleteDeadInstruction - Delete this instruction. Before we do, go through
-/// and zero out all the operands of this instruction. If any of them become
-/// dead, delete them and the computation tree that feeds them.
-/// If ValueSet is non-null, remove any deleted instructions from it as well.
-void DSE::DeleteDeadInstruction(Instruction *I, MemoryDependenceAnalysis &MD,
- const TargetLibraryInfo &TLI,
- SmallSetVector<Value *, 16> *ValueSet) {
- SmallVector<Instruction *, 32> NowDeadInsts;
-
- NowDeadInsts.push_back(I);
- --NumFastOther;
-
- // Before we touch this instruction, remove it from memdep!
- do {
- Instruction *DeadInst = NowDeadInsts.pop_back_val();
- ++NumFastOther;
- if (StoreInst *SI = dyn_cast<StoreInst>(DeadInst))
- DeadStores.insert(SI);
-
- // This instruction is dead, zap it, in stages. Start by removing it from
- // MemDep, which needs to know the operands and needs it to be in the
- // function.
- MD.removeInstruction(DeadInst);
-
- for (unsigned op = 0, e = DeadInst->getNumOperands(); op != e; ++op) {
- Value *Op = DeadInst->getOperand(op);
- DeadInst->setOperand(op, nullptr);
-
- // If this operand just became dead, add it to the NowDeadInsts list.
- if (!Op->use_empty())
- continue;
-
- if (Instruction *OpI = dyn_cast<Instruction>(Op))
- if (isInstructionTriviallyDead(OpI, &TLI))
- NowDeadInsts.push_back(OpI);
- }
-
- DeadInst->eraseFromParent();
-
- if (ValueSet)
- ValueSet->remove(DeadInst);
- } while (!NowDeadInsts.empty());
-}
-
/// HandleFree - Handle frees of entire structures whose dependency is a store
/// to a field of that structure.
bool DSE::HandleFree(CallInst *F) {
@@ -991,116 +931,3 @@ void DSE::RemoveAccessedObjects(const Me
return !AA->isNoAlias(StackLoc, LoadedLoc);
});
}
-
-/// isSafeCandidateForDeletion- Check all paths from the SrcBlock till
-/// SinkBlock to see if Store 'SI' is safe to be remove.
-/// Returns true if the candidate store SI is safe to delete
-/// else returns false.
-bool DSE::isSafeCandidateForDeletion(BasicBlock *SrcBlock,
- BasicBlock *SinkBlock, StoreInst *SI) {
- SmallVector<BasicBlock *, 16> WorkList;
- SmallPtrSet<BasicBlock *, 8> Visited;
- BasicBlock::iterator BBI(SI);
-
- // Check from the store till end of block and make sure we have no references
- // to memory stored by this Store Instruction.
- for (auto BI = ++BBI, BE = SrcBlock->end(); BI != BE; ++BI) {
- Instruction *I = BI;
- StoreInst *CSI = dyn_cast<StoreInst>(I);
- if (CSI) {
- AliasResult R =
- AA->alias(MemoryLocation::get(SI), MemoryLocation::get(CSI));
- if (R == MustAlias)
- return true;
- } else {
- ModRefInfo Res = AA->getModRefInfo(I, MemoryLocation::get(SI));
- if (Res != MRI_NoModRef)
- return false;
- }
- }
-
- // Add successors of the block to stack and start DFS.
- for (succ_iterator I = succ_begin(SrcBlock), E = succ_end(SrcBlock); I != E;
- ++I) {
- if (!Visited.insert(*I).second)
- continue;
- // A path with backedge may not be safe. Conservatively mark
- // this store unsafe.
- if (BackEdgesMap.count(std::make_pair(SrcBlock, *I)))
- return false;
- WorkList.push_back(*I);
- }
-
- while (!WorkList.empty()) {
- BasicBlock *B = WorkList.pop_back_val();
- auto BI = B->begin();
- auto BE = B->end();
- for (; BI != BE; ++BI) {
- Instruction *I = BI;
- StoreInst *CSI = dyn_cast<StoreInst>(I);
- if (CSI) {
- AliasResult R =
- AA->alias(MemoryLocation::get(SI), MemoryLocation::get(CSI));
- if (R == MustAlias)
- break;
- } else {
- ModRefInfo Res = AA->getModRefInfo(I, MemoryLocation::get(SI));
- if (Res != MRI_NoModRef)
- return false;
- }
- }
-
- // If we reached the sink node or we found a block which has a stores that
- // overwrites the candidate block we need not look at their successors.
- if (B == SinkBlock || BI != BE)
- continue;
-
- for (succ_iterator I = succ_begin(B), E = succ_end(B); I != E; ++I) {
- if (!Visited.insert(*I).second)
- continue;
- // A path with backedge may not be safe.Conservatively mark
- // this store unsafe.
- if (BackEdgesMap.count(std::make_pair(B, *I)))
- return false;
- WorkList.push_back(*I);
- }
- }
-
- return true;
-}
-
-/// handleNonLocalStoreDeletion - Handle non local dead store elimination.
-/// This works by finding candidate stores using PDT and then running DFS
-/// from candidate store block checking all paths to make sure the store is
-/// safe to delete.
-void DSE::handleNonLocalStoreDeletion(StoreInst *SI) {
- BasicBlock *BB = SI->getParent();
- Value *Pointer = SI->getPointerOperand();
- DomTreeNode *DTNode = PDT->getNode(BB);
- if (!DTNode)
- return;
-
- int DFSNumIn = DTNode->getDFSNumIn();
- int DFSNumOut = DTNode->getDFSNumOut();
- for (int i = DFSNumIn + 1; i < DFSNumOut; ++i) {
- for (auto &I : Candidates[i]) {
- StoreInst *CandidateSI = I;
- if (DeadStores.count(CandidateSI))
- continue;
- Value *MemPtr = CandidateSI->getPointerOperand();
- if (!MemPtr)
- continue;
- if (Pointer->getType() != MemPtr->getType())
- continue;
- AliasResult R =
- AA->alias(MemoryLocation::get(SI), MemoryLocation::get(CandidateSI));
- if (R != MustAlias)
- continue;
- if (isSafeCandidateForDeletion(CandidateSI->getParent(), BB,
- CandidateSI)) {
- DeleteDeadInstruction(CandidateSI, *MD, *TLI);
- ++NumCrossBlockStores;
- }
- }
- }
-}
Removed: llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse.ll?rev=245171&view=auto
==============================================================================
--- llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse.ll (original)
+++ llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse.ll (removed)
@@ -1,76 +0,0 @@
-; RUN: opt < %s -basicaa -dse -S | FileCheck %s
-target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
-
- at x = common global i32 0
- at y = common global i32 0
-
-define void @test_01(i32 %N) {
- %1 = alloca i32
- store i32 %N, i32* %1
- store i32 10, i32* @x
- %2 = load i32, i32* %1
- %3 = icmp ne i32 %2, 0
- br i1 %3, label %4, label %5
-
-; <label>:4
- store i32 5, i32* @x
- br label %5
-
-; <label>:5
- store i32 15, i32* @x
- ret void
-}
-; CHECK-LABEL: @test_01(
-; CHECK-NOT: store i32 10, i32* @x
-; CHECK-NOT: store i32 5, i32* @x
-; CHECK: store i32 15, i32* @x
-
-
-define void @test_02(i32 %N) {
- %1 = alloca i32
- store i32 %N, i32* %1
- store i32 10, i32* @x
- %2 = load i32, i32* %1
- %3 = icmp ne i32 %2, 0
- br i1 %3, label %4, label %5
-
-; <label>:4
- store i32 5, i32* @x
- br label %7
-
-; <label>:5
- %6 = load i32, i32* @x
- store i32 %6, i32* @y
- br label %7
-
-; <label>:7
- store i32 15, i32* @x
- ret void
-}
-; CHECK-LABEL: @test_02(
-; CHECK: store i32 10, i32* @x
-; CHECK-NOT: store i32 5, i32* @x
-; CHECK: store i32 %6, i32* @y
-
-
-define void @test_03(i32 %N) #0 {
- %1 = alloca i32
- store i32 %N, i32* %1
- store i32 10, i32* @x
- %2 = load i32, i32* %1
- %3 = icmp ne i32 %2, 0
- br i1 %3, label %4, label %6
-
-; <label>:4 ; preds = %0
- %5 = load i32, i32* @x
- store i32 %5, i32* @y
- br label %6
-
-; <label>:6 ; preds = %4, %0
- store i32 15, i32* @x
- ret void
-}
-; CHECK-LABEL: @test_03(
-; CHECK: store i32 10, i32* @x
-; CHECK: store i32 %5, i32* @y
-; CHECK: store i32 15, i32* @x
Removed: llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse_loop.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse_loop.ll?rev=245171&view=auto
==============================================================================
--- llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse_loop.ll (original)
+++ llvm/trunk/test/Transforms/DeadStoreElimination/cross_block_dse_loop.ll (removed)
@@ -1,104 +0,0 @@
-; RUN: opt < %s -basicaa -dse -S | FileCheck %s
-target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
-
- at A = common global [100 x i32] zeroinitializer, align 16
- at x = common global i32 0
-
-; Negative Test case-
-;void foo(int N) {
-; A[0] = N;
-; for(int i=0;i<N;++i)
-; A[i]+=i;
-; A[0] = 10;
-;}
-;; Stores should not be optimized away.
-
-define void @test_01(i32 %N) #0 {
- %1 = alloca i32
- %i = alloca i32
- store i32 %N, i32* %1
- %2 = load i32, i32* %1
- store i32 %2, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
- store i32 0, i32* %i
- br label %3
-
-; <label>:3 ; preds = %14, %0
- %4 = load i32, i32* %i
- %5 = load i32, i32* %1
- %6 = icmp slt i32 %4, %5
- br i1 %6, label %7, label %17
-
-; <label>:7 ; preds = %3
- %8 = load i32, i32* %i
- %9 = load i32, i32* %i
- %10 = sext i32 %9 to i64
- %11 = getelementptr inbounds [100 x i32], [100 x i32]* @A, i32 0, i64 %10
- %12 = load i32, i32* %11
- %13 = add nsw i32 %12, %8
- store i32 %13, i32* %11
- br label %14
-
-; <label>:14 ; preds = %7
- %15 = load i32, i32* %i
- %16 = add nsw i32 %15, 1
- store i32 %16, i32* %i
- br label %3
-
-; <label>:17 ; preds = %3
- store i32 10, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
- ret void
-}
-; CHECK-LABEL: @test_01(
-; CHECK: store i32 %2, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
-; CHECK: store i32 %13, i32* %11
-; CHECK: store i32 10, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
-
-
-; Postive Test case-
-;void foo(int N) {
-; A[0] = N;
-; for(int i=0;i<N;++i)
-; A[i]=i;
-; A[0] = 10;
-;}
-;; Stores should not be optimized away.
-define void @test_02(i32 %N) #0 {
- %1 = alloca i32
- %i = alloca i32
- store i32 %N, i32* %1
- %2 = load i32, i32* %1
- store i32 %2, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
- store i32 0, i32* %i
- br label %3
-
-; <label>:3 ; preds = %12, %0
- %4 = load i32, i32* %i
- %5 = load i32, i32* %1
- %6 = icmp slt i32 %4, %5
- br i1 %6, label %7, label %15
-
-; <label>:7 ; preds = %3
- %8 = load i32, i32* %i
- %9 = load i32, i32* %i
- %10 = sext i32 %9 to i64
- %11 = getelementptr inbounds [100 x i32], [100 x i32]* @A, i32 0, i64 %10
- store i32 %8, i32* %11
- br label %12
-
-; <label>:12 ; preds = %7
- %13 = load i32, i32* %i
- %14 = add nsw i32 %13, 1
- store i32 %14, i32* %i
- br label %3
-
-; <label>:15 ; preds = %3
- store i32 10, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
- ret void
-}
-
-; CHECK-LABEL: @test_02(
-; CHECK-NOT: store i32 %2, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
-; CHECK: store i32 %7, i32* %10
-; CHECK: store i32 10, i32* getelementptr inbounds ([100 x i32], [100 x i32]* @A, i32 0, i64 0)
-
-
More information about the llvm-commits
mailing list