Revert r187191, which broke opt -mem2reg on the testcases included in PR16867.

However, opt -O2 doesn't run mem2reg directly so nobody noticed until r188146
when SROA started sending more things directly down the PromoteMemToReg path.

In order to revert r187191, I also revert dependent revisions r187296, r187322
and r188146. Fixes PR16867. Does not add the testcases from that PR, but both
of them should get added for both mem2reg and sroa when this revert gets
unreverted.


git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@188327 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Nick Lewycky 2013-08-13 22:51:58 +00:00
parent 0fe3792a2f
commit 6c1fa7caae
7 changed files with 166 additions and 323 deletions

View File

@ -20,7 +20,6 @@
namespace llvm { namespace llvm {
class AllocaInst; class AllocaInst;
class DataLayout;
class DominatorTree; class DominatorTree;
class AliasSetTracker; class AliasSetTracker;
@ -30,7 +29,7 @@ class AliasSetTracker;
/// (transitively) using this alloca. This also enforces that there is only /// (transitively) using this alloca. This also enforces that there is only
/// ever one layer of bitcasts or GEPs between the alloca and the lifetime /// ever one layer of bitcasts or GEPs between the alloca and the lifetime
/// markers. /// markers.
bool isAllocaPromotable(const AllocaInst *AI, const DataLayout *DL); bool isAllocaPromotable(const AllocaInst *AI);
/// \brief Promote the specified list of alloca instructions into scalar /// \brief Promote the specified list of alloca instructions into scalar
/// registers, inserting PHI nodes as appropriate. /// registers, inserting PHI nodes as appropriate.
@ -42,7 +41,7 @@ bool isAllocaPromotable(const AllocaInst *AI, const DataLayout *DL);
/// If AST is specified, the specified tracker is updated to reflect changes /// If AST is specified, the specified tracker is updated to reflect changes
/// made to the IR. /// made to the IR.
void PromoteMemToReg(ArrayRef<AllocaInst *> Allocas, DominatorTree &DT, void PromoteMemToReg(ArrayRef<AllocaInst *> Allocas, DominatorTree &DT,
const DataLayout *DL, AliasSetTracker *AST = 0); AliasSetTracker *AST = 0);
} // End llvm namespace } // End llvm namespace

View File

@ -197,18 +197,6 @@ public:
/// \brief Construct the slices of a particular alloca. /// \brief Construct the slices of a particular alloca.
AllocaSlices(const DataLayout &DL, AllocaInst &AI); AllocaSlices(const DataLayout &DL, AllocaInst &AI);
/// \brief Whether we determined during the trivial analysis of the alloca
/// that it was immediately promotable with mem2reg.
bool isAllocaPromotable() const { return IsAllocaPromotable; }
/// \brief A list of directly stored values when \c isAllocaPromotable is
/// true.
///
/// The contents are undefined if the alloca is not trivially promotable.
/// This is used to detect other allocas which should be iterated on when
/// doing direct promotion.
ArrayRef<Value *> getStoredValues() const { return StoredValues; }
/// \brief Test whether a pointer to the allocation escapes our analysis. /// \brief Test whether a pointer to the allocation escapes our analysis.
/// ///
/// If this is true, the slices are never fully built and should be /// If this is true, the slices are never fully built and should be
@ -265,20 +253,10 @@ private:
class SliceBuilder; class SliceBuilder;
friend class AllocaSlices::SliceBuilder; friend class AllocaSlices::SliceBuilder;
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
/// \brief Handle to alloca instruction to simplify method interfaces. /// \brief Handle to alloca instruction to simplify method interfaces.
AllocaInst &AI; AllocaInst &AI;
#endif
/// \brief A flag indicating if the alloca is trivially promotable.
///
/// While walking the alloca's uses we track when the uses exceed what
/// mem2reg can trivially handle. This essentially should match the logic in
/// \c isAllocaPromotable but re-using the existing walk of the pointer uses.
bool IsAllocaPromotable;
/// \brief Storage for stored values.
///
/// Only used while the alloca is trivially promotable.
SmallVector<Value *, 8> StoredValues;
/// \brief The instruction responsible for this alloca not having a known set /// \brief The instruction responsible for this alloca not having a known set
/// of slices. /// of slices.
@ -347,9 +325,9 @@ class AllocaSlices::SliceBuilder : public PtrUseVisitor<SliceBuilder> {
SmallPtrSet<Instruction *, 4> VisitedDeadInsts; SmallPtrSet<Instruction *, 4> VisitedDeadInsts;
public: public:
SliceBuilder(const DataLayout &DL, AllocaSlices &S) SliceBuilder(const DataLayout &DL, AllocaInst &AI, AllocaSlices &S)
: PtrUseVisitor<SliceBuilder>(DL), : PtrUseVisitor<SliceBuilder>(DL),
AllocSize(DL.getTypeAllocSize(S.AI.getAllocatedType())), S(S) {} AllocSize(DL.getTypeAllocSize(AI.getAllocatedType())), S(S) {}
private: private:
void markAsDead(Instruction &I) { void markAsDead(Instruction &I) {
@ -402,15 +380,6 @@ private:
if (GEPI.use_empty()) if (GEPI.use_empty())
return markAsDead(GEPI); return markAsDead(GEPI);
// FIXME: mem2reg shouldn't care about the nature of the GEP, but instead
// the offsets of the loads. Until then, we short-circuit here for the
// promotable case.
if (GEPI.hasAllZeroIndices())
return Base::enqueueUsers(GEPI);
// Otherwise, there is something in the GEP, so we disable mem2reg and
// accumulate it.
S.IsAllocaPromotable = false;
return Base::visitGetElementPtrInst(GEPI); return Base::visitGetElementPtrInst(GEPI);
} }
@ -427,13 +396,6 @@ private:
bool IsSplittable = bool IsSplittable =
Ty->isIntegerTy() && !IsVolatile && Offset == 0 && Size >= AllocSize; Ty->isIntegerTy() && !IsVolatile && Offset == 0 && Size >= AllocSize;
// mem2reg can only promote non-volatile loads and stores which exactly
// load the alloca (no offset and the right type).
if (IsVolatile || Offset != 0 || Ty != S.AI.getAllocatedType())
S.IsAllocaPromotable = false;
if (S.IsAllocaPromotable)
assert(Offset == 0);
insertUse(I, Offset, Size, IsSplittable); insertUse(I, Offset, Size, IsSplittable);
} }
@ -474,9 +436,6 @@ private:
return markAsDead(SI); return markAsDead(SI);
} }
if (S.IsAllocaPromotable)
S.StoredValues.push_back(ValOp);
assert((!SI.isSimple() || ValOp->getType()->isSingleValueType()) && assert((!SI.isSimple() || ValOp->getType()->isSingleValueType()) &&
"All simple FCA stores should have been pre-split"); "All simple FCA stores should have been pre-split");
handleLoadOrStore(ValOp->getType(), SI, Offset, Size, SI.isVolatile()); handleLoadOrStore(ValOp->getType(), SI, Offset, Size, SI.isVolatile());
@ -494,8 +453,6 @@ private:
if (!IsOffsetKnown) if (!IsOffsetKnown)
return PI.setAborted(&II); return PI.setAborted(&II);
S.IsAllocaPromotable = false;
insertUse(II, Offset, insertUse(II, Offset,
Length ? Length->getLimitedValue() Length ? Length->getLimitedValue()
: AllocSize - Offset.getLimitedValue(), : AllocSize - Offset.getLimitedValue(),
@ -512,8 +469,6 @@ private:
if (!IsOffsetKnown) if (!IsOffsetKnown)
return PI.setAborted(&II); return PI.setAborted(&II);
S.IsAllocaPromotable = false;
uint64_t RawOffset = Offset.getLimitedValue(); uint64_t RawOffset = Offset.getLimitedValue();
uint64_t Size = Length ? Length->getLimitedValue() uint64_t Size = Length ? Length->getLimitedValue()
: AllocSize - RawOffset; : AllocSize - RawOffset;
@ -574,8 +529,6 @@ private:
return; return;
} }
S.IsAllocaPromotable = false;
Base::visitIntrinsicInst(II); Base::visitIntrinsicInst(II);
} }
@ -650,8 +603,6 @@ private:
return; return;
} }
S.IsAllocaPromotable = false;
insertUse(PN, Offset, PHISize); insertUse(PN, Offset, PHISize);
} }
@ -659,18 +610,14 @@ private:
if (SI.use_empty()) if (SI.use_empty())
return markAsDead(SI); return markAsDead(SI);
if (Value *Result = foldSelectInst(SI)) { if (Value *Result = foldSelectInst(SI)) {
if (Result == *U) { if (Result == *U)
// If the result of the constant fold will be the pointer, recurse // If the result of the constant fold will be the pointer, recurse
// through the select as if we had RAUW'ed it. // through the select as if we had RAUW'ed it.
enqueueUsers(SI); enqueueUsers(SI);
else
// FIXME: mem2reg should support this pattern, but it doesn't.
S.IsAllocaPromotable = false;
} else {
// Otherwise the operand to the select is dead, and we can replace it // Otherwise the operand to the select is dead, and we can replace it
// with undef. // with undef.
S.DeadOperands.push_back(U); S.DeadOperands.push_back(U);
}
return; return;
} }
@ -697,8 +644,6 @@ private:
return; return;
} }
S.IsAllocaPromotable = false;
insertUse(SI, Offset, SelectSize); insertUse(SI, Offset, SelectSize);
} }
@ -709,8 +654,12 @@ private:
}; };
AllocaSlices::AllocaSlices(const DataLayout &DL, AllocaInst &AI) AllocaSlices::AllocaSlices(const DataLayout &DL, AllocaInst &AI)
: AI(AI), IsAllocaPromotable(true), PointerEscapingInstr(0) { :
SliceBuilder PB(DL, *this); #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
AI(AI),
#endif
PointerEscapingInstr(0) {
SliceBuilder PB(DL, AI, *this);
SliceBuilder::PtrInfo PtrI = PB.visitPtr(AI); SliceBuilder::PtrInfo PtrI = PB.visitPtr(AI);
if (PtrI.isEscaped() || PtrI.isAborted()) { if (PtrI.isEscaped() || PtrI.isAborted()) {
// FIXME: We should sink the escape vs. abort info into the caller nicely, // FIXME: We should sink the escape vs. abort info into the caller nicely,
@ -3390,24 +3339,6 @@ bool SROA::runOnAlloca(AllocaInst &AI) {
if (S.begin() == S.end()) if (S.begin() == S.end())
return Changed; return Changed;
// Trivially promotable, don't go through the splitting and rewriting.
if (S.isAllocaPromotable()) {
DEBUG(dbgs() << " Directly promoting alloca: " << AI << "\n");
PromotableAllocas.push_back(&AI);
// Walk through the stored values quickly here to handle directly
// promotable allocas that require iterating on other allocas.
ArrayRef<Value *> StoredValues = S.getStoredValues();
for (ArrayRef<Value *>::iterator SVI = StoredValues.begin(),
SVE = StoredValues.end();
SVI != SVE; ++SVI)
if ((*SVI)->getType()->isPointerTy())
if (AllocaInst *SAI =
dyn_cast<AllocaInst>((*SVI)->stripInBoundsOffsets()))
PostPromotionWorklist.insert(SAI);
return true;
}
Changed |= splitAlloca(AI, S); Changed |= splitAlloca(AI, S);
DEBUG(dbgs() << " Speculating PHIs\n"); DEBUG(dbgs() << " Speculating PHIs\n");
@ -3478,7 +3409,7 @@ bool SROA::promoteAllocas(Function &F) {
if (DT && !ForceSSAUpdater) { if (DT && !ForceSSAUpdater) {
DEBUG(dbgs() << "Promoting allocas with mem2reg...\n"); DEBUG(dbgs() << "Promoting allocas with mem2reg...\n");
PromoteMemToReg(PromotableAllocas, *DT, DL); PromoteMemToReg(PromotableAllocas, *DT);
PromotableAllocas.clear(); PromotableAllocas.clear();
return true; return true;
} }

View File

@ -1426,7 +1426,7 @@ bool SROA::performPromotion(Function &F) {
if (Allocas.empty()) break; if (Allocas.empty()) break;
if (HasDomTree) if (HasDomTree)
PromoteMemToReg(Allocas, *DT, TD); PromoteMemToReg(Allocas, *DT);
else { else {
SSAUpdater SSA; SSAUpdater SSA;
for (unsigned i = 0, e = Allocas.size(); i != e; ++i) { for (unsigned i = 0, e = Allocas.size(); i != e; ++i) {

View File

@ -16,7 +16,6 @@
#include "llvm/Transforms/Scalar.h" #include "llvm/Transforms/Scalar.h"
#include "llvm/ADT/Statistic.h" #include "llvm/ADT/Statistic.h"
#include "llvm/Analysis/Dominators.h" #include "llvm/Analysis/Dominators.h"
#include "llvm/IR/DataLayout.h"
#include "llvm/IR/Function.h" #include "llvm/IR/Function.h"
#include "llvm/IR/Instructions.h" #include "llvm/IR/Instructions.h"
#include "llvm/Transforms/Utils/PromoteMemToReg.h" #include "llvm/Transforms/Utils/PromoteMemToReg.h"
@ -28,7 +27,6 @@ STATISTIC(NumPromoted, "Number of alloca's promoted");
namespace { namespace {
struct PromotePass : public FunctionPass { struct PromotePass : public FunctionPass {
static char ID; // Pass identification, replacement for typeid static char ID; // Pass identification, replacement for typeid
PromotePass() : FunctionPass(ID) { PromotePass() : FunctionPass(ID) {
initializePromotePassPass(*PassRegistry::getPassRegistry()); initializePromotePassPass(*PassRegistry::getPassRegistry());
} }
@ -64,7 +62,6 @@ bool PromotePass::runOnFunction(Function &F) {
bool Changed = false; bool Changed = false;
DominatorTree &DT = getAnalysis<DominatorTree>(); DominatorTree &DT = getAnalysis<DominatorTree>();
const DataLayout *DL = getAnalysisIfAvailable<DataLayout>();
while (1) { while (1) {
Allocas.clear(); Allocas.clear();
@ -73,12 +70,12 @@ bool PromotePass::runOnFunction(Function &F) {
// the entry node // the entry node
for (BasicBlock::iterator I = BB.begin(), E = --BB.end(); I != E; ++I) for (BasicBlock::iterator I = BB.begin(), E = --BB.end(); I != E; ++I)
if (AllocaInst *AI = dyn_cast<AllocaInst>(I)) // Is it an alloca? if (AllocaInst *AI = dyn_cast<AllocaInst>(I)) // Is it an alloca?
if (isAllocaPromotable(AI, DL)) if (isAllocaPromotable(AI))
Allocas.push_back(AI); Allocas.push_back(AI);
if (Allocas.empty()) break; if (Allocas.empty()) break;
PromoteMemToReg(Allocas, DT, DL); PromoteMemToReg(Allocas, DT);
NumPromoted += Allocas.size(); NumPromoted += Allocas.size();
Changed = true; Changed = true;
} }

View File

@ -30,7 +30,6 @@
#include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/ArrayRef.h"
#include "llvm/ADT/DenseMap.h" #include "llvm/ADT/DenseMap.h"
#include "llvm/ADT/STLExtras.h" #include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SetVector.h"
#include "llvm/ADT/SmallPtrSet.h" #include "llvm/ADT/SmallPtrSet.h"
#include "llvm/ADT/SmallVector.h" #include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/Statistic.h" #include "llvm/ADT/Statistic.h"
@ -46,7 +45,6 @@
#include "llvm/IR/Instructions.h" #include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicInst.h" #include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Metadata.h" #include "llvm/IR/Metadata.h"
#include "llvm/InstVisitor.h"
#include "llvm/Support/CFG.h" #include "llvm/Support/CFG.h"
#include "llvm/Transforms/Utils/Local.h" #include "llvm/Transforms/Utils/Local.h"
#include <algorithm> #include <algorithm>
@ -58,16 +56,56 @@ STATISTIC(NumSingleStore, "Number of alloca's promoted with a single store");
STATISTIC(NumDeadAlloca, "Number of dead alloca's removed"); STATISTIC(NumDeadAlloca, "Number of dead alloca's removed");
STATISTIC(NumPHIInsert, "Number of PHI nodes inserted"); STATISTIC(NumPHIInsert, "Number of PHI nodes inserted");
bool llvm::isAllocaPromotable(const AllocaInst *AI) {
// FIXME: If the memory unit is of pointer or integer type, we can permit
// assignments to subsections of the memory unit.
// Only allow direct and non-volatile loads and stores...
for (Value::const_use_iterator UI = AI->use_begin(), UE = AI->use_end();
UI != UE; ++UI) { // Loop over all of the uses of the alloca
const User *U = *UI;
if (const LoadInst *LI = dyn_cast<LoadInst>(U)) {
// Note that atomic loads can be transformed; atomic semantics do
// not have any meaning for a local alloca.
if (LI->isVolatile())
return false;
} else if (const StoreInst *SI = dyn_cast<StoreInst>(U)) {
if (SI->getOperand(0) == AI)
return false; // Don't allow a store OF the AI, only INTO the AI.
// Note that atomic stores can be transformed; atomic semantics do
// not have any meaning for a local alloca.
if (SI->isVolatile())
return false;
} else if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(U)) {
if (II->getIntrinsicID() != Intrinsic::lifetime_start &&
II->getIntrinsicID() != Intrinsic::lifetime_end)
return false;
} else if (const BitCastInst *BCI = dyn_cast<BitCastInst>(U)) {
if (BCI->getType() != Type::getInt8PtrTy(U->getContext()))
return false;
if (!onlyUsedByLifetimeMarkers(BCI))
return false;
} else if (const GetElementPtrInst *GEPI = dyn_cast<GetElementPtrInst>(U)) {
if (GEPI->getType() != Type::getInt8PtrTy(U->getContext()))
return false;
if (!GEPI->hasAllZeroIndices())
return false;
if (!onlyUsedByLifetimeMarkers(GEPI))
return false;
} else {
return false;
}
}
return true;
}
namespace { namespace {
struct AllocaInfo : private InstVisitor<AllocaInfo, bool> { struct AllocaInfo {
const DataLayout *DL;
SmallVector<BasicBlock *, 32> DefiningBlocks; SmallVector<BasicBlock *, 32> DefiningBlocks;
SmallVector<BasicBlock *, 32> UsingBlocks; SmallVector<BasicBlock *, 32> UsingBlocks;
SmallVector<Instruction *, 8> DeadInsts;
Type *AllocaTy;
StoreInst *OnlyStore; StoreInst *OnlyStore;
BasicBlock *OnlyBlock; BasicBlock *OnlyBlock;
bool OnlyUsedInOneBlock; bool OnlyUsedInOneBlock;
@ -75,13 +113,9 @@ struct AllocaInfo : private InstVisitor<AllocaInfo, bool> {
Value *AllocaPointerVal; Value *AllocaPointerVal;
DbgDeclareInst *DbgDeclare; DbgDeclareInst *DbgDeclare;
AllocaInfo(const DataLayout *DL) : DL(DL) {}
void clear() { void clear() {
DefiningBlocks.clear(); DefiningBlocks.clear();
UsingBlocks.clear(); UsingBlocks.clear();
DeadInsts.clear();
AllocaTy = 0;
OnlyStore = 0; OnlyStore = 0;
OnlyBlock = 0; OnlyBlock = 0;
OnlyUsedInOneBlock = true; OnlyUsedInOneBlock = true;
@ -91,116 +125,39 @@ struct AllocaInfo : private InstVisitor<AllocaInfo, bool> {
/// Scan the uses of the specified alloca, filling in the AllocaInfo used /// Scan the uses of the specified alloca, filling in the AllocaInfo used
/// by the rest of the pass to reason about the uses of this alloca. /// by the rest of the pass to reason about the uses of this alloca.
bool analyzeAlloca(AllocaInst &AI) { void AnalyzeAlloca(AllocaInst *AI) {
clear(); clear();
AllocaTy = AI.getAllocatedType(); // As we scan the uses of the alloca instruction, keep track of stores,
enqueueUsers(AI); // and decide whether all of the loads and stores to the alloca are within
// the same basic block.
for (Value::use_iterator UI = AI->use_begin(), E = AI->use_end();
UI != E;) {
Instruction *User = cast<Instruction>(*UI++);
// Walk queued up uses in the worklist to handle nested uses. if (StoreInst *SI = dyn_cast<StoreInst>(User)) {
while (!UseWorklist.empty()) { // Remember the basic blocks which define new values for the alloca
U = UseWorklist.pop_back_val(); DefiningBlocks.push_back(SI->getParent());
Instruction &I = *cast<Instruction>(U->getUser()); AllocaPointerVal = SI->getOperand(0);
if (!visit(I)) OnlyStore = SI;
return false; // Propagate failure to promote up. } else {
LoadInst *LI = cast<LoadInst>(User);
// Otherwise it must be a load instruction, keep track of variable
// reads.
UsingBlocks.push_back(LI->getParent());
AllocaPointerVal = LI;
}
if (OnlyUsedInOneBlock) { if (OnlyUsedInOneBlock) {
if (OnlyBlock == 0) if (OnlyBlock == 0)
OnlyBlock = I.getParent(); OnlyBlock = User->getParent();
else if (OnlyBlock != I.getParent()) else if (OnlyBlock != User->getParent())
OnlyUsedInOneBlock = false; OnlyUsedInOneBlock = false;
} }
} }
DbgDeclare = FindAllocaDbgDeclare(&AI); DbgDeclare = FindAllocaDbgDeclare(AI);
return true;
} }
private:
// Befriend the base class so it can call through private visitor methods.
friend class InstVisitor<AllocaInfo, bool>;
/// \brief A use pointer that is non-null when visiting uses.
Use *U;
/// \brief A worklist for recursively visiting all uses of an alloca.
SmallVector<Use *, 8> UseWorklist;
/// \brief A set for preventing cyclic visitation.
SmallPtrSet<Use *, 8> VisitedUses;
void enqueueUsers(Instruction &I) {
for (Value::use_iterator UI = I.use_begin(), UE = I.use_end(); UI != UE;
++UI)
if (VisitedUses.insert(&UI.getUse()))
UseWorklist.push_back(&UI.getUse());
}
bool visitLoadInst(LoadInst &LI) {
if (LI.isVolatile() || LI.getType() != AllocaTy)
return false;
// Keep track of variable reads.
UsingBlocks.push_back(LI.getParent());
AllocaPointerVal = &LI;
return true;
}
bool visitStoreInst(StoreInst &SI) {
if (SI.isVolatile() || SI.getValueOperand() == U->get() ||
SI.getValueOperand()->getType() != AllocaTy)
return false;
// Remember the basic blocks which define new values for the alloca
DefiningBlocks.push_back(SI.getParent());
AllocaPointerVal = SI.getOperand(0);
OnlyStore = &SI;
return true;
}
bool visitBitCastInst(BitCastInst &BC) {
if (BC.use_empty())
DeadInsts.push_back(&BC);
else
enqueueUsers(BC);
return true;
}
bool visitGetElementPtrInst(GetElementPtrInst &GEPI) {
if (GEPI.use_empty()) {
DeadInsts.push_back(&GEPI);
return true;
}
enqueueUsers(GEPI);
return GEPI.hasAllZeroIndices();
}
// We can promote through debug info intrinsics as they don't alter the
// value stored in memory.
bool visitDbgInfoIntrinsic(DbgInfoIntrinsic &I) {
DeadInsts.push_back(&I);
return true;
}
bool visitIntrinsicInst(IntrinsicInst &II) {
switch (II.getIntrinsicID()) {
default:
return false;
// Lifetime intrinsics don't preclude promoting the memory to a register.
// FIXME: We should use these to promote to undef when outside of a valid
// lifetime.
case Intrinsic::lifetime_start:
case Intrinsic::lifetime_end:
DeadInsts.push_back(&II);
return true;
}
}
// The fallback is that the alloca cannot be promoted.
bool visitInstruction(Instruction &I) { return false; }
}; };
// Data package used by RenamePass() // Data package used by RenamePass()
@ -278,7 +235,6 @@ struct PromoteMem2Reg {
std::vector<AllocaInst *> Allocas; std::vector<AllocaInst *> Allocas;
DominatorTree &DT; DominatorTree &DT;
DIBuilder DIB; DIBuilder DIB;
const DataLayout *DL;
/// An AliasSetTracker object to update. If null, don't update it. /// An AliasSetTracker object to update. If null, don't update it.
AliasSetTracker *AST; AliasSetTracker *AST;
@ -324,9 +280,9 @@ struct PromoteMem2Reg {
public: public:
PromoteMem2Reg(ArrayRef<AllocaInst *> Allocas, DominatorTree &DT, PromoteMem2Reg(ArrayRef<AllocaInst *> Allocas, DominatorTree &DT,
const DataLayout *DL, AliasSetTracker *AST) AliasSetTracker *AST)
: Allocas(Allocas.begin(), Allocas.end()), DT(DT), : Allocas(Allocas.begin(), Allocas.end()), DT(DT),
DIB(*DT.getRoot()->getParent()->getParent()), DL(DL), AST(AST) {} DIB(*DT.getRoot()->getParent()->getParent()), AST(AST) {}
void run(); void run();
@ -357,39 +313,27 @@ private:
} // end of anonymous namespace } // end of anonymous namespace
/// \brief Walk a small vector of dead instructions and recursively remove them static void removeLifetimeIntrinsicUsers(AllocaInst *AI) {
/// and subsequently dead instructions. // Knowing that this alloca is promotable, we know that it's safe to kill all
/// // instructions except for load and store.
/// This is only valid to call on dead instructions using an alloca which is
/// promotable, as we leverage that assumption to delete them faster.
static void removeDeadInstructions(AllocaInst *AI,
SmallVectorImpl<Instruction *> &DeadInsts) {
while (!DeadInsts.empty()) {
Instruction *I = DeadInsts.pop_back_val();
// Don't delete the alloca itself. for (Value::use_iterator UI = AI->use_begin(), UE = AI->use_end();
if (I == AI) UI != UE;) {
Instruction *I = cast<Instruction>(*UI);
++UI;
if (isa<LoadInst>(I) || isa<StoreInst>(I))
continue; continue;
// Note that we open code the deletion algorithm here because we know if (!I->getType()->isVoidTy()) {
// apriori that all of the instructions using an alloca that reaches here // The only users of this bitcast/GEP instruction are lifetime intrinsics.
// are trivially dead when their use list becomes empty (The only risk are // Follow the use/def chain to erase them now instead of leaving it for
// lifetime markers which we specifically want to nuke). By coding it here // dead code elimination later.
// we can skip the triviality test and be more efficient. for (Value::use_iterator UI = I->use_begin(), UE = I->use_end();
// UI != UE;) {
// Null out all of the instruction's operands to see if any operand becomes Instruction *Inst = cast<Instruction>(*UI);
// dead as we go. ++UI;
for (User::op_iterator OI = I->op_begin(), OE = I->op_end(); OI != OE; Inst->eraseFromParent();
++OI) { }
Instruction *Op = dyn_cast<Instruction>(*OI);
if (!Op)
continue;
OI->set(0);
if (!Op->use_empty())
continue;
DeadInsts.push_back(Op);
} }
I->eraseFromParent(); I->eraseFromParent();
} }
@ -590,23 +534,17 @@ void PromoteMem2Reg::run() {
PointerAllocaValues.resize(Allocas.size()); PointerAllocaValues.resize(Allocas.size());
AllocaDbgDeclares.resize(Allocas.size()); AllocaDbgDeclares.resize(Allocas.size());
AllocaInfo Info(DL); AllocaInfo Info;
LargeBlockInfo LBI; LargeBlockInfo LBI;
for (unsigned AllocaNum = 0; AllocaNum != Allocas.size(); ++AllocaNum) { for (unsigned AllocaNum = 0; AllocaNum != Allocas.size(); ++AllocaNum) {
AllocaInst *AI = Allocas[AllocaNum]; AllocaInst *AI = Allocas[AllocaNum];
assert(isAllocaPromotable(AI) && "Cannot promote non-promotable alloca!");
assert(AI->getParent()->getParent() == &F && assert(AI->getParent()->getParent() == &F &&
"All allocas should be in the same function, which is same as DF!"); "All allocas should be in the same function, which is same as DF!");
// Calculate the set of read and write-locations for each alloca. This is removeLifetimeIntrinsicUsers(AI);
// analogous to finding the 'uses' and 'definitions' of each variable.
bool Good = Info.analyzeAlloca(*AI);
(void)Good;
assert(Good && "Cannot promote non-promotable alloca!");
// Nuke all of the dead instructions.
removeDeadInstructions(AI, Info.DeadInsts);
if (AI->use_empty()) { if (AI->use_empty()) {
// If there are no uses of the alloca, just delete it now. // If there are no uses of the alloca, just delete it now.
@ -620,6 +558,10 @@ void PromoteMem2Reg::run() {
continue; continue;
} }
// Calculate the set of read and write-locations for each alloca. This is
// analogous to finding the 'uses' and 'definitions' of each variable.
Info.AnalyzeAlloca(AI);
// If there is only a single store to this value, replace any loads of // If there is only a single store to this value, replace any loads of
// it that are directly dominated by the definition with the value stored. // it that are directly dominated by the definition with the value stored.
if (Info.DefiningBlocks.size() == 1) { if (Info.DefiningBlocks.size() == 1) {
@ -1145,19 +1087,11 @@ NextIteration:
goto NextIteration; goto NextIteration;
} }
bool llvm::isAllocaPromotable(const AllocaInst *AI, const DataLayout *DL) {
// We cast away constness because we re-use the non-const analysis that the
// actual promotion routine uses. While it is non-const, it doesn't actually
// mutate anything at this phase, and we discard the non-const results that
// promotion uses to mutate the alloca.
return AllocaInfo(DL).analyzeAlloca(*const_cast<AllocaInst *>(AI));
}
void llvm::PromoteMemToReg(ArrayRef<AllocaInst *> Allocas, DominatorTree &DT, void llvm::PromoteMemToReg(ArrayRef<AllocaInst *> Allocas, DominatorTree &DT,
const DataLayout *DL, AliasSetTracker *AST) { AliasSetTracker *AST) {
// If there is nothing to do, bail out... // If there is nothing to do, bail out...
if (Allocas.empty()) if (Allocas.empty())
return; return;
PromoteMem2Reg(Allocas, DT, DL, AST).run(); PromoteMem2Reg(Allocas, DT, AST).run();
} }

View File

@ -0,0 +1,52 @@
; RUN: opt -mem2reg -S -o - < %s | FileCheck %s
declare void @llvm.lifetime.start(i64 %size, i8* nocapture %ptr)
declare void @llvm.lifetime.end(i64 %size, i8* nocapture %ptr)
define void @test1() {
; CHECK: test1
; CHECK-NOT: alloca
%A = alloca i32
%B = bitcast i32* %A to i8*
call void @llvm.lifetime.start(i64 2, i8* %B)
store i32 1, i32* %A
call void @llvm.lifetime.end(i64 2, i8* %B)
ret void
}
define void @test2() {
; CHECK: test2
; CHECK-NOT: alloca
%A = alloca {i8, i16}
%B = getelementptr {i8, i16}* %A, i32 0, i32 0
call void @llvm.lifetime.start(i64 2, i8* %B)
store {i8, i16} zeroinitializer, {i8, i16}* %A
call void @llvm.lifetime.end(i64 2, i8* %B)
ret void
}
; RUN: opt -mem2reg -S -o - < %s | FileCheck %s
declare void @llvm.lifetime.start(i64 %size, i8* nocapture %ptr)
declare void @llvm.lifetime.end(i64 %size, i8* nocapture %ptr)
define void @test1() {
; CHECK: test1
; CHECK-NOT: alloca
%A = alloca i32
%B = bitcast i32* %A to i8*
call void @llvm.lifetime.start(i64 2, i8* %B)
store i32 1, i32* %A
call void @llvm.lifetime.end(i64 2, i8* %B)
ret void
}
define void @test2() {
; CHECK: test2
; CHECK-NOT: alloca
%A = alloca {i8, i16}
%B = getelementptr {i8, i16}* %A, i32 0, i32 0
call void @llvm.lifetime.start(i64 2, i8* %B)
store {i8, i16} zeroinitializer, {i8, i16}* %A
call void @llvm.lifetime.end(i64 2, i8* %B)
ret void
}

View File

@ -1,70 +0,0 @@
; RUN: opt -mem2reg -S -o - < %s | FileCheck %s
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-n8:16:32:64"
declare void @llvm.lifetime.start(i64 %size, i8* nocapture %ptr)
declare void @llvm.lifetime.end(i64 %size, i8* nocapture %ptr)
define void @test1() {
; Ensure we can look through a bitcast to i8* and the addition of lifetime
; markers.
;
; CHECK-LABEL: @test1(
; CHECK-NOT: alloca
; CHECK: ret void
%A = alloca i32
%B = bitcast i32* %A to i8*
call void @llvm.lifetime.start(i64 2, i8* %B)
store i32 1, i32* %A
call void @llvm.lifetime.end(i64 2, i8* %B)
ret void
}
define void @test2() {
; Ensure we can look through a GEP to i8* and the addition of lifetime
; markers.
;
; CHECK-LABEL: @test2(
; CHECK-NOT: alloca
; CHECK: ret void
%A = alloca {i8, i16}
%B = getelementptr {i8, i16}* %A, i32 0, i32 0
call void @llvm.lifetime.start(i64 2, i8* %B)
store {i8, i16} zeroinitializer, {i8, i16}* %A
call void @llvm.lifetime.end(i64 2, i8* %B)
ret void
}
define i32 @test3(i32 %x) {
; CHECK-LABEL: @test3(
;
; Check that we recursively walk the uses of the alloca and thus can see
; through round trip bitcasts, dead bitcasts, GEPs, multiple GEPs, and lifetime
; markers.
entry:
%a = alloca i32
; CHECK-NOT: alloca
%b = bitcast i32* %a to i8*
%b2 = getelementptr inbounds i8* %b, i32 0
%b3 = getelementptr inbounds i8* %b2, i32 0
call void @llvm.lifetime.start(i64 -1, i8* %b3)
; CHECK-NOT: call void @llvm.lifetime.start
store i32 %x, i32* %a
; CHECK-NOT: store
%dead = bitcast i32* %a to i4096*
%dead1 = bitcast i4096* %dead to i42*
%dead2 = getelementptr inbounds i32* %a, i32 %x
; CHECK-NOT: bitcast
; CHECK-NOT: getelementptr
%ret = load i32* %a
; CHECK-NOT: load
ret i32 %ret
; CHECK: ret i32 %x
}