[LICM] Don't create more than one copy of an instruction per loop exit block when sinking.

Fixes exponential compilation complexity in PR19835, caused by
LICM::sink not handling the following pattern well:

f = op g
e = op f, g
d = op e
c = op d, e
b = op c
a = op b, c

When an instruction with N uses is sunk, each of its operands gets N
new uses (all of them - phi nodes). In the example above, if a had 1
use, c would have 2, e would have 4, and g would have 8.


git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@211673 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Evgeniy Stepanov
2014-06-25 07:54:58 +00:00
parent aa2e057bc1
commit 98726c311b
2 changed files with 62 additions and 23 deletions

View File

@@ -550,6 +550,9 @@ void LICM::sink(Instruction &I) {
SmallPtrSet<BasicBlock *, 32> ExitBlockSet(ExitBlocks.begin(), ExitBlocks.end());
#endif
// Clones of this instruction. Don't create more than one per exit block!
SmallDenseMap<BasicBlock *, Instruction *, 32> SunkCopies;
// If this instruction is only used outside of the loop, then all users are
// PHI nodes in exit blocks due to LCSSA form. Just RAUW them with clones of
// the instruction.
@@ -561,30 +564,37 @@ void LICM::sink(Instruction &I) {
assert(ExitBlockSet.count(ExitBlock) &&
"The LCSSA PHI is not in an exit block!");
Instruction *New = I.clone();
ExitBlock->getInstList().insert(ExitBlock->getFirstInsertionPt(), New);
if (!I.getName().empty())
New->setName(I.getName() + ".le");
Instruction *New;
auto It = SunkCopies.find(ExitBlock);
if (It != SunkCopies.end()) {
New = It->second;
} else {
New = I.clone();
SunkCopies[ExitBlock] = New;
ExitBlock->getInstList().insert(ExitBlock->getFirstInsertionPt(), New);
if (!I.getName().empty())
New->setName(I.getName() + ".le");
// Build LCSSA PHI nodes for any in-loop operands. Note that this is
// particularly cheap because we can rip off the PHI node that we're
// replacing for the number and blocks of the predecessors.
// OPT: If this shows up in a profile, we can instead finish sinking all
// invariant instructions, and then walk their operands to re-establish
// LCSSA. That will eliminate creating PHI nodes just to nuke them when
// sinking bottom-up.
for (User::op_iterator OI = New->op_begin(), OE = New->op_end(); OI != OE;
++OI)
if (Instruction *OInst = dyn_cast<Instruction>(*OI))
if (Loop *OLoop = LI->getLoopFor(OInst->getParent()))
if (!OLoop->contains(PN)) {
PHINode *OpPN = PHINode::Create(
OInst->getType(), PN->getNumIncomingValues(),
OInst->getName() + ".lcssa", ExitBlock->begin());
for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i)
OpPN->addIncoming(OInst, PN->getIncomingBlock(i));
*OI = OpPN;
}
// Build LCSSA PHI nodes for any in-loop operands. Note that this is
// particularly cheap because we can rip off the PHI node that we're
// replacing for the number and blocks of the predecessors.
// OPT: If this shows up in a profile, we can instead finish sinking all
// invariant instructions, and then walk their operands to re-establish
// LCSSA. That will eliminate creating PHI nodes just to nuke them when
// sinking bottom-up.
for (User::op_iterator OI = New->op_begin(), OE = New->op_end(); OI != OE;
++OI)
if (Instruction *OInst = dyn_cast<Instruction>(*OI))
if (Loop *OLoop = LI->getLoopFor(OInst->getParent()))
if (!OLoop->contains(PN)) {
PHINode *OpPN = PHINode::Create(
OInst->getType(), PN->getNumIncomingValues(),
OInst->getName() + ".lcssa", ExitBlock->begin());
for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i)
OpPN->addIncoming(OInst, PN->getIncomingBlock(i));
*OI = OpPN;
}
}
PN->replaceAllUsesWith(New);
PN->eraseFromParent();