//===-- BranchFolding.cpp - Fold machine code branch instructions ---------===// // // The LLVM Compiler Infrastructure // // This file was developed by the LLVM research group and is distributed under // the University of Illinois Open Source License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This pass forwards branches to unconditional branches to make them branch // directly to the target block. This pass often results in dead MBB's, which // it then removes. // // Note that this pass must be run after register allocation, it cannot handle // SSA form. // //===----------------------------------------------------------------------===// #include "llvm/CodeGen/Passes.h" #include "llvm/CodeGen/MachineDebugInfo.h" #include "llvm/CodeGen/MachineFunctionPass.h" #include "llvm/CodeGen/MachineJumpTableInfo.h" #include "llvm/Target/TargetInstrInfo.h" #include "llvm/Target/TargetMachine.h" #include "llvm/Support/CommandLine.h" #include "llvm/ADT/Statistic.h" #include "llvm/ADT/STLExtras.h" using namespace llvm; static Statistic<> NumDeadBlocks("branchfold", "Number of dead blocks removed"); static Statistic<> NumBranchOpts("branchfold", "Number of branches optimized"); static Statistic<> NumTailMerge ("branchfold", "Number of block tails merged"); static cl::opt EnableTailMerge("enable-tail-merge", cl::init(false)); namespace { struct BranchFolder : public MachineFunctionPass { virtual bool runOnMachineFunction(MachineFunction &MF); virtual const char *getPassName() const { return "Control Flow Optimizer"; } const TargetInstrInfo *TII; MachineDebugInfo *MDI; bool MadeChange; private: // Tail Merging. bool TailMergeBlocks(MachineFunction &MF); void ReplaceTailWithBranchTo(MachineBasicBlock::iterator OldInst, MachineBasicBlock *NewDest); // Branch optzn. bool OptimizeBranches(MachineFunction &MF); void OptimizeBlock(MachineFunction::iterator MBB); void RemoveDeadBlock(MachineBasicBlock *MBB); }; } FunctionPass *llvm::createBranchFoldingPass() { return new BranchFolder(); } /// RemoveDeadBlock - Remove the specified dead machine basic block from the /// function, updating the CFG. void BranchFolder::RemoveDeadBlock(MachineBasicBlock *MBB) { assert(MBB->pred_empty() && "MBB must be dead!"); MachineFunction *MF = MBB->getParent(); // drop all successors. while (!MBB->succ_empty()) MBB->removeSuccessor(MBB->succ_end()-1); // If there is DWARF info to active, check to see if there are any DWARF_LABEL // records in the basic block. If so, unregister them from MachineDebugInfo. if (MDI && !MBB->empty()) { unsigned DWARF_LABELOpc = TII->getDWARF_LABELOpcode(); assert(DWARF_LABELOpc && "Target supports dwarf but didn't implement getDWARF_LABELOpcode!"); for (MachineBasicBlock::iterator I = MBB->begin(), E = MBB->end(); I != E; ++I) { if ((unsigned)I->getOpcode() == DWARF_LABELOpc) { // The label ID # is always operand #0, an immediate. MDI->InvalidateLabel(I->getOperand(0).getImm()); } } } // Remove the block. MF->getBasicBlockList().erase(MBB); } bool BranchFolder::runOnMachineFunction(MachineFunction &MF) { TII = MF.getTarget().getInstrInfo(); if (!TII) return false; MDI = getAnalysisToUpdate(); bool EverMadeChange = false; bool MadeChangeThisIteration = true; while (MadeChangeThisIteration) { MadeChangeThisIteration = false; MadeChangeThisIteration |= TailMergeBlocks(MF); MadeChangeThisIteration |= OptimizeBranches(MF); EverMadeChange |= MadeChangeThisIteration; } return EverMadeChange; } //===----------------------------------------------------------------------===// // Tail Merging of Blocks //===----------------------------------------------------------------------===// /// HashMachineInstr - Compute a hash value for MI and its operands. static unsigned HashMachineInstr(const MachineInstr *MI) { unsigned Hash = MI->getOpcode(); for (unsigned i = 0, e = MI->getNumOperands(); i != e; ++i) { const MachineOperand &Op = MI->getOperand(i); // Merge in bits from the operand if easy. unsigned OperandHash = 0; switch (Op.getType()) { case MachineOperand::MO_Register: OperandHash = Op.getReg(); break; case MachineOperand::MO_Immediate: OperandHash = Op.getImm(); break; case MachineOperand::MO_MachineBasicBlock: OperandHash = Op.getMachineBasicBlock()->getNumber(); break; case MachineOperand::MO_FrameIndex: OperandHash = Op.getFrameIndex(); break; case MachineOperand::MO_ConstantPoolIndex: OperandHash = Op.getConstantPoolIndex(); break; case MachineOperand::MO_JumpTableIndex: OperandHash = Op.getJumpTableIndex(); break; case MachineOperand::MO_GlobalAddress: case MachineOperand::MO_ExternalSymbol: // Global address / external symbol are too hard, don't bother, but do // pull in the offset. OperandHash = Op.getOffset(); break; default: break; } Hash += ((OperandHash << 3) | Op.getType()) << (i&31); } return Hash; } /// HashEndOfMBB - Hash the last two instructions in the MBB. We hash two /// instructions, because cross-jumping only saves code when at least two /// instructions are removed (since a branch must be inserted). static unsigned HashEndOfMBB(const MachineBasicBlock *MBB) { MachineBasicBlock::const_iterator I = MBB->end(); if (I == MBB->begin()) return 0; // Empty MBB. --I; unsigned Hash = HashMachineInstr(I); if (I == MBB->begin()) return Hash; // Single instr MBB. --I; // Hash in the second-to-last instruction. Hash ^= HashMachineInstr(I) << 2; return Hash; } /// ComputeCommonTailLength - Given two machine basic blocks, compute the number /// of instructions they actually have in common together at their end. Return /// iterators for the first shared instruction in each block. static unsigned ComputeCommonTailLength(MachineBasicBlock *MBB1, MachineBasicBlock *MBB2, MachineBasicBlock::iterator &I1, MachineBasicBlock::iterator &I2) { I1 = MBB1->end(); I2 = MBB2->end(); unsigned TailLen = 0; while (I1 != MBB1->begin() && I2 != MBB2->begin()) { --I1; --I2; if (!I1->isIdenticalTo(I2)) { ++I1; ++I2; break; } ++TailLen; } return TailLen; } /// ReplaceTailWithBranchTo - Delete the instruction OldInst and everything /// after it, replacing it with an unconditional branch to NewDest. This /// returns true if OldInst's block is modified, false if NewDest is modified. void BranchFolder::ReplaceTailWithBranchTo(MachineBasicBlock::iterator OldInst, MachineBasicBlock *NewDest) { MachineBasicBlock *OldBB = OldInst->getParent(); // Remove all the old successors of OldBB from the CFG. while (!OldBB->succ_empty()) OldBB->removeSuccessor(OldBB->succ_begin()); // Remove all the dead instructions from the end of OldBB. OldBB->erase(OldInst, OldBB->end()); // If OldBB isn't immediately before OldBB, insert a branch to it. if (++MachineFunction::iterator(OldBB) != MachineFunction::iterator(NewDest)) TII->InsertBranch(*OldBB, NewDest, 0, std::vector()); OldBB->addSuccessor(NewDest); ++NumTailMerge; } bool BranchFolder::TailMergeBlocks(MachineFunction &MF) { MadeChange = false; if (!EnableTailMerge) return false; // Find blocks with no successors. std::vector > MergePotentials; for (MachineFunction::iterator I = MF.begin(), E = MF.end(); I != E; ++I) { if (I->succ_empty()) MergePotentials.push_back(std::make_pair(HashEndOfMBB(I), I)); } // Sort by hash value so that blocks with identical end sequences sort // together. std::stable_sort(MergePotentials.begin(), MergePotentials.end()); // Walk through equivalence sets looking for actual exact matches. while (MergePotentials.size() > 1) { unsigned CurHash = (MergePotentials.end()-1)->first; unsigned PrevHash = (MergePotentials.end()-2)->first; MachineBasicBlock *CurMBB = (MergePotentials.end()-1)->second; // If there is nothing that matches the hash of the current basic block, // give up. if (CurHash != PrevHash) { MergePotentials.pop_back(); continue; } // Determine the actual length of the shared tail between these two basic // blocks. Because the hash can have collisions, it's possible that this is // less than 2. MachineBasicBlock::iterator BBI1, BBI2; unsigned CommonTailLen = ComputeCommonTailLength(CurMBB, (MergePotentials.end()-2)->second, BBI1, BBI2); // If the tails don't have at least two instructions in common, see if there // is anything else in the equivalence class that does match. if (CommonTailLen < 2) { unsigned FoundMatch = ~0U; for (int i = MergePotentials.size()-2; i != -1 && MergePotentials[i].first == CurHash; --i) { CommonTailLen = ComputeCommonTailLength(CurMBB, MergePotentials[i].second, BBI1, BBI2); if (CommonTailLen >= 2) { FoundMatch = i; break; } } // If we didn't find anything that has at least two instructions matching // this one, bail out. if (FoundMatch == ~0U) { MergePotentials.pop_back(); continue; } // Otherwise, move the matching block to the right position. std::swap(MergePotentials[FoundMatch], *(MergePotentials.end()-2)); } // If either block is the entire common tail, make the longer one branch to // the shorter one. MachineBasicBlock *MBB2 = (MergePotentials.end()-2)->second; if (CurMBB->begin() == BBI1) { // Hack the end off MBB2, making it jump to CurMBB instead. ReplaceTailWithBranchTo(BBI2, CurMBB); // This modifies MBB2, so remove it from the worklist. MergePotentials.erase(MergePotentials.end()-2); MadeChange = true; continue; } else if (MBB2->begin() == BBI2) { // Hack the end off CurMBB, making it jump to MBBI@ instead. ReplaceTailWithBranchTo(BBI1, MBB2); // This modifies CurMBB, so remove it from the worklist. MergePotentials.pop_back(); MadeChange = true; continue; } MergePotentials.pop_back(); } return MadeChange; } //===----------------------------------------------------------------------===// // Branch Optimization //===----------------------------------------------------------------------===// bool BranchFolder::OptimizeBranches(MachineFunction &MF) { MadeChange = false; for (MachineFunction::iterator I = ++MF.begin(), E = MF.end(); I != E; ) { MachineBasicBlock *MBB = I++; OptimizeBlock(MBB); // If it is dead, remove it. if (MBB->pred_empty()) { RemoveDeadBlock(MBB); MadeChange = true; ++NumDeadBlocks; } } return MadeChange; } /// CorrectExtraCFGEdges - Various pieces of code can cause excess edges in the /// CFG to be inserted. If we have proven that MBB can only branch to DestA and /// DestB, remove any other MBB successors from the CFG. DestA and DestB can /// be null. static bool CorrectExtraCFGEdges(MachineBasicBlock &MBB, MachineBasicBlock *DestA, MachineBasicBlock *DestB, bool isCond, MachineFunction::iterator FallThru) { bool MadeChange = false; bool AddedFallThrough = false; // If this block ends with a conditional branch that falls through to its // successor, set DestB as the successor. if (isCond) { if (DestB == 0 && FallThru != MBB.getParent()->end()) { DestB = FallThru; AddedFallThrough = true; } } else { // If this is an unconditional branch with no explicit dest, it must just be // a fallthrough into DestB. if (DestA == 0 && FallThru != MBB.getParent()->end()) { DestA = FallThru; AddedFallThrough = true; } } MachineBasicBlock::pred_iterator SI = MBB.succ_begin(); while (SI != MBB.succ_end()) { if (*SI == DestA) { DestA = 0; ++SI; } else if (*SI == DestB) { DestB = 0; ++SI; } else { // Otherwise, this is a superfluous edge, remove it. MBB.removeSuccessor(SI); MadeChange = true; } } if (!AddedFallThrough) { assert(DestA == 0 && DestB == 0 && "MachineCFG is missing edges!"); } else if (isCond) { assert(DestA == 0 && "MachineCFG is missing edges!"); } return MadeChange; } /// ReplaceUsesOfBlockWith - Given a machine basic block 'BB' that branched to /// 'Old', change the code and CFG so that it branches to 'New' instead. static void ReplaceUsesOfBlockWith(MachineBasicBlock *BB, MachineBasicBlock *Old, MachineBasicBlock *New, const TargetInstrInfo *TII) { assert(Old != New && "Cannot replace self with self!"); MachineBasicBlock::iterator I = BB->end(); while (I != BB->begin()) { --I; if (!TII->isTerminatorInstr(I->getOpcode())) break; // Scan the operands of this machine instruction, replacing any uses of Old // with New. for (unsigned i = 0, e = I->getNumOperands(); i != e; ++i) if (I->getOperand(i).isMachineBasicBlock() && I->getOperand(i).getMachineBasicBlock() == Old) I->getOperand(i).setMachineBasicBlock(New); } // Update the successor information. std::vector Succs(BB->succ_begin(), BB->succ_end()); for (int i = Succs.size()-1; i >= 0; --i) if (Succs[i] == Old) { BB->removeSuccessor(Old); BB->addSuccessor(New); } } /// OptimizeBlock - Analyze and optimize control flow related to the specified /// block. This is never called on the entry block. void BranchFolder::OptimizeBlock(MachineFunction::iterator MBB) { // If this block is empty, make everyone use its fall-through, not the block // explicitly. if (MBB->empty()) { // Dead block? Leave for cleanup later. if (MBB->pred_empty()) return; MachineFunction::iterator FallThrough = next(MBB); if (FallThrough == MBB->getParent()->end()) { // TODO: Simplify preds to not branch here if possible! } else { // Rewrite all predecessors of the old block to go to the fallthrough // instead. while (!MBB->pred_empty()) { MachineBasicBlock *Pred = *(MBB->pred_end()-1); ReplaceUsesOfBlockWith(Pred, MBB, FallThrough, TII); } // If MBB was the target of a jump table, update jump tables to go to the // fallthrough instead. MBB->getParent()->getJumpTableInfo()->ReplaceMBBInJumpTables(MBB, FallThrough); MadeChange = true; } return; } // Check to see if we can simplify the terminator of the block before this // one. MachineBasicBlock &PrevBB = *prior(MBB); MachineBasicBlock *PriorTBB = 0, *PriorFBB = 0; std::vector PriorCond; bool PriorUnAnalyzable = false; PriorUnAnalyzable = TII->AnalyzeBranch(PrevBB, PriorTBB, PriorFBB, PriorCond); if (!PriorUnAnalyzable) { // If the CFG for the prior block has extra edges, remove them. MadeChange |= CorrectExtraCFGEdges(PrevBB, PriorTBB, PriorFBB, !PriorCond.empty(), MBB); // If the previous branch is conditional and both conditions go to the same // destination, remove the branch, replacing it with an unconditional one or // a fall-through. if (PriorTBB && PriorTBB == PriorFBB) { TII->RemoveBranch(PrevBB); PriorCond.clear(); if (PriorTBB != &*MBB) TII->InsertBranch(PrevBB, PriorTBB, 0, PriorCond); MadeChange = true; ++NumBranchOpts; return OptimizeBlock(MBB); } // If the previous branch *only* branches to *this* block (conditional or // not) remove the branch. if (PriorTBB == &*MBB && PriorFBB == 0) { TII->RemoveBranch(PrevBB); MadeChange = true; ++NumBranchOpts; return OptimizeBlock(MBB); } // If the prior block branches somewhere else on the condition and here if // the condition is false, remove the uncond second branch. if (PriorFBB == &*MBB) { TII->RemoveBranch(PrevBB); TII->InsertBranch(PrevBB, PriorTBB, 0, PriorCond); MadeChange = true; ++NumBranchOpts; return OptimizeBlock(MBB); } // If the prior block branches here on true and somewhere else on false, and // if the branch condition is reversible, reverse the branch to create a // fall-through. if (PriorTBB == &*MBB) { std::vector NewPriorCond(PriorCond); if (!TII->ReverseBranchCondition(NewPriorCond)) { TII->RemoveBranch(PrevBB); TII->InsertBranch(PrevBB, PriorFBB, 0, NewPriorCond); MadeChange = true; ++NumBranchOpts; return OptimizeBlock(MBB); } } } // Analyze the branch in the current block. MachineBasicBlock *CurTBB = 0, *CurFBB = 0; std::vector CurCond; if (!TII->AnalyzeBranch(*MBB, CurTBB, CurFBB, CurCond)) { // If the CFG for the prior block has extra edges, remove them. MadeChange |= CorrectExtraCFGEdges(*MBB, CurTBB, CurFBB, !CurCond.empty(), next(MBB)); // If this branch is the only thing in its block, see if we can forward // other blocks across it. if (CurTBB && CurCond.empty() && CurFBB == 0 && TII->isBranch(MBB->begin()->getOpcode()) && CurTBB != &*MBB) { // This block may contain just an unconditional branch. Because there can // be 'non-branch terminators' in the block, try removing the branch and // then seeing if the block is empty. TII->RemoveBranch(*MBB); // If this block is just an unconditional branch to CurTBB, we can // usually completely eliminate the block. The only case we cannot // completely eliminate the block is when the block before this one // falls through into MBB and we can't understand the prior block's branch // condition. if (MBB->empty() && (!PriorUnAnalyzable || !PrevBB.isSuccessor(MBB))) { // If the prior block falls through into us, turn it into an // explicit branch to us to make updates simpler. if (PrevBB.isSuccessor(MBB) && PriorTBB != &*MBB && PriorFBB != &*MBB) { if (PriorTBB == 0) { assert(PriorCond.empty() && PriorFBB == 0 && "Bad branch analysis"); PriorTBB = MBB; } else { assert(PriorFBB == 0 && "Machine CFG out of date!"); PriorFBB = MBB; } TII->RemoveBranch(PrevBB); TII->InsertBranch(PrevBB, PriorTBB, PriorFBB, PriorCond); } // Iterate through all the predecessors, revectoring each in-turn. MachineBasicBlock::pred_iterator PI = MBB->pred_begin(); bool DidChange = false; bool HasBranchToSelf = false; while (PI != MBB->pred_end()) { if (*PI == &*MBB) { // If this block has an uncond branch to itself, leave it. ++PI; HasBranchToSelf = true; } else { DidChange = true; ReplaceUsesOfBlockWith(*PI, MBB, CurTBB, TII); } } // Change any jumptables to go to the new MBB. MBB->getParent()->getJumpTableInfo()->ReplaceMBBInJumpTables(MBB, CurTBB); if (DidChange) { ++NumBranchOpts; MadeChange = true; if (!HasBranchToSelf) return; } } // Add the branch back if the block is more than just an uncond branch. TII->InsertBranch(*MBB, CurTBB, 0, CurCond); } } }