recommit the patch that makes LSR and LowerInvoke use the TargetTransform interface.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@166264 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Nadav Rotem 2012-10-19 04:27:49 +00:00
parent 9aecdb51c7
commit 725f1d1280
6 changed files with 101 additions and 92 deletions

View File

@ -22,7 +22,7 @@
#include <set> #include <set>
namespace llvm { namespace llvm {
class TargetLowering; class ScalarTargetTransformInfo;
/// Return true if the given expression is safe to expand in the sense that /// Return true if the given expression is safe to expand in the sense that
/// all materialized values are safe to speculate. /// all materialized values are safe to speculate.
@ -129,7 +129,7 @@ namespace llvm {
/// representative. Return the number of phis eliminated. /// representative. Return the number of phis eliminated.
unsigned replaceCongruentIVs(Loop *L, const DominatorTree *DT, unsigned replaceCongruentIVs(Loop *L, const DominatorTree *DT,
SmallVectorImpl<WeakVH> &DeadInsts, SmallVectorImpl<WeakVH> &DeadInsts,
const TargetLowering *TLI = NULL); const ScalarTargetTransformInfo *STTI = NULL);
/// expandCodeFor - Insert code to directly compute the specified SCEV /// expandCodeFor - Insert code to directly compute the specified SCEV
/// expression into the program. The inserted code is inserted into the /// expression into the program. The inserted code is inserted into the

View File

@ -119,7 +119,7 @@ Pass *createLICMPass();
// optional parameter used to consult the target machine whether certain // optional parameter used to consult the target machine whether certain
// transformations are profitable. // transformations are profitable.
// //
Pass *createLoopStrengthReducePass(const TargetLowering *TLI = 0); Pass *createLoopStrengthReducePass();
Pass *createGlobalMergePass(const TargetLowering *TLI = 0); Pass *createGlobalMergePass(const TargetLowering *TLI = 0);
@ -249,9 +249,8 @@ extern char &LowerSwitchID;
// purpose "my LLVM-to-LLVM pass doesn't support the invoke instruction yet" // purpose "my LLVM-to-LLVM pass doesn't support the invoke instruction yet"
// lowering pass. // lowering pass.
// //
FunctionPass *createLowerInvokePass(const TargetLowering *TLI = 0); FunctionPass *createLowerInvokePass();
FunctionPass *createLowerInvokePass(const TargetLowering *TLI, FunctionPass *createLowerInvokePass(bool useExpensiveEHSupport);
bool useExpensiveEHSupport);
extern char &LowerInvokePassID; extern char &LowerInvokePassID;
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//

View File

@ -19,8 +19,8 @@
#include "llvm/LLVMContext.h" #include "llvm/LLVMContext.h"
#include "llvm/Support/Debug.h" #include "llvm/Support/Debug.h"
#include "llvm/DataLayout.h" #include "llvm/DataLayout.h"
#include "llvm/Target/TargetLowering.h"
#include "llvm/ADT/STLExtras.h" #include "llvm/ADT/STLExtras.h"
#include "llvm/TargetTransformInfo.h"
using namespace llvm; using namespace llvm;
@ -1599,15 +1599,15 @@ static bool width_descending(Value *lhs, Value *rhs) {
/// This does not depend on any SCEVExpander state but should be used in /// This does not depend on any SCEVExpander state but should be used in
/// the same context that SCEVExpander is used. /// the same context that SCEVExpander is used.
unsigned SCEVExpander::replaceCongruentIVs(Loop *L, const DominatorTree *DT, unsigned SCEVExpander::replaceCongruentIVs(Loop *L, const DominatorTree *DT,
SmallVectorImpl<WeakVH> &DeadInsts, SmallVectorImpl<WeakVH> &DeadInsts,
const TargetLowering *TLI) { const ScalarTargetTransformInfo *STTI) {
// Find integer phis in order of increasing width. // Find integer phis in order of increasing width.
SmallVector<PHINode*, 8> Phis; SmallVector<PHINode*, 8> Phis;
for (BasicBlock::iterator I = L->getHeader()->begin(); for (BasicBlock::iterator I = L->getHeader()->begin();
PHINode *Phi = dyn_cast<PHINode>(I); ++I) { PHINode *Phi = dyn_cast<PHINode>(I); ++I) {
Phis.push_back(Phi); Phis.push_back(Phi);
} }
if (TLI) if (STTI)
std::sort(Phis.begin(), Phis.end(), width_descending); std::sort(Phis.begin(), Phis.end(), width_descending);
unsigned NumElim = 0; unsigned NumElim = 0;
@ -1624,8 +1624,8 @@ unsigned SCEVExpander::replaceCongruentIVs(Loop *L, const DominatorTree *DT,
PHINode *&OrigPhiRef = ExprToIVMap[SE.getSCEV(Phi)]; PHINode *&OrigPhiRef = ExprToIVMap[SE.getSCEV(Phi)];
if (!OrigPhiRef) { if (!OrigPhiRef) {
OrigPhiRef = Phi; OrigPhiRef = Phi;
if (Phi->getType()->isIntegerTy() && TLI if (Phi->getType()->isIntegerTy() && STTI &&
&& TLI->isTruncateFree(Phi->getType(), Phis.back()->getType())) { STTI->isTruncateFree(Phi->getType(), Phis.back()->getType())) {
// This phi can be freely truncated to the narrowest phi type. Map the // This phi can be freely truncated to the narrowest phi type. Map the
// truncated expression to it so it will be reused for narrow types. // truncated expression to it so it will be reused for narrow types.
const SCEV *TruncExpr = const SCEV *TruncExpr =

View File

@ -359,7 +359,7 @@ void TargetPassConfig::addIRPasses() {
// Run loop strength reduction before anything else. // Run loop strength reduction before anything else.
if (getOptLevel() != CodeGenOpt::None && !DisableLSR) { if (getOptLevel() != CodeGenOpt::None && !DisableLSR) {
addPass(createLoopStrengthReducePass(getTargetLowering())); addPass(createLoopStrengthReducePass());
if (PrintLSR) if (PrintLSR)
addPass(createPrintFunctionPass("\n\n*** Code after LSR ***\n", &dbgs())); addPass(createPrintFunctionPass("\n\n*** Code after LSR ***\n", &dbgs()));
} }
@ -389,7 +389,7 @@ void TargetPassConfig::addPassesToHandleExceptions() {
addPass(createDwarfEHPass(TM)); addPass(createDwarfEHPass(TM));
break; break;
case ExceptionHandling::None: case ExceptionHandling::None:
addPass(createLowerInvokePass(TM->getTargetLowering())); addPass(createLowerInvokePass());
// The lower invoke pass may create unreachable code. Remove it. // The lower invoke pass may create unreachable code. Remove it.
addPass(createUnreachableBlockEliminationPass()); addPass(createUnreachableBlockEliminationPass());

View File

@ -37,7 +37,7 @@
// //
// TODO: Handle multiple loops at a time. // TODO: Handle multiple loops at a time.
// //
// TODO: Should TargetLowering::AddrMode::BaseGV be changed to a ConstantExpr // TODO: Should AddrMode::BaseGV be changed to a ConstantExpr
// instead of a GlobalValue? // instead of a GlobalValue?
// //
// TODO: When truncation is free, truncate ICmp users' operands to make it a // TODO: When truncation is free, truncate ICmp users' operands to make it a
@ -67,6 +67,7 @@
#include "llvm/Transforms/Scalar.h" #include "llvm/Transforms/Scalar.h"
#include "llvm/Transforms/Utils/BasicBlockUtils.h" #include "llvm/Transforms/Utils/BasicBlockUtils.h"
#include "llvm/Transforms/Utils/Local.h" #include "llvm/Transforms/Utils/Local.h"
#include "llvm/TargetTransformInfo.h"
#include "llvm/ADT/SmallBitVector.h" #include "llvm/ADT/SmallBitVector.h"
#include "llvm/ADT/SetVector.h" #include "llvm/ADT/SetVector.h"
#include "llvm/ADT/DenseSet.h" #include "llvm/ADT/DenseSet.h"
@ -74,7 +75,6 @@
#include "llvm/Support/CommandLine.h" #include "llvm/Support/CommandLine.h"
#include "llvm/Support/ValueHandle.h" #include "llvm/Support/ValueHandle.h"
#include "llvm/Support/raw_ostream.h" #include "llvm/Support/raw_ostream.h"
#include "llvm/Target/TargetLowering.h"
#include <algorithm> #include <algorithm>
using namespace llvm; using namespace llvm;
@ -1118,7 +1118,7 @@ public:
enum KindType { enum KindType {
Basic, ///< A normal use, with no folding. Basic, ///< A normal use, with no folding.
Special, ///< A special case of basic, allowing -1 scales. Special, ///< A special case of basic, allowing -1 scales.
Address, ///< An address use; folding according to TargetLowering Address, ///< An address use; folding according to ScalarTargetTransformInfo.
ICmpZero ///< An equality icmp with both operands folded into one. ICmpZero ///< An equality icmp with both operands folded into one.
// TODO: Add a generic icmp too? // TODO: Add a generic icmp too?
}; };
@ -1272,12 +1272,12 @@ void LSRUse::dump() const {
/// address-mode folding and special icmp tricks. /// address-mode folding and special icmp tricks.
static bool isLegalUse(const AddrMode &AM, static bool isLegalUse(const AddrMode &AM,
LSRUse::KindType Kind, Type *AccessTy, LSRUse::KindType Kind, Type *AccessTy,
const TargetLowering *TLI) { const ScalarTargetTransformInfo *STTI) {
switch (Kind) { switch (Kind) {
case LSRUse::Address: case LSRUse::Address:
// If we have low-level target information, ask the target if it can // If we have low-level target information, ask the target if it can
// completely fold this address. // completely fold this address.
if (TLI) return TLI->isLegalAddressingMode(AM, AccessTy); if (STTI) return STTI->isLegalAddressingMode(AM, AccessTy);
// Otherwise, just guess that reg+reg addressing is legal. // Otherwise, just guess that reg+reg addressing is legal.
return !AM.BaseGV && AM.BaseOffs == 0 && AM.Scale <= 1; return !AM.BaseGV && AM.BaseOffs == 0 && AM.Scale <= 1;
@ -1300,7 +1300,7 @@ static bool isLegalUse(const AddrMode &AM,
// If we have low-level target information, ask the target if it can fold an // If we have low-level target information, ask the target if it can fold an
// integer immediate on an icmp. // integer immediate on an icmp.
if (AM.BaseOffs != 0) { if (AM.BaseOffs != 0) {
if (!TLI) if (!STTI)
return false; return false;
// We have one of: // We have one of:
// ICmpZero BaseReg + Offset => ICmp BaseReg, -Offset // ICmpZero BaseReg + Offset => ICmp BaseReg, -Offset
@ -1309,7 +1309,7 @@ static bool isLegalUse(const AddrMode &AM,
int64_t Offs = AM.BaseOffs; int64_t Offs = AM.BaseOffs;
if (AM.Scale == 0) if (AM.Scale == 0)
Offs = -(uint64_t)Offs; // The cast does the right thing with INT64_MIN. Offs = -(uint64_t)Offs; // The cast does the right thing with INT64_MIN.
return TLI->isLegalICmpImmediate(Offs); return STTI->isLegalICmpImmediate(Offs);
} }
// ICmpZero BaseReg + -1*ScaleReg => ICmp BaseReg, ScaleReg // ICmpZero BaseReg + -1*ScaleReg => ICmp BaseReg, ScaleReg
@ -1330,20 +1330,20 @@ static bool isLegalUse(const AddrMode &AM,
static bool isLegalUse(AddrMode AM, static bool isLegalUse(AddrMode AM,
int64_t MinOffset, int64_t MaxOffset, int64_t MinOffset, int64_t MaxOffset,
LSRUse::KindType Kind, Type *AccessTy, LSRUse::KindType Kind, Type *AccessTy,
const TargetLowering *TLI) { const ScalarTargetTransformInfo *LTTI) {
// Check for overflow. // Check for overflow.
if (((int64_t)((uint64_t)AM.BaseOffs + MinOffset) > AM.BaseOffs) != if (((int64_t)((uint64_t)AM.BaseOffs + MinOffset) > AM.BaseOffs) !=
(MinOffset > 0)) (MinOffset > 0))
return false; return false;
AM.BaseOffs = (uint64_t)AM.BaseOffs + MinOffset; AM.BaseOffs = (uint64_t)AM.BaseOffs + MinOffset;
if (isLegalUse(AM, Kind, AccessTy, TLI)) { if (isLegalUse(AM, Kind, AccessTy, LTTI)) {
AM.BaseOffs = (uint64_t)AM.BaseOffs - MinOffset; AM.BaseOffs = (uint64_t)AM.BaseOffs - MinOffset;
// Check for overflow. // Check for overflow.
if (((int64_t)((uint64_t)AM.BaseOffs + MaxOffset) > AM.BaseOffs) != if (((int64_t)((uint64_t)AM.BaseOffs + MaxOffset) > AM.BaseOffs) !=
(MaxOffset > 0)) (MaxOffset > 0))
return false; return false;
AM.BaseOffs = (uint64_t)AM.BaseOffs + MaxOffset; AM.BaseOffs = (uint64_t)AM.BaseOffs + MaxOffset;
return isLegalUse(AM, Kind, AccessTy, TLI); return isLegalUse(AM, Kind, AccessTy, LTTI);
} }
return false; return false;
} }
@ -1352,7 +1352,7 @@ static bool isAlwaysFoldable(int64_t BaseOffs,
GlobalValue *BaseGV, GlobalValue *BaseGV,
bool HasBaseReg, bool HasBaseReg,
LSRUse::KindType Kind, Type *AccessTy, LSRUse::KindType Kind, Type *AccessTy,
const TargetLowering *TLI) { const ScalarTargetTransformInfo *LTTI) {
// Fast-path: zero is always foldable. // Fast-path: zero is always foldable.
if (BaseOffs == 0 && !BaseGV) return true; if (BaseOffs == 0 && !BaseGV) return true;
@ -1371,14 +1371,14 @@ static bool isAlwaysFoldable(int64_t BaseOffs,
AM.HasBaseReg = true; AM.HasBaseReg = true;
} }
return isLegalUse(AM, Kind, AccessTy, TLI); return isLegalUse(AM, Kind, AccessTy, LTTI);
} }
static bool isAlwaysFoldable(const SCEV *S, static bool isAlwaysFoldable(const SCEV *S,
int64_t MinOffset, int64_t MaxOffset, int64_t MinOffset, int64_t MaxOffset,
bool HasBaseReg, bool HasBaseReg,
LSRUse::KindType Kind, Type *AccessTy, LSRUse::KindType Kind, Type *AccessTy,
const TargetLowering *TLI, const ScalarTargetTransformInfo *LTTI,
ScalarEvolution &SE) { ScalarEvolution &SE) {
// Fast-path: zero is always foldable. // Fast-path: zero is always foldable.
if (S->isZero()) return true; if (S->isZero()) return true;
@ -1402,7 +1402,7 @@ static bool isAlwaysFoldable(const SCEV *S,
AM.HasBaseReg = HasBaseReg; AM.HasBaseReg = HasBaseReg;
AM.Scale = Kind == LSRUse::ICmpZero ? -1 : 1; AM.Scale = Kind == LSRUse::ICmpZero ? -1 : 1;
return isLegalUse(AM, MinOffset, MaxOffset, Kind, AccessTy, TLI); return isLegalUse(AM, MinOffset, MaxOffset, Kind, AccessTy, LTTI);
} }
namespace { namespace {
@ -1502,7 +1502,7 @@ class LSRInstance {
ScalarEvolution &SE; ScalarEvolution &SE;
DominatorTree &DT; DominatorTree &DT;
LoopInfo &LI; LoopInfo &LI;
const TargetLowering *const TLI; const ScalarTargetTransformInfo *const STTI;
Loop *const L; Loop *const L;
bool Changed; bool Changed;
@ -1638,7 +1638,7 @@ class LSRInstance {
Pass *P); Pass *P);
public: public:
LSRInstance(const TargetLowering *tli, Loop *l, Pass *P); LSRInstance(const ScalarTargetTransformInfo *ltti, Loop *l, Pass *P);
bool getChanged() const { return Changed; } bool getChanged() const { return Changed; }
@ -1688,11 +1688,10 @@ void LSRInstance::OptimizeShadowIV() {
} }
if (!DestTy) continue; if (!DestTy) continue;
if (TLI) { if (STTI) {
// If target does not support DestTy natively then do not apply // If target does not support DestTy natively then do not apply
// this transformation. // this transformation.
EVT DVT = TLI->getValueType(DestTy); if (!STTI->isTypeLegal(DestTy)) continue;
if (!TLI->isTypeLegal(DVT)) continue;
} }
PHINode *PH = dyn_cast<PHINode>(ShadowUse->getOperand(0)); PHINode *PH = dyn_cast<PHINode>(ShadowUse->getOperand(0));
@ -2015,18 +2014,18 @@ LSRInstance::OptimizeLoopTermCond() {
if (C->getValue().getMinSignedBits() >= 64 || if (C->getValue().getMinSignedBits() >= 64 ||
C->getValue().isMinSignedValue()) C->getValue().isMinSignedValue())
goto decline_post_inc; goto decline_post_inc;
// Without TLI, assume that any stride might be valid, and so any // Without STTI, assume that any stride might be valid, and so any
// use might be shared. // use might be shared.
if (!TLI) if (!STTI)
goto decline_post_inc; goto decline_post_inc;
// Check for possible scaled-address reuse. // Check for possible scaled-address reuse.
Type *AccessTy = getAccessType(UI->getUser()); Type *AccessTy = getAccessType(UI->getUser());
AddrMode AM; AddrMode AM;
AM.Scale = C->getSExtValue(); AM.Scale = C->getSExtValue();
if (TLI->isLegalAddressingMode(AM, AccessTy)) if (STTI->isLegalAddressingMode(AM, AccessTy))
goto decline_post_inc; goto decline_post_inc;
AM.Scale = -AM.Scale; AM.Scale = -AM.Scale;
if (TLI->isLegalAddressingMode(AM, AccessTy)) if (STTI->isLegalAddressingMode(AM, AccessTy))
goto decline_post_inc; goto decline_post_inc;
} }
} }
@ -2097,12 +2096,12 @@ LSRInstance::reconcileNewOffset(LSRUse &LU, int64_t NewOffset, bool HasBaseReg,
// Conservatively assume HasBaseReg is true for now. // Conservatively assume HasBaseReg is true for now.
if (NewOffset < LU.MinOffset) { if (NewOffset < LU.MinOffset) {
if (!isAlwaysFoldable(LU.MaxOffset - NewOffset, 0, HasBaseReg, if (!isAlwaysFoldable(LU.MaxOffset - NewOffset, 0, HasBaseReg,
Kind, AccessTy, TLI)) Kind, AccessTy, STTI))
return false; return false;
NewMinOffset = NewOffset; NewMinOffset = NewOffset;
} else if (NewOffset > LU.MaxOffset) { } else if (NewOffset > LU.MaxOffset) {
if (!isAlwaysFoldable(NewOffset - LU.MinOffset, 0, HasBaseReg, if (!isAlwaysFoldable(NewOffset - LU.MinOffset, 0, HasBaseReg,
Kind, AccessTy, TLI)) Kind, AccessTy, STTI))
return false; return false;
NewMaxOffset = NewOffset; NewMaxOffset = NewOffset;
} }
@ -2131,7 +2130,7 @@ LSRInstance::getUse(const SCEV *&Expr,
int64_t Offset = ExtractImmediate(Expr, SE); int64_t Offset = ExtractImmediate(Expr, SE);
// Basic uses can't accept any offset, for example. // Basic uses can't accept any offset, for example.
if (!isAlwaysFoldable(Offset, 0, /*HasBaseReg=*/true, Kind, AccessTy, TLI)) { if (!isAlwaysFoldable(Offset, 0, /*HasBaseReg=*/true, Kind, AccessTy, STTI)) {
Expr = Copy; Expr = Copy;
Offset = 0; Offset = 0;
} }
@ -2396,7 +2395,7 @@ bool IVChain::isProfitableIncrement(const SCEV *OperExpr,
/// TODO: Consider IVInc free if it's already used in another chains. /// TODO: Consider IVInc free if it's already used in another chains.
static bool static bool
isProfitableChain(IVChain &Chain, SmallPtrSet<Instruction*, 4> &Users, isProfitableChain(IVChain &Chain, SmallPtrSet<Instruction*, 4> &Users,
ScalarEvolution &SE, const TargetLowering *TLI) { ScalarEvolution &SE, const ScalarTargetTransformInfo *STTI) {
if (StressIVChain) if (StressIVChain)
return true; return true;
@ -2654,7 +2653,7 @@ void LSRInstance::CollectChains() {
for (unsigned UsersIdx = 0, NChains = IVChainVec.size(); for (unsigned UsersIdx = 0, NChains = IVChainVec.size();
UsersIdx < NChains; ++UsersIdx) { UsersIdx < NChains; ++UsersIdx) {
if (!isProfitableChain(IVChainVec[UsersIdx], if (!isProfitableChain(IVChainVec[UsersIdx],
ChainUsersVec[UsersIdx].FarUsers, SE, TLI)) ChainUsersVec[UsersIdx].FarUsers, SE, STTI))
continue; continue;
// Preserve the chain at UsesIdx. // Preserve the chain at UsesIdx.
if (ChainIdx != UsersIdx) if (ChainIdx != UsersIdx)
@ -2681,7 +2680,8 @@ void LSRInstance::FinalizeChain(IVChain &Chain) {
/// Return true if the IVInc can be folded into an addressing mode. /// Return true if the IVInc can be folded into an addressing mode.
static bool canFoldIVIncExpr(const SCEV *IncExpr, Instruction *UserInst, static bool canFoldIVIncExpr(const SCEV *IncExpr, Instruction *UserInst,
Value *Operand, const TargetLowering *TLI) { Value *Operand,
const ScalarTargetTransformInfo *STTI) {
const SCEVConstant *IncConst = dyn_cast<SCEVConstant>(IncExpr); const SCEVConstant *IncConst = dyn_cast<SCEVConstant>(IncExpr);
if (!IncConst || !isAddressUse(UserInst, Operand)) if (!IncConst || !isAddressUse(UserInst, Operand))
return false; return false;
@ -2691,7 +2691,7 @@ static bool canFoldIVIncExpr(const SCEV *IncExpr, Instruction *UserInst,
int64_t IncOffset = IncConst->getValue()->getSExtValue(); int64_t IncOffset = IncConst->getValue()->getSExtValue();
if (!isAlwaysFoldable(IncOffset, /*BaseGV=*/0, /*HaseBaseReg=*/false, if (!isAlwaysFoldable(IncOffset, /*BaseGV=*/0, /*HaseBaseReg=*/false,
LSRUse::Address, getAccessType(UserInst), TLI)) LSRUse::Address, getAccessType(UserInst), STTI))
return false; return false;
return true; return true;
@ -2762,7 +2762,7 @@ void LSRInstance::GenerateIVChain(const IVChain &Chain, SCEVExpander &Rewriter,
// If an IV increment can't be folded, use it as the next IV value. // If an IV increment can't be folded, use it as the next IV value.
if (!canFoldIVIncExpr(LeftOverExpr, IncI->UserInst, IncI->IVOperand, if (!canFoldIVIncExpr(LeftOverExpr, IncI->UserInst, IncI->IVOperand,
TLI)) { STTI)) {
assert(IVTy == IVOper->getType() && "inconsistent IV increment type"); assert(IVTy == IVOper->getType() && "inconsistent IV increment type");
IVSrc = IVOper; IVSrc = IVOper;
LeftOverExpr = 0; LeftOverExpr = 0;
@ -3108,7 +3108,7 @@ void LSRInstance::GenerateReassociations(LSRUse &LU, unsigned LUIdx,
// into an immediate field. // into an immediate field.
if (isAlwaysFoldable(*J, LU.MinOffset, LU.MaxOffset, if (isAlwaysFoldable(*J, LU.MinOffset, LU.MaxOffset,
Base.getNumRegs() > 1, Base.getNumRegs() > 1,
LU.Kind, LU.AccessTy, TLI, SE)) LU.Kind, LU.AccessTy, STTI, SE))
continue; continue;
// Collect all operands except *J. // Collect all operands except *J.
@ -3122,7 +3122,7 @@ void LSRInstance::GenerateReassociations(LSRUse &LU, unsigned LUIdx,
if (InnerAddOps.size() == 1 && if (InnerAddOps.size() == 1 &&
isAlwaysFoldable(InnerAddOps[0], LU.MinOffset, LU.MaxOffset, isAlwaysFoldable(InnerAddOps[0], LU.MinOffset, LU.MaxOffset,
Base.getNumRegs() > 1, Base.getNumRegs() > 1,
LU.Kind, LU.AccessTy, TLI, SE)) LU.Kind, LU.AccessTy, STTI, SE))
continue; continue;
const SCEV *InnerSum = SE.getAddExpr(InnerAddOps); const SCEV *InnerSum = SE.getAddExpr(InnerAddOps);
@ -3132,9 +3132,9 @@ void LSRInstance::GenerateReassociations(LSRUse &LU, unsigned LUIdx,
// Add the remaining pieces of the add back into the new formula. // Add the remaining pieces of the add back into the new formula.
const SCEVConstant *InnerSumSC = dyn_cast<SCEVConstant>(InnerSum); const SCEVConstant *InnerSumSC = dyn_cast<SCEVConstant>(InnerSum);
if (TLI && InnerSumSC && if (STTI && InnerSumSC &&
SE.getTypeSizeInBits(InnerSumSC->getType()) <= 64 && SE.getTypeSizeInBits(InnerSumSC->getType()) <= 64 &&
TLI->isLegalAddImmediate((uint64_t)F.UnfoldedOffset + STTI->isLegalAddImmediate((uint64_t)F.UnfoldedOffset +
InnerSumSC->getValue()->getZExtValue())) { InnerSumSC->getValue()->getZExtValue())) {
F.UnfoldedOffset = (uint64_t)F.UnfoldedOffset + F.UnfoldedOffset = (uint64_t)F.UnfoldedOffset +
InnerSumSC->getValue()->getZExtValue(); InnerSumSC->getValue()->getZExtValue();
@ -3144,8 +3144,8 @@ void LSRInstance::GenerateReassociations(LSRUse &LU, unsigned LUIdx,
// Add J as its own register, or an unfolded immediate. // Add J as its own register, or an unfolded immediate.
const SCEVConstant *SC = dyn_cast<SCEVConstant>(*J); const SCEVConstant *SC = dyn_cast<SCEVConstant>(*J);
if (TLI && SC && SE.getTypeSizeInBits(SC->getType()) <= 64 && if (STTI && SC && SE.getTypeSizeInBits(SC->getType()) <= 64 &&
TLI->isLegalAddImmediate((uint64_t)F.UnfoldedOffset + STTI->isLegalAddImmediate((uint64_t)F.UnfoldedOffset +
SC->getValue()->getZExtValue())) SC->getValue()->getZExtValue()))
F.UnfoldedOffset = (uint64_t)F.UnfoldedOffset + F.UnfoldedOffset = (uint64_t)F.UnfoldedOffset +
SC->getValue()->getZExtValue(); SC->getValue()->getZExtValue();
@ -3205,7 +3205,7 @@ void LSRInstance::GenerateSymbolicOffsets(LSRUse &LU, unsigned LUIdx,
Formula F = Base; Formula F = Base;
F.AM.BaseGV = GV; F.AM.BaseGV = GV;
if (!isLegalUse(F.AM, LU.MinOffset, LU.MaxOffset, if (!isLegalUse(F.AM, LU.MinOffset, LU.MaxOffset,
LU.Kind, LU.AccessTy, TLI)) LU.Kind, LU.AccessTy, STTI))
continue; continue;
F.BaseRegs[i] = G; F.BaseRegs[i] = G;
(void)InsertFormula(LU, LUIdx, F); (void)InsertFormula(LU, LUIdx, F);
@ -3230,7 +3230,7 @@ void LSRInstance::GenerateConstantOffsets(LSRUse &LU, unsigned LUIdx,
Formula F = Base; Formula F = Base;
F.AM.BaseOffs = (uint64_t)Base.AM.BaseOffs - *I; F.AM.BaseOffs = (uint64_t)Base.AM.BaseOffs - *I;
if (isLegalUse(F.AM, LU.MinOffset - *I, LU.MaxOffset - *I, if (isLegalUse(F.AM, LU.MinOffset - *I, LU.MaxOffset - *I,
LU.Kind, LU.AccessTy, TLI)) { LU.Kind, LU.AccessTy, STTI)) {
// Add the offset to the base register. // Add the offset to the base register.
const SCEV *NewG = SE.getAddExpr(SE.getConstant(G->getType(), *I), G); const SCEV *NewG = SE.getAddExpr(SE.getConstant(G->getType(), *I), G);
// If it cancelled out, drop the base register, otherwise update it. // If it cancelled out, drop the base register, otherwise update it.
@ -3250,7 +3250,7 @@ void LSRInstance::GenerateConstantOffsets(LSRUse &LU, unsigned LUIdx,
Formula F = Base; Formula F = Base;
F.AM.BaseOffs = (uint64_t)F.AM.BaseOffs + Imm; F.AM.BaseOffs = (uint64_t)F.AM.BaseOffs + Imm;
if (!isLegalUse(F.AM, LU.MinOffset, LU.MaxOffset, if (!isLegalUse(F.AM, LU.MinOffset, LU.MaxOffset,
LU.Kind, LU.AccessTy, TLI)) LU.Kind, LU.AccessTy, STTI))
continue; continue;
F.BaseRegs[i] = G; F.BaseRegs[i] = G;
(void)InsertFormula(LU, LUIdx, F); (void)InsertFormula(LU, LUIdx, F);
@ -3297,7 +3297,7 @@ void LSRInstance::GenerateICmpZeroScales(LSRUse &LU, unsigned LUIdx,
F.AM.BaseOffs = NewBaseOffs; F.AM.BaseOffs = NewBaseOffs;
// Check that this scale is legal. // Check that this scale is legal.
if (!isLegalUse(F.AM, Offset, Offset, LU.Kind, LU.AccessTy, TLI)) if (!isLegalUse(F.AM, Offset, Offset, LU.Kind, LU.AccessTy, STTI))
continue; continue;
// Compensate for the use having MinOffset built into it. // Compensate for the use having MinOffset built into it.
@ -3353,12 +3353,12 @@ void LSRInstance::GenerateScales(LSRUse &LU, unsigned LUIdx, Formula Base) {
Base.AM.HasBaseReg = Base.BaseRegs.size() > 1; Base.AM.HasBaseReg = Base.BaseRegs.size() > 1;
// Check whether this scale is going to be legal. // Check whether this scale is going to be legal.
if (!isLegalUse(Base.AM, LU.MinOffset, LU.MaxOffset, if (!isLegalUse(Base.AM, LU.MinOffset, LU.MaxOffset,
LU.Kind, LU.AccessTy, TLI)) { LU.Kind, LU.AccessTy, STTI)) {
// As a special-case, handle special out-of-loop Basic users specially. // As a special-case, handle special out-of-loop Basic users specially.
// TODO: Reconsider this special case. // TODO: Reconsider this special case.
if (LU.Kind == LSRUse::Basic && if (LU.Kind == LSRUse::Basic &&
isLegalUse(Base.AM, LU.MinOffset, LU.MaxOffset, isLegalUse(Base.AM, LU.MinOffset, LU.MaxOffset,
LSRUse::Special, LU.AccessTy, TLI) && LSRUse::Special, LU.AccessTy, STTI) &&
LU.AllFixupsOutsideLoop) LU.AllFixupsOutsideLoop)
LU.Kind = LSRUse::Special; LU.Kind = LSRUse::Special;
else else
@ -3391,8 +3391,8 @@ void LSRInstance::GenerateScales(LSRUse &LU, unsigned LUIdx, Formula Base) {
/// GenerateTruncates - Generate reuse formulae from different IV types. /// GenerateTruncates - Generate reuse formulae from different IV types.
void LSRInstance::GenerateTruncates(LSRUse &LU, unsigned LUIdx, Formula Base) { void LSRInstance::GenerateTruncates(LSRUse &LU, unsigned LUIdx, Formula Base) {
// This requires TargetLowering to tell us which truncates are free. // This requires ScalarTargetTransformInfo to tell us which truncates are free.
if (!TLI) return; if (!STTI) return;
// Don't bother truncating symbolic values. // Don't bother truncating symbolic values.
if (Base.AM.BaseGV) return; if (Base.AM.BaseGV) return;
@ -3405,7 +3405,7 @@ void LSRInstance::GenerateTruncates(LSRUse &LU, unsigned LUIdx, Formula Base) {
for (SmallSetVector<Type *, 4>::const_iterator for (SmallSetVector<Type *, 4>::const_iterator
I = Types.begin(), E = Types.end(); I != E; ++I) { I = Types.begin(), E = Types.end(); I != E; ++I) {
Type *SrcTy = *I; Type *SrcTy = *I;
if (SrcTy != DstTy && TLI->isTruncateFree(SrcTy, DstTy)) { if (SrcTy != DstTy && STTI->isTruncateFree(SrcTy, DstTy)) {
Formula F = Base; Formula F = Base;
if (F.ScaledReg) F.ScaledReg = SE.getAnyExtendExpr(F.ScaledReg, *I); if (F.ScaledReg) F.ScaledReg = SE.getAnyExtendExpr(F.ScaledReg, *I);
@ -3561,7 +3561,7 @@ void LSRInstance::GenerateCrossUseConstantOffsets() {
Formula NewF = F; Formula NewF = F;
NewF.AM.BaseOffs = Offs; NewF.AM.BaseOffs = Offs;
if (!isLegalUse(NewF.AM, LU.MinOffset, LU.MaxOffset, if (!isLegalUse(NewF.AM, LU.MinOffset, LU.MaxOffset,
LU.Kind, LU.AccessTy, TLI)) LU.Kind, LU.AccessTy, STTI))
continue; continue;
NewF.ScaledReg = SE.getAddExpr(NegImmS, NewF.ScaledReg); NewF.ScaledReg = SE.getAddExpr(NegImmS, NewF.ScaledReg);
@ -3586,9 +3586,9 @@ void LSRInstance::GenerateCrossUseConstantOffsets() {
Formula NewF = F; Formula NewF = F;
NewF.AM.BaseOffs = (uint64_t)NewF.AM.BaseOffs + Imm; NewF.AM.BaseOffs = (uint64_t)NewF.AM.BaseOffs + Imm;
if (!isLegalUse(NewF.AM, LU.MinOffset, LU.MaxOffset, if (!isLegalUse(NewF.AM, LU.MinOffset, LU.MaxOffset,
LU.Kind, LU.AccessTy, TLI)) { LU.Kind, LU.AccessTy, STTI)) {
if (!TLI || if (!STTI ||
!TLI->isLegalAddImmediate((uint64_t)NewF.UnfoldedOffset + Imm)) !STTI->isLegalAddImmediate((uint64_t)NewF.UnfoldedOffset + Imm))
continue; continue;
NewF = F; NewF = F;
NewF.UnfoldedOffset = (uint64_t)NewF.UnfoldedOffset + Imm; NewF.UnfoldedOffset = (uint64_t)NewF.UnfoldedOffset + Imm;
@ -3900,7 +3900,7 @@ void LSRInstance::NarrowSearchSpaceByCollapsingUnrolledCode() {
Formula &F = LUThatHas->Formulae[i]; Formula &F = LUThatHas->Formulae[i];
if (!isLegalUse(F.AM, if (!isLegalUse(F.AM,
LUThatHas->MinOffset, LUThatHas->MaxOffset, LUThatHas->MinOffset, LUThatHas->MaxOffset,
LUThatHas->Kind, LUThatHas->AccessTy, TLI)) { LUThatHas->Kind, LUThatHas->AccessTy, STTI)) {
DEBUG(dbgs() << " Deleting "; F.print(dbgs()); DEBUG(dbgs() << " Deleting "; F.print(dbgs());
dbgs() << '\n'); dbgs() << '\n');
LUThatHas->DeleteFormula(F); LUThatHas->DeleteFormula(F);
@ -4589,12 +4589,12 @@ LSRInstance::ImplementSolution(const SmallVectorImpl<const Formula *> &Solution,
Changed |= DeleteTriviallyDeadInstructions(DeadInsts); Changed |= DeleteTriviallyDeadInstructions(DeadInsts);
} }
LSRInstance::LSRInstance(const TargetLowering *tli, Loop *l, Pass *P) LSRInstance::LSRInstance(const ScalarTargetTransformInfo *stti, Loop *l, Pass *P)
: IU(P->getAnalysis<IVUsers>()), : IU(P->getAnalysis<IVUsers>()),
SE(P->getAnalysis<ScalarEvolution>()), SE(P->getAnalysis<ScalarEvolution>()),
DT(P->getAnalysis<DominatorTree>()), DT(P->getAnalysis<DominatorTree>()),
LI(P->getAnalysis<LoopInfo>()), LI(P->getAnalysis<LoopInfo>()),
TLI(tli), L(l), Changed(false), IVIncInsertPos(0) { STTI(stti), L(l), Changed(false), IVIncInsertPos(0) {
// If LoopSimplify form is not available, stay out of trouble. // If LoopSimplify form is not available, stay out of trouble.
if (!L->isLoopSimplifyForm()) if (!L->isLoopSimplifyForm())
@ -4684,7 +4684,7 @@ LSRInstance::LSRInstance(const TargetLowering *tli, Loop *l, Pass *P)
for (SmallVectorImpl<Formula>::const_iterator J = LU.Formulae.begin(), for (SmallVectorImpl<Formula>::const_iterator J = LU.Formulae.begin(),
JE = LU.Formulae.end(); J != JE; ++J) JE = LU.Formulae.end(); J != JE; ++J)
assert(isLegalUse(J->AM, LU.MinOffset, LU.MaxOffset, assert(isLegalUse(J->AM, LU.MinOffset, LU.MaxOffset,
LU.Kind, LU.AccessTy, TLI) && LU.Kind, LU.AccessTy, STTI) &&
"Illegal formula generated!"); "Illegal formula generated!");
}; };
#endif #endif
@ -4757,13 +4757,13 @@ void LSRInstance::dump() const {
namespace { namespace {
class LoopStrengthReduce : public LoopPass { class LoopStrengthReduce : public LoopPass {
/// TLI - Keep a pointer of a TargetLowering to consult for determining /// ScalarTargetTransformInfo provides target information that is needed
/// transformation profitability. /// for strength reducing loops.
const TargetLowering *const TLI; const ScalarTargetTransformInfo *STTI;
public: public:
static char ID; // Pass ID, replacement for typeid static char ID; // Pass ID, replacement for typeid
explicit LoopStrengthReduce(const TargetLowering *tli = 0); LoopStrengthReduce();
private: private:
bool runOnLoop(Loop *L, LPPassManager &LPM); bool runOnLoop(Loop *L, LPPassManager &LPM);
@ -4783,13 +4783,12 @@ INITIALIZE_PASS_DEPENDENCY(LoopSimplify)
INITIALIZE_PASS_END(LoopStrengthReduce, "loop-reduce", INITIALIZE_PASS_END(LoopStrengthReduce, "loop-reduce",
"Loop Strength Reduction", false, false) "Loop Strength Reduction", false, false)
Pass *llvm::createLoopStrengthReducePass() {
Pass *llvm::createLoopStrengthReducePass(const TargetLowering *TLI) { return new LoopStrengthReduce();
return new LoopStrengthReduce(TLI);
} }
LoopStrengthReduce::LoopStrengthReduce(const TargetLowering *tli) LoopStrengthReduce::LoopStrengthReduce()
: LoopPass(ID), TLI(tli) { : LoopPass(ID), STTI(0) {
initializeLoopStrengthReducePass(*PassRegistry::getPassRegistry()); initializeLoopStrengthReducePass(*PassRegistry::getPassRegistry());
} }
@ -4815,8 +4814,13 @@ void LoopStrengthReduce::getAnalysisUsage(AnalysisUsage &AU) const {
bool LoopStrengthReduce::runOnLoop(Loop *L, LPPassManager & /*LPM*/) { bool LoopStrengthReduce::runOnLoop(Loop *L, LPPassManager & /*LPM*/) {
bool Changed = false; bool Changed = false;
TargetTransformInfo *TTI = getAnalysisIfAvailable<TargetTransformInfo>();
if (TTI)
STTI = TTI->getScalarTargetTransformInfo();
// Run the main LSR transformation. // Run the main LSR transformation.
Changed |= LSRInstance(TLI, L, this).getChanged(); Changed |= LSRInstance(STTI, L, this).getChanged();
// Remove any extra phis created by processing inner loops. // Remove any extra phis created by processing inner loops.
Changed |= DeleteDeadPHIs(L->getHeader()); Changed |= DeleteDeadPHIs(L->getHeader());
@ -4827,7 +4831,7 @@ bool LoopStrengthReduce::runOnLoop(Loop *L, LPPassManager & /*LPM*/) {
Rewriter.setDebugType(DEBUG_TYPE); Rewriter.setDebugType(DEBUG_TYPE);
#endif #endif
unsigned numFolded = Rewriter. unsigned numFolded = Rewriter.
replaceCongruentIVs(L, &getAnalysis<DominatorTree>(), DeadInsts, TLI); replaceCongruentIVs(L, &getAnalysis<DominatorTree>(), DeadInsts, STTI);
if (numFolded) { if (numFolded) {
Changed = true; Changed = true;
DeleteTriviallyDeadInstructions(DeadInsts); DeleteTriviallyDeadInstructions(DeadInsts);

View File

@ -45,10 +45,10 @@
#include "llvm/Pass.h" #include "llvm/Pass.h"
#include "llvm/Transforms/Utils/BasicBlockUtils.h" #include "llvm/Transforms/Utils/BasicBlockUtils.h"
#include "llvm/Transforms/Utils/Local.h" #include "llvm/Transforms/Utils/Local.h"
#include "llvm/TargetTransformInfo.h"
#include "llvm/ADT/SmallVector.h" #include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/Statistic.h" #include "llvm/ADT/Statistic.h"
#include "llvm/Support/CommandLine.h" #include "llvm/Support/CommandLine.h"
#include "llvm/Target/TargetLowering.h"
#include <csetjmp> #include <csetjmp>
#include <set> #include <set>
using namespace llvm; using namespace llvm;
@ -70,15 +70,14 @@ namespace {
Constant *SetJmpFn, *LongJmpFn, *StackSaveFn, *StackRestoreFn; Constant *SetJmpFn, *LongJmpFn, *StackSaveFn, *StackRestoreFn;
bool useExpensiveEHSupport; bool useExpensiveEHSupport;
// We peek in TLI to grab the target's jmp_buf size and alignment // We peek in STTI to grab the target's jmp_buf size and alignment
const TargetLowering *TLI; const ScalarTargetTransformInfo *STTI;
public: public:
static char ID; // Pass identification, replacement for typeid static char ID; // Pass identification, replacement for typeid
explicit LowerInvoke(const TargetLowering *tli = NULL, explicit LowerInvoke(bool useExpensiveEHSupport = ExpensiveEHSupport)
bool useExpensiveEHSupport = ExpensiveEHSupport)
: FunctionPass(ID), useExpensiveEHSupport(useExpensiveEHSupport), : FunctionPass(ID), useExpensiveEHSupport(useExpensiveEHSupport),
TLI(tli) { STTI(0) {
initializeLowerInvokePass(*PassRegistry::getPassRegistry()); initializeLowerInvokePass(*PassRegistry::getPassRegistry());
} }
bool doInitialization(Module &M); bool doInitialization(Module &M);
@ -108,21 +107,24 @@ INITIALIZE_PASS(LowerInvoke, "lowerinvoke",
char &llvm::LowerInvokePassID = LowerInvoke::ID; char &llvm::LowerInvokePassID = LowerInvoke::ID;
// Public Interface To the LowerInvoke pass. // Public Interface To the LowerInvoke pass.
FunctionPass *llvm::createLowerInvokePass(const TargetLowering *TLI) { FunctionPass *llvm::createLowerInvokePass() {
return new LowerInvoke(TLI, ExpensiveEHSupport); return new LowerInvoke(ExpensiveEHSupport);
} }
FunctionPass *llvm::createLowerInvokePass(const TargetLowering *TLI, FunctionPass *llvm::createLowerInvokePass(bool useExpensiveEHSupport) {
bool useExpensiveEHSupport) { return new LowerInvoke(useExpensiveEHSupport);
return new LowerInvoke(TLI, useExpensiveEHSupport);
} }
// doInitialization - Make sure that there is a prototype for abort in the // doInitialization - Make sure that there is a prototype for abort in the
// current module. // current module.
bool LowerInvoke::doInitialization(Module &M) { bool LowerInvoke::doInitialization(Module &M) {
TargetTransformInfo *TTI = getAnalysisIfAvailable<TargetTransformInfo>();
if (TTI)
STTI = TTI->getScalarTargetTransformInfo();
Type *VoidPtrTy = Type::getInt8PtrTy(M.getContext()); Type *VoidPtrTy = Type::getInt8PtrTy(M.getContext());
if (useExpensiveEHSupport) { if (useExpensiveEHSupport) {
// Insert a type for the linked list of jump buffers. // Insert a type for the linked list of jump buffers.
unsigned JBSize = TLI ? TLI->getJumpBufSize() : 0; unsigned JBSize = STTI ? STTI->getJumpBufSize() : 0;
JBSize = JBSize ? JBSize : 200; JBSize = JBSize ? JBSize : 200;
Type *JmpBufTy = ArrayType::get(VoidPtrTy, JBSize); Type *JmpBufTy = ArrayType::get(VoidPtrTy, JBSize);
@ -430,7 +432,7 @@ bool LowerInvoke::insertExpensiveEHSupport(Function &F) {
// Create an alloca for the incoming jump buffer ptr and the new jump buffer // Create an alloca for the incoming jump buffer ptr and the new jump buffer
// that needs to be restored on all exits from the function. This is an // that needs to be restored on all exits from the function. This is an
// alloca because the value needs to be live across invokes. // alloca because the value needs to be live across invokes.
unsigned Align = TLI ? TLI->getJumpBufAlignment() : 0; unsigned Align = STTI ? STTI->getJumpBufAlignment() : 0;
AllocaInst *JmpBuf = AllocaInst *JmpBuf =
new AllocaInst(JBLinkTy, 0, Align, new AllocaInst(JBLinkTy, 0, Align,
"jblink", F.begin()->begin()); "jblink", F.begin()->begin());
@ -575,6 +577,10 @@ bool LowerInvoke::insertExpensiveEHSupport(Function &F) {
} }
bool LowerInvoke::runOnFunction(Function &F) { bool LowerInvoke::runOnFunction(Function &F) {
TargetTransformInfo *TTI = getAnalysisIfAvailable<TargetTransformInfo>();
if (TTI)
STTI = TTI->getScalarTargetTransformInfo();
if (useExpensiveEHSupport) if (useExpensiveEHSupport)
return insertExpensiveEHSupport(F); return insertExpensiveEHSupport(F);
else else