mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-10-25 10:27:04 +00:00 
			
		
		
		
	Remove LoopDependenceAnalysis.
It was unmaintained and not much more than a stub. The new DependenceAnalysis pass is both more general and complete. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@166810 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
		| @@ -77,6 +77,7 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print "  <p>\n" if ! | |||||||
| <tr><td><a href="#basicaa">-basicaa</a></td><td>Basic Alias Analysis (stateless AA impl)</td></tr> | <tr><td><a href="#basicaa">-basicaa</a></td><td>Basic Alias Analysis (stateless AA impl)</td></tr> | ||||||
| <tr><td><a href="#basiccg">-basiccg</a></td><td>Basic CallGraph Construction</td></tr> | <tr><td><a href="#basiccg">-basiccg</a></td><td>Basic CallGraph Construction</td></tr> | ||||||
| <tr><td><a href="#count-aa">-count-aa</a></td><td>Count Alias Analysis Query Responses</td></tr> | <tr><td><a href="#count-aa">-count-aa</a></td><td>Count Alias Analysis Query Responses</td></tr> | ||||||
|  | <tr><td><a href="#da">-da</a></td><td>Dependence Analysis</td></tr> | ||||||
| <tr><td><a href="#debug-aa">-debug-aa</a></td><td>AA use debugger</td></tr> | <tr><td><a href="#debug-aa">-debug-aa</a></td><td>AA use debugger</td></tr> | ||||||
| <tr><td><a href="#domfrontier">-domfrontier</a></td><td>Dominance Frontier Construction</td></tr> | <tr><td><a href="#domfrontier">-domfrontier</a></td><td>Dominance Frontier Construction</td></tr> | ||||||
| <tr><td><a href="#domtree">-domtree</a></td><td>Dominator Tree Construction</td></tr> | <tr><td><a href="#domtree">-domtree</a></td><td>Dominator Tree Construction</td></tr> | ||||||
| @@ -92,7 +93,6 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print "  <p>\n" if ! | |||||||
| <tr><td><a href="#intervals">-intervals</a></td><td>Interval Partition Construction</td></tr> | <tr><td><a href="#intervals">-intervals</a></td><td>Interval Partition Construction</td></tr> | ||||||
| <tr><td><a href="#iv-users">-iv-users</a></td><td>Induction Variable Users</td></tr> | <tr><td><a href="#iv-users">-iv-users</a></td><td>Induction Variable Users</td></tr> | ||||||
| <tr><td><a href="#lazy-value-info">-lazy-value-info</a></td><td>Lazy Value Information Analysis</td></tr> | <tr><td><a href="#lazy-value-info">-lazy-value-info</a></td><td>Lazy Value Information Analysis</td></tr> | ||||||
| <tr><td><a href="#lda">-lda</a></td><td>Loop Dependence Analysis</td></tr> |  | ||||||
| <tr><td><a href="#libcall-aa">-libcall-aa</a></td><td>LibCall Alias Analysis</td></tr> | <tr><td><a href="#libcall-aa">-libcall-aa</a></td><td>LibCall Alias Analysis</td></tr> | ||||||
| <tr><td><a href="#lint">-lint</a></td><td>Statically lint-checks LLVM IR</td></tr> | <tr><td><a href="#lint">-lint</a></td><td>Statically lint-checks LLVM IR</td></tr> | ||||||
| <tr><td><a href="#loops">-loops</a></td><td>Natural Loop Information</td></tr> | <tr><td><a href="#loops">-loops</a></td><td>Natural Loop Information</td></tr> | ||||||
| @@ -249,6 +249,15 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print "  <p>\n" if ! | |||||||
|   </p> |   </p> | ||||||
| </div> | </div> | ||||||
|  |  | ||||||
|  | <!-------------------------------------------------------------------------- --> | ||||||
|  | <h3> | ||||||
|  |   <a name="da">-da: Dependence Analysis</a> | ||||||
|  | </h3> | ||||||
|  | <div> | ||||||
|  |   <p>Dependence analysis framework, which is used to detect dependences in | ||||||
|  |   memory accesses.</p> | ||||||
|  | </div> | ||||||
|  |  | ||||||
| <!-------------------------------------------------------------------------- --> | <!-------------------------------------------------------------------------- --> | ||||||
| <h3> | <h3> | ||||||
|   <a name="debug-aa">-debug-aa: AA use debugger</a> |   <a name="debug-aa">-debug-aa: AA use debugger</a> | ||||||
| @@ -431,15 +440,6 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print "  <p>\n" if ! | |||||||
|   <p>Interface for lazy computation of value constraint information.</p> |   <p>Interface for lazy computation of value constraint information.</p> | ||||||
| </div> | </div> | ||||||
|  |  | ||||||
| <!-------------------------------------------------------------------------- --> |  | ||||||
| <h3> |  | ||||||
|   <a name="lda">-lda: Loop Dependence Analysis</a> |  | ||||||
| </h3> |  | ||||||
| <div> |  | ||||||
|   <p>Loop dependence analysis framework, which is used to detect dependences in |  | ||||||
|   memory accesses in loops.</p> |  | ||||||
| </div> |  | ||||||
|  |  | ||||||
| <!-------------------------------------------------------------------------- --> | <!-------------------------------------------------------------------------- --> | ||||||
| <h3> | <h3> | ||||||
|   <a name="libcall-aa">-libcall-aa: LibCall Alias Analysis</a> |   <a name="libcall-aa">-libcall-aa: LibCall Alias Analysis</a> | ||||||
|   | |||||||
| @@ -1,124 +0,0 @@ | |||||||
| //===- llvm/Analysis/LoopDependenceAnalysis.h --------------- -*- C++ -*---===// |  | ||||||
| // |  | ||||||
| //                     The LLVM Compiler Infrastructure |  | ||||||
| // |  | ||||||
| // This file is distributed under the University of Illinois Open Source |  | ||||||
| // License. See LICENSE.TXT for details. |  | ||||||
| // |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
| // |  | ||||||
| // LoopDependenceAnalysis is an LLVM pass that analyses dependences in memory |  | ||||||
| // accesses in loops. |  | ||||||
| // |  | ||||||
| // Please note that this is work in progress and the interface is subject to |  | ||||||
| // change. |  | ||||||
| // |  | ||||||
| // TODO: adapt as interface progresses |  | ||||||
| // |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
|  |  | ||||||
| #ifndef LLVM_ANALYSIS_LOOP_DEPENDENCE_ANALYSIS_H |  | ||||||
| #define LLVM_ANALYSIS_LOOP_DEPENDENCE_ANALYSIS_H |  | ||||||
|  |  | ||||||
| #include "llvm/ADT/DenseSet.h" |  | ||||||
| #include "llvm/ADT/FoldingSet.h" |  | ||||||
| #include "llvm/ADT/SmallVector.h" |  | ||||||
| #include "llvm/Analysis/LoopPass.h" |  | ||||||
| #include "llvm/Support/Allocator.h" |  | ||||||
|  |  | ||||||
| namespace llvm { |  | ||||||
|  |  | ||||||
| class AliasAnalysis; |  | ||||||
| class AnalysisUsage; |  | ||||||
| class ScalarEvolution; |  | ||||||
| class SCEV; |  | ||||||
| class Value; |  | ||||||
| class raw_ostream; |  | ||||||
|  |  | ||||||
| class LoopDependenceAnalysis : public LoopPass { |  | ||||||
|   AliasAnalysis *AA; |  | ||||||
|   ScalarEvolution *SE; |  | ||||||
|  |  | ||||||
|   /// L - The loop we are currently analysing. |  | ||||||
|   Loop *L; |  | ||||||
|  |  | ||||||
|   /// TODO: doc |  | ||||||
|   enum DependenceResult { Independent = 0, Dependent = 1, Unknown = 2 }; |  | ||||||
|  |  | ||||||
|   /// TODO: doc |  | ||||||
|   struct Subscript { |  | ||||||
|     /// TODO: Add distance, direction, breaking conditions, ... |  | ||||||
|   }; |  | ||||||
|  |  | ||||||
|   /// DependencePair - Represents a data dependence relation between to memory |  | ||||||
|   /// reference instructions. |  | ||||||
|   struct DependencePair : public FastFoldingSetNode { |  | ||||||
|     Value *A; |  | ||||||
|     Value *B; |  | ||||||
|     DependenceResult Result; |  | ||||||
|     SmallVector<Subscript, 4> Subscripts; |  | ||||||
|  |  | ||||||
|     DependencePair(const FoldingSetNodeID &ID, Value *a, Value *b) : |  | ||||||
|         FastFoldingSetNode(ID), A(a), B(b), Result(Unknown), Subscripts() {} |  | ||||||
|   }; |  | ||||||
|  |  | ||||||
|   /// findOrInsertDependencePair - Return true if a DependencePair for the |  | ||||||
|   /// given Values already exists, false if a new DependencePair had to be |  | ||||||
|   /// created. The third argument is set to the pair found or created. |  | ||||||
|   bool findOrInsertDependencePair(Value*, Value*, DependencePair*&); |  | ||||||
|  |  | ||||||
|   /// getLoops - Collect all loops of the loop nest L in which |  | ||||||
|   /// a given SCEV is variant. |  | ||||||
|   void getLoops(const SCEV*, DenseSet<const Loop*>*) const; |  | ||||||
|  |  | ||||||
|   /// isLoopInvariant - True if a given SCEV is invariant in all loops of the |  | ||||||
|   /// loop nest starting at the innermost loop L. |  | ||||||
|   bool isLoopInvariant(const SCEV*) const; |  | ||||||
|  |  | ||||||
|   /// isAffine - An SCEV is affine with respect to the loop nest starting at |  | ||||||
|   /// the innermost loop L if it is of the form A+B*X where A, B are invariant |  | ||||||
|   /// in the loop nest and X is a induction variable in the loop nest. |  | ||||||
|   bool isAffine(const SCEV*) const; |  | ||||||
|  |  | ||||||
|   /// TODO: doc |  | ||||||
|   bool isZIVPair(const SCEV*, const SCEV*) const; |  | ||||||
|   bool isSIVPair(const SCEV*, const SCEV*) const; |  | ||||||
|   DependenceResult analyseZIV(const SCEV*, const SCEV*, Subscript*) const; |  | ||||||
|   DependenceResult analyseSIV(const SCEV*, const SCEV*, Subscript*) const; |  | ||||||
|   DependenceResult analyseMIV(const SCEV*, const SCEV*, Subscript*) const; |  | ||||||
|   DependenceResult analyseSubscript(const SCEV*, const SCEV*, Subscript*) const; |  | ||||||
|   DependenceResult analysePair(DependencePair*) const; |  | ||||||
|  |  | ||||||
| public: |  | ||||||
|   static char ID; // Class identification, replacement for typeinfo |  | ||||||
|   LoopDependenceAnalysis() : LoopPass(ID) { |  | ||||||
|     initializeLoopDependenceAnalysisPass(*PassRegistry::getPassRegistry()); |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   /// isDependencePair - Check whether two values can possibly give rise to |  | ||||||
|   /// a data dependence: that is the case if both are instructions accessing |  | ||||||
|   /// memory and at least one of those accesses is a write. |  | ||||||
|   bool isDependencePair(const Value*, const Value*) const; |  | ||||||
|  |  | ||||||
|   /// depends - Return a boolean indicating if there is a data dependence |  | ||||||
|   /// between two instructions. |  | ||||||
|   bool depends(Value*, Value*); |  | ||||||
|  |  | ||||||
|   bool runOnLoop(Loop*, LPPassManager&); |  | ||||||
|   virtual void releaseMemory(); |  | ||||||
|   virtual void getAnalysisUsage(AnalysisUsage&) const; |  | ||||||
|   void print(raw_ostream&, const Module* = 0) const; |  | ||||||
|  |  | ||||||
| private: |  | ||||||
|   FoldingSet<DependencePair> Pairs; |  | ||||||
|   BumpPtrAllocator PairAllocator; |  | ||||||
| }; // class LoopDependenceAnalysis |  | ||||||
|  |  | ||||||
| // createLoopDependenceAnalysisPass - This creates an instance of the |  | ||||||
| // LoopDependenceAnalysis pass. |  | ||||||
| // |  | ||||||
| LoopPass *createLoopDependenceAnalysisPass(); |  | ||||||
|  |  | ||||||
| } // namespace llvm |  | ||||||
|  |  | ||||||
| #endif /* LLVM_ANALYSIS_LOOP_DEPENDENCE_ANALYSIS_H */ |  | ||||||
| @@ -185,13 +185,6 @@ namespace llvm { | |||||||
|   // |   // | ||||||
|   FunctionPass *createDependenceAnalysisPass(); |   FunctionPass *createDependenceAnalysisPass(); | ||||||
|  |  | ||||||
|   //===--------------------------------------------------------------------===// |  | ||||||
|   // |  | ||||||
|   // createLoopDependenceAnalysisPass - This creates an instance of the |  | ||||||
|   // LoopDependenceAnalysis pass. |  | ||||||
|   // |  | ||||||
|   LoopPass *createLoopDependenceAnalysisPass(); |  | ||||||
|  |  | ||||||
|   //===--------------------------------------------------------------------===// |   //===--------------------------------------------------------------------===// | ||||||
|   // |   // | ||||||
|   // Minor pass prototypes, allowing us to expose them through bugpoint and |   // Minor pass prototypes, allowing us to expose them through bugpoint and | ||||||
|   | |||||||
| @@ -147,7 +147,6 @@ void initializeProfileMetadataLoaderPassPass(PassRegistry&); | |||||||
| void initializePathProfileLoaderPassPass(PassRegistry&); | void initializePathProfileLoaderPassPass(PassRegistry&); | ||||||
| void initializeLocalStackSlotPassPass(PassRegistry&); | void initializeLocalStackSlotPassPass(PassRegistry&); | ||||||
| void initializeLoopDeletionPass(PassRegistry&); | void initializeLoopDeletionPass(PassRegistry&); | ||||||
| void initializeLoopDependenceAnalysisPass(PassRegistry&); |  | ||||||
| void initializeLoopExtractorPass(PassRegistry&); | void initializeLoopExtractorPass(PassRegistry&); | ||||||
| void initializeLoopInfoPass(PassRegistry&); | void initializeLoopInfoPass(PassRegistry&); | ||||||
| void initializeLoopInstSimplifyPass(PassRegistry&); | void initializeLoopInstSimplifyPass(PassRegistry&); | ||||||
|   | |||||||
| @@ -86,7 +86,6 @@ namespace { | |||||||
|       (void) llvm::createLCSSAPass(); |       (void) llvm::createLCSSAPass(); | ||||||
|       (void) llvm::createLICMPass(); |       (void) llvm::createLICMPass(); | ||||||
|       (void) llvm::createLazyValueInfoPass(); |       (void) llvm::createLazyValueInfoPass(); | ||||||
|       (void) llvm::createLoopDependenceAnalysisPass(); |  | ||||||
|       (void) llvm::createLoopExtractorPass(); |       (void) llvm::createLoopExtractorPass(); | ||||||
|       (void) llvm::createLoopSimplifyPass(); |       (void) llvm::createLoopSimplifyPass(); | ||||||
|       (void) llvm::createLoopStrengthReducePass(); |       (void) llvm::createLoopStrengthReducePass(); | ||||||
|   | |||||||
| @@ -47,7 +47,6 @@ void llvm::initializeAnalysis(PassRegistry &Registry) { | |||||||
|   initializeLazyValueInfoPass(Registry); |   initializeLazyValueInfoPass(Registry); | ||||||
|   initializeLibCallAliasAnalysisPass(Registry); |   initializeLibCallAliasAnalysisPass(Registry); | ||||||
|   initializeLintPass(Registry); |   initializeLintPass(Registry); | ||||||
|   initializeLoopDependenceAnalysisPass(Registry); |  | ||||||
|   initializeLoopInfoPass(Registry); |   initializeLoopInfoPass(Registry); | ||||||
|   initializeMemDepPrinterPass(Registry); |   initializeMemDepPrinterPass(Registry); | ||||||
|   initializeMemoryDependenceAnalysisPass(Registry); |   initializeMemoryDependenceAnalysisPass(Registry); | ||||||
|   | |||||||
| @@ -27,7 +27,6 @@ add_llvm_library(LLVMAnalysis | |||||||
|   LibCallSemantics.cpp |   LibCallSemantics.cpp | ||||||
|   Lint.cpp |   Lint.cpp | ||||||
|   Loads.cpp |   Loads.cpp | ||||||
|   LoopDependenceAnalysis.cpp |  | ||||||
|   LoopInfo.cpp |   LoopInfo.cpp | ||||||
|   LoopPass.cpp |   LoopPass.cpp | ||||||
|   MemDepPrinter.cpp |   MemDepPrinter.cpp | ||||||
|   | |||||||
| @@ -1,362 +0,0 @@ | |||||||
| //===- LoopDependenceAnalysis.cpp - LDA Implementation ----------*- C++ -*-===// |  | ||||||
| // |  | ||||||
| //                     The LLVM Compiler Infrastructure |  | ||||||
| // |  | ||||||
| // This file is distributed under the University of Illinois Open Source |  | ||||||
| // License. See LICENSE.TXT for details. |  | ||||||
| // |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
| // |  | ||||||
| // This is the (beginning) of an implementation of a loop dependence analysis |  | ||||||
| // framework, which is used to detect dependences in memory accesses in loops. |  | ||||||
| // |  | ||||||
| // Please note that this is work in progress and the interface is subject to |  | ||||||
| // change. |  | ||||||
| // |  | ||||||
| // TODO: adapt as implementation progresses. |  | ||||||
| // |  | ||||||
| // TODO: document lingo (pair, subscript, index) |  | ||||||
| // |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
|  |  | ||||||
| #define DEBUG_TYPE "lda" |  | ||||||
| #include "llvm/ADT/DenseSet.h" |  | ||||||
| #include "llvm/ADT/Statistic.h" |  | ||||||
| #include "llvm/Analysis/AliasAnalysis.h" |  | ||||||
| #include "llvm/Analysis/LoopDependenceAnalysis.h" |  | ||||||
| #include "llvm/Analysis/LoopPass.h" |  | ||||||
| #include "llvm/Analysis/ScalarEvolution.h" |  | ||||||
| #include "llvm/Analysis/ScalarEvolutionExpressions.h" |  | ||||||
| #include "llvm/Analysis/ValueTracking.h" |  | ||||||
| #include "llvm/Assembly/Writer.h" |  | ||||||
| #include "llvm/Instructions.h" |  | ||||||
| #include "llvm/Operator.h" |  | ||||||
| #include "llvm/Support/Allocator.h" |  | ||||||
| #include "llvm/Support/Debug.h" |  | ||||||
| #include "llvm/Support/ErrorHandling.h" |  | ||||||
| #include "llvm/Support/raw_ostream.h" |  | ||||||
| #include "llvm/DataLayout.h" |  | ||||||
| using namespace llvm; |  | ||||||
|  |  | ||||||
| STATISTIC(NumAnswered,    "Number of dependence queries answered"); |  | ||||||
| STATISTIC(NumAnalysed,    "Number of distinct dependence pairs analysed"); |  | ||||||
| STATISTIC(NumDependent,   "Number of pairs with dependent accesses"); |  | ||||||
| STATISTIC(NumIndependent, "Number of pairs with independent accesses"); |  | ||||||
| STATISTIC(NumUnknown,     "Number of pairs with unknown accesses"); |  | ||||||
|  |  | ||||||
| LoopPass *llvm::createLoopDependenceAnalysisPass() { |  | ||||||
|   return new LoopDependenceAnalysis(); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| INITIALIZE_PASS_BEGIN(LoopDependenceAnalysis, "lda", |  | ||||||
|                 "Loop Dependence Analysis", false, true) |  | ||||||
| INITIALIZE_PASS_DEPENDENCY(ScalarEvolution) |  | ||||||
| INITIALIZE_AG_DEPENDENCY(AliasAnalysis) |  | ||||||
| INITIALIZE_PASS_END(LoopDependenceAnalysis, "lda", |  | ||||||
|                 "Loop Dependence Analysis", false, true) |  | ||||||
| char LoopDependenceAnalysis::ID = 0; |  | ||||||
|  |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
| //                             Utility Functions |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
|  |  | ||||||
| static inline bool IsMemRefInstr(const Value *V) { |  | ||||||
|   const Instruction *I = dyn_cast<const Instruction>(V); |  | ||||||
|   return I && (I->mayReadFromMemory() || I->mayWriteToMemory()); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| static void GetMemRefInstrs(const Loop *L, |  | ||||||
|                             SmallVectorImpl<Instruction*> &Memrefs) { |  | ||||||
|   for (Loop::block_iterator b = L->block_begin(), be = L->block_end(); |  | ||||||
|        b != be; ++b) |  | ||||||
|     for (BasicBlock::iterator i = (*b)->begin(), ie = (*b)->end(); |  | ||||||
|          i != ie; ++i) |  | ||||||
|       if (IsMemRefInstr(i)) |  | ||||||
|         Memrefs.push_back(i); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| static bool IsLoadOrStoreInst(Value *I) { |  | ||||||
|   // Returns true if the load or store can be analyzed. Atomic and volatile |  | ||||||
|   // operations have properties which this analysis does not understand. |  | ||||||
|   if (LoadInst *LI = dyn_cast<LoadInst>(I)) |  | ||||||
|     return LI->isUnordered(); |  | ||||||
|   else if (StoreInst *SI = dyn_cast<StoreInst>(I)) |  | ||||||
|     return SI->isUnordered(); |  | ||||||
|   return false; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| static Value *GetPointerOperand(Value *I) { |  | ||||||
|   if (LoadInst *i = dyn_cast<LoadInst>(I)) |  | ||||||
|     return i->getPointerOperand(); |  | ||||||
|   if (StoreInst *i = dyn_cast<StoreInst>(I)) |  | ||||||
|     return i->getPointerOperand(); |  | ||||||
|   llvm_unreachable("Value is no load or store instruction!"); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| static AliasAnalysis::AliasResult UnderlyingObjectsAlias(AliasAnalysis *AA, |  | ||||||
|                                                          const Value *A, |  | ||||||
|                                                          const Value *B) { |  | ||||||
|   const Value *aObj = GetUnderlyingObject(A); |  | ||||||
|   const Value *bObj = GetUnderlyingObject(B); |  | ||||||
|   return AA->alias(aObj, AA->getTypeStoreSize(aObj->getType()), |  | ||||||
|                    bObj, AA->getTypeStoreSize(bObj->getType())); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| static inline const SCEV *GetZeroSCEV(ScalarEvolution *SE) { |  | ||||||
|   return SE->getConstant(Type::getInt32Ty(SE->getContext()), 0L); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
| //                             Dependence Testing |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::isDependencePair(const Value *A, |  | ||||||
|                                               const Value *B) const { |  | ||||||
|   return IsMemRefInstr(A) && |  | ||||||
|          IsMemRefInstr(B) && |  | ||||||
|          (cast<const Instruction>(A)->mayWriteToMemory() || |  | ||||||
|           cast<const Instruction>(B)->mayWriteToMemory()); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::findOrInsertDependencePair(Value *A, |  | ||||||
|                                                         Value *B, |  | ||||||
|                                                         DependencePair *&P) { |  | ||||||
|   void *insertPos = 0; |  | ||||||
|   FoldingSetNodeID id; |  | ||||||
|   id.AddPointer(A); |  | ||||||
|   id.AddPointer(B); |  | ||||||
|  |  | ||||||
|   P = Pairs.FindNodeOrInsertPos(id, insertPos); |  | ||||||
|   if (P) return true; |  | ||||||
|  |  | ||||||
|   P = new (PairAllocator) DependencePair(id, A, B); |  | ||||||
|   Pairs.InsertNode(P, insertPos); |  | ||||||
|   return false; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| void LoopDependenceAnalysis::getLoops(const SCEV *S, |  | ||||||
|                                       DenseSet<const Loop*>* Loops) const { |  | ||||||
|   // Refactor this into an SCEVVisitor, if efficiency becomes a concern. |  | ||||||
|   for (const Loop *L = this->L; L != 0; L = L->getParentLoop()) |  | ||||||
|     if (!SE->isLoopInvariant(S, L)) |  | ||||||
|       Loops->insert(L); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::isLoopInvariant(const SCEV *S) const { |  | ||||||
|   DenseSet<const Loop*> loops; |  | ||||||
|   getLoops(S, &loops); |  | ||||||
|   return loops.empty(); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::isAffine(const SCEV *S) const { |  | ||||||
|   const SCEVAddRecExpr *rec = dyn_cast<SCEVAddRecExpr>(S); |  | ||||||
|   return isLoopInvariant(S) || (rec && rec->isAffine()); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::isZIVPair(const SCEV *A, const SCEV *B) const { |  | ||||||
|   return isLoopInvariant(A) && isLoopInvariant(B); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::isSIVPair(const SCEV *A, const SCEV *B) const { |  | ||||||
|   DenseSet<const Loop*> loops; |  | ||||||
|   getLoops(A, &loops); |  | ||||||
|   getLoops(B, &loops); |  | ||||||
|   return loops.size() == 1; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| LoopDependenceAnalysis::DependenceResult |  | ||||||
| LoopDependenceAnalysis::analyseZIV(const SCEV *A, |  | ||||||
|                                    const SCEV *B, |  | ||||||
|                                    Subscript *S) const { |  | ||||||
|   assert(isZIVPair(A, B) && "Attempted to ZIV-test non-ZIV SCEVs!"); |  | ||||||
|   return A == B ? Dependent : Independent; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| LoopDependenceAnalysis::DependenceResult |  | ||||||
| LoopDependenceAnalysis::analyseSIV(const SCEV *A, |  | ||||||
|                                    const SCEV *B, |  | ||||||
|                                    Subscript *S) const { |  | ||||||
|   return Unknown; // TODO: Implement. |  | ||||||
| } |  | ||||||
|  |  | ||||||
| LoopDependenceAnalysis::DependenceResult |  | ||||||
| LoopDependenceAnalysis::analyseMIV(const SCEV *A, |  | ||||||
|                                    const SCEV *B, |  | ||||||
|                                    Subscript *S) const { |  | ||||||
|   return Unknown; // TODO: Implement. |  | ||||||
| } |  | ||||||
|  |  | ||||||
| LoopDependenceAnalysis::DependenceResult |  | ||||||
| LoopDependenceAnalysis::analyseSubscript(const SCEV *A, |  | ||||||
|                                          const SCEV *B, |  | ||||||
|                                          Subscript *S) const { |  | ||||||
|   DEBUG(dbgs() << "  Testing subscript: " << *A << ", " << *B << "\n"); |  | ||||||
|  |  | ||||||
|   if (A == B) { |  | ||||||
|     DEBUG(dbgs() << "  -> [D] same SCEV\n"); |  | ||||||
|     return Dependent; |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   if (!isAffine(A) || !isAffine(B)) { |  | ||||||
|     DEBUG(dbgs() << "  -> [?] not affine\n"); |  | ||||||
|     return Unknown; |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   if (isZIVPair(A, B)) |  | ||||||
|     return analyseZIV(A, B, S); |  | ||||||
|  |  | ||||||
|   if (isSIVPair(A, B)) |  | ||||||
|     return analyseSIV(A, B, S); |  | ||||||
|  |  | ||||||
|   return analyseMIV(A, B, S); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| LoopDependenceAnalysis::DependenceResult |  | ||||||
| LoopDependenceAnalysis::analysePair(DependencePair *P) const { |  | ||||||
|   DEBUG(dbgs() << "Analysing:\n" << *P->A << "\n" << *P->B << "\n"); |  | ||||||
|  |  | ||||||
|   // We only analyse loads and stores but no possible memory accesses by e.g. |  | ||||||
|   // free, call, or invoke instructions. |  | ||||||
|   if (!IsLoadOrStoreInst(P->A) || !IsLoadOrStoreInst(P->B)) { |  | ||||||
|     DEBUG(dbgs() << "--> [?] no load/store\n"); |  | ||||||
|     return Unknown; |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   Value *aPtr = GetPointerOperand(P->A); |  | ||||||
|   Value *bPtr = GetPointerOperand(P->B); |  | ||||||
|  |  | ||||||
|   switch (UnderlyingObjectsAlias(AA, aPtr, bPtr)) { |  | ||||||
|   case AliasAnalysis::MayAlias: |  | ||||||
|   case AliasAnalysis::PartialAlias: |  | ||||||
|     // We can not analyse objects if we do not know about their aliasing. |  | ||||||
|     DEBUG(dbgs() << "---> [?] may alias\n"); |  | ||||||
|     return Unknown; |  | ||||||
|  |  | ||||||
|   case AliasAnalysis::NoAlias: |  | ||||||
|     // If the objects noalias, they are distinct, accesses are independent. |  | ||||||
|     DEBUG(dbgs() << "---> [I] no alias\n"); |  | ||||||
|     return Independent; |  | ||||||
|  |  | ||||||
|   case AliasAnalysis::MustAlias: |  | ||||||
|     break; // The underlying objects alias, test accesses for dependence. |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   const GEPOperator *aGEP = dyn_cast<GEPOperator>(aPtr); |  | ||||||
|   const GEPOperator *bGEP = dyn_cast<GEPOperator>(bPtr); |  | ||||||
|  |  | ||||||
|   if (!aGEP || !bGEP) |  | ||||||
|     return Unknown; |  | ||||||
|  |  | ||||||
|   // FIXME: Is filtering coupled subscripts necessary? |  | ||||||
|  |  | ||||||
|   // Collect GEP operand pairs (FIXME: use GetGEPOperands from BasicAA), adding |  | ||||||
|   // trailing zeroes to the smaller GEP, if needed. |  | ||||||
|   typedef SmallVector<std::pair<const SCEV*, const SCEV*>, 4> GEPOpdPairsTy; |  | ||||||
|   GEPOpdPairsTy opds; |  | ||||||
|   for(GEPOperator::const_op_iterator aIdx = aGEP->idx_begin(), |  | ||||||
|                                      aEnd = aGEP->idx_end(), |  | ||||||
|                                      bIdx = bGEP->idx_begin(), |  | ||||||
|                                      bEnd = bGEP->idx_end(); |  | ||||||
|       aIdx != aEnd && bIdx != bEnd; |  | ||||||
|       aIdx += (aIdx != aEnd), bIdx += (bIdx != bEnd)) { |  | ||||||
|     const SCEV* aSCEV = (aIdx != aEnd) ? SE->getSCEV(*aIdx) : GetZeroSCEV(SE); |  | ||||||
|     const SCEV* bSCEV = (bIdx != bEnd) ? SE->getSCEV(*bIdx) : GetZeroSCEV(SE); |  | ||||||
|     opds.push_back(std::make_pair(aSCEV, bSCEV)); |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   if (!opds.empty() && opds[0].first != opds[0].second) { |  | ||||||
|     // We cannot (yet) handle arbitrary GEP pointer offsets. By limiting |  | ||||||
|     // |  | ||||||
|     // TODO: this could be relaxed by adding the size of the underlying object |  | ||||||
|     // to the first subscript. If we have e.g. (GEP x,0,i; GEP x,2,-i) and we |  | ||||||
|     // know that x is a [100 x i8]*, we could modify the first subscript to be |  | ||||||
|     // (i, 200-i) instead of (i, -i). |  | ||||||
|     return Unknown; |  | ||||||
|   } |  | ||||||
|  |  | ||||||
|   // Now analyse the collected operand pairs (skipping the GEP ptr offsets). |  | ||||||
|   for (GEPOpdPairsTy::const_iterator i = opds.begin() + 1, end = opds.end(); |  | ||||||
|        i != end; ++i) { |  | ||||||
|     Subscript subscript; |  | ||||||
|     DependenceResult result = analyseSubscript(i->first, i->second, &subscript); |  | ||||||
|     if (result != Dependent) { |  | ||||||
|       // We either proved independence or failed to analyse this subscript. |  | ||||||
|       // Further subscripts will not improve the situation, so abort early. |  | ||||||
|       return result; |  | ||||||
|     } |  | ||||||
|     P->Subscripts.push_back(subscript); |  | ||||||
|   } |  | ||||||
|   // We successfully analysed all subscripts but failed to prove independence. |  | ||||||
|   return Dependent; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::depends(Value *A, Value *B) { |  | ||||||
|   assert(isDependencePair(A, B) && "Values form no dependence pair!"); |  | ||||||
|   ++NumAnswered; |  | ||||||
|  |  | ||||||
|   DependencePair *p; |  | ||||||
|   if (!findOrInsertDependencePair(A, B, p)) { |  | ||||||
|     // The pair is not cached, so analyse it. |  | ||||||
|     ++NumAnalysed; |  | ||||||
|     switch (p->Result = analysePair(p)) { |  | ||||||
|     case Dependent:   ++NumDependent;   break; |  | ||||||
|     case Independent: ++NumIndependent; break; |  | ||||||
|     case Unknown:     ++NumUnknown;     break; |  | ||||||
|     } |  | ||||||
|   } |  | ||||||
|   return p->Result != Independent; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
| //                   LoopDependenceAnalysis Implementation |  | ||||||
| //===----------------------------------------------------------------------===// |  | ||||||
|  |  | ||||||
| bool LoopDependenceAnalysis::runOnLoop(Loop *L, LPPassManager &) { |  | ||||||
|   this->L = L; |  | ||||||
|   AA = &getAnalysis<AliasAnalysis>(); |  | ||||||
|   SE = &getAnalysis<ScalarEvolution>(); |  | ||||||
|   return false; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| void LoopDependenceAnalysis::releaseMemory() { |  | ||||||
|   Pairs.clear(); |  | ||||||
|   PairAllocator.Reset(); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| void LoopDependenceAnalysis::getAnalysisUsage(AnalysisUsage &AU) const { |  | ||||||
|   AU.setPreservesAll(); |  | ||||||
|   AU.addRequiredTransitive<AliasAnalysis>(); |  | ||||||
|   AU.addRequiredTransitive<ScalarEvolution>(); |  | ||||||
| } |  | ||||||
|  |  | ||||||
| static void PrintLoopInfo(raw_ostream &OS, |  | ||||||
|                           LoopDependenceAnalysis *LDA, const Loop *L) { |  | ||||||
|   if (!L->empty()) return; // ignore non-innermost loops |  | ||||||
|  |  | ||||||
|   SmallVector<Instruction*, 8> memrefs; |  | ||||||
|   GetMemRefInstrs(L, memrefs); |  | ||||||
|  |  | ||||||
|   OS << "Loop at depth " << L->getLoopDepth() << ", header block: "; |  | ||||||
|   WriteAsOperand(OS, L->getHeader(), false); |  | ||||||
|   OS << "\n"; |  | ||||||
|  |  | ||||||
|   OS << "  Load/store instructions: " << memrefs.size() << "\n"; |  | ||||||
|   for (SmallVector<Instruction*, 8>::const_iterator x = memrefs.begin(), |  | ||||||
|        end = memrefs.end(); x != end; ++x) |  | ||||||
|     OS << "\t" << (x - memrefs.begin()) << ": " << **x << "\n"; |  | ||||||
|  |  | ||||||
|   OS << "  Pairwise dependence results:\n"; |  | ||||||
|   for (SmallVector<Instruction*, 8>::const_iterator x = memrefs.begin(), |  | ||||||
|        end = memrefs.end(); x != end; ++x) |  | ||||||
|     for (SmallVector<Instruction*, 8>::const_iterator y = x + 1; |  | ||||||
|          y != end; ++y) |  | ||||||
|       if (LDA->isDependencePair(*x, *y)) |  | ||||||
|         OS << "\t" << (x - memrefs.begin()) << "," << (y - memrefs.begin()) |  | ||||||
|            << ": " << (LDA->depends(*x, *y) ? "dependent" : "independent") |  | ||||||
|            << "\n"; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| void LoopDependenceAnalysis::print(raw_ostream &OS, const Module*) const { |  | ||||||
|   // TODO: doc why const_cast is safe |  | ||||||
|   PrintLoopInfo(OS, const_cast<LoopDependenceAnalysis*>(this), this->L); |  | ||||||
| } |  | ||||||
| @@ -1,44 +0,0 @@ | |||||||
| ; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s |  | ||||||
|  |  | ||||||
| ;; x[5] = x[6] // with x being a pointer passed as argument |  | ||||||
|  |  | ||||||
| define void @f1(i32* nocapture %xptr) nounwind { |  | ||||||
| entry: |  | ||||||
|   %x.ld.addr = getelementptr i32* %xptr, i64 6 |  | ||||||
|   %x.st.addr = getelementptr i32* %xptr, i64 5 |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x = load i32* %x.ld.addr |  | ||||||
|   store i32 %x, i32* %x.st.addr |  | ||||||
| ; CHECK: 0,1: dep |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; x[5] = x[6] // with x being an array on the stack |  | ||||||
|  |  | ||||||
| define void @foo(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   %xptr = alloca [256 x i32], align 4 |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* %xptr, i64 0, i64 6 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* %xptr, i64 0, i64 5 |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x = load i32* %x.ld.addr |  | ||||||
|   store i32 %x, i32* %x.st.addr |  | ||||||
| ; CHECK: 0,1: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
| @@ -1 +0,0 @@ | |||||||
| config.suffixes = ['.ll', '.c', '.cpp'] |  | ||||||
| @@ -1,110 +0,0 @@ | |||||||
| ; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s |  | ||||||
|  |  | ||||||
| @x = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
| @y = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 256; i++) |  | ||||||
| ;;   x[i] = x[i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f1(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %y.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %x = load i32* %x.addr      ; 0 |  | ||||||
|   %y = load i32* %y.addr      ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.addr  ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 256; i++) |  | ||||||
| ;;   x[i+1] = x[i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f2(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.next |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 10; i++) |  | ||||||
| ;;   x[i+20] = x[i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f3(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %i.20 = add i64 %i, 20 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.20 |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 10 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 10; i++) |  | ||||||
| ;;   x[10*i+1] = x[10*i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f4(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %i.10 = mul i64 %i, 10 |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i.10 |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.10 |  | ||||||
|   %i.10.1 = add i64 %i.10, 1 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.10.1 |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 10 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
| @@ -1,118 +0,0 @@ | |||||||
| ; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s |  | ||||||
|  |  | ||||||
| @x = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
| @y = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 256; i++) |  | ||||||
| ;;   x[i] = x[255 - i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f1(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %i.255 = sub i64 255, %i |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.255 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 100; i++) |  | ||||||
| ;;   x[i] = x[255 - i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f2(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %i.255 = sub i64 255, %i |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.255 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 100 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; // the first iteration (i=0) leads to an out-of-bounds access of x. as the |  | ||||||
| ;; // result of this access is undefined, _any_ dependence result is safe. |  | ||||||
| ;; for (i = 0; i < 256; i++) |  | ||||||
| ;;   x[i] = x[256 - i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f3(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %i.256 = sub i64 0, %i |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 1, i64 %i.256 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; // slightly contrived but valid IR for the following loop, where all |  | ||||||
| ;; // accesses in all iterations are within bounds. while this example's first |  | ||||||
| ;; // (ZIV-)subscript is (0, 1), accesses are dependent. |  | ||||||
| ;; for (i = 1; i < 256; i++) |  | ||||||
| ;;   x[i] = x[256 - i] + y[i] |  | ||||||
|  |  | ||||||
| define void @f4(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %i.1 = add i64 1, %i |  | ||||||
|   %i.256 = sub i64 -1, %i |  | ||||||
|   %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i.1 |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 1, i64 %i.256 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.1 |  | ||||||
|   %x = load i32* %x.ld.addr     ; 0 |  | ||||||
|   %y = load i32* %y.ld.addr     ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.st.addr ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
| @@ -1,56 +0,0 @@ | |||||||
| ; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s |  | ||||||
|  |  | ||||||
| @x = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
| @y = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 256; i++) |  | ||||||
| ;;   x[i] = x[42] + y[i] |  | ||||||
|  |  | ||||||
| define void @f1(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 42 |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %y.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x = load i32* %x.ld.addr   ; 0 |  | ||||||
|   %y = load i32* %y.addr      ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.addr  ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; for (i = 0; i < 250; i++) |  | ||||||
| ;;   x[i] = x[255] + y[i] |  | ||||||
|  |  | ||||||
| define void @f2(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 255 |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i |  | ||||||
|   %y.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i |  | ||||||
|   %x = load i32* %x.ld.addr   ; 0 |  | ||||||
|   %y = load i32* %y.addr      ; 1 |  | ||||||
|   %r = add i32 %y, %x |  | ||||||
|   store i32 %r, i32* %x.addr  ; 2 |  | ||||||
| ; CHECK: 0,2: dep |  | ||||||
| ; CHECK: 1,2: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 250 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
| @@ -1,63 +0,0 @@ | |||||||
| ; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s |  | ||||||
|  |  | ||||||
| @x = common global [256 x i32] zeroinitializer, align 4 |  | ||||||
|  |  | ||||||
| ;; x[5] = x[6] |  | ||||||
|  |  | ||||||
| define void @f1(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x = load i32* getelementptr ([256 x i32]* @x, i32 0, i64 6) |  | ||||||
|   store i32 %x, i32* getelementptr ([256 x i32]* @x, i32 0, i64 5) |  | ||||||
| ; CHECK: 0,1: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; x[c] = x[c+1] // with c being a loop-invariant constant |  | ||||||
|  |  | ||||||
| define void @f2(i64 %c0) nounwind { |  | ||||||
| entry: |  | ||||||
|   %c1 = add i64 %c0, 1 |  | ||||||
|   %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %c0 |  | ||||||
|   %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %c1 |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x = load i32* %x.ld.addr |  | ||||||
|   store i32 %x, i32* %x.st.addr |  | ||||||
| ; CHECK: 0,1: ind |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
|  |  | ||||||
| ;; x[6] = x[6] |  | ||||||
|  |  | ||||||
| define void @f3(...) nounwind { |  | ||||||
| entry: |  | ||||||
|   br label %for.body |  | ||||||
|  |  | ||||||
| for.body: |  | ||||||
|   %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ] |  | ||||||
|   %x = load i32* getelementptr ([256 x i32]* @x, i32 0, i64 6) |  | ||||||
|   store i32 %x, i32* getelementptr ([256 x i32]* @x, i32 0, i64 6) |  | ||||||
| ; CHECK: 0,1: dep |  | ||||||
|   %i.next = add i64 %i, 1 |  | ||||||
|   %exitcond = icmp eq i64 %i.next, 256 |  | ||||||
|   br i1 %exitcond, label %for.end, label %for.body |  | ||||||
|  |  | ||||||
| for.end: |  | ||||||
|   ret void |  | ||||||
| } |  | ||||||
		Reference in New Issue
	
	Block a user