forked from OSchip/llvm-project
Remove LoopDependenceAnalysis.
It was unmaintained and not much more than a stub. The new DependenceAnalysis pass is both more general and complete. llvm-svn: 166810
This commit is contained in:
parent
2d26c29e0c
commit
6dc1e2f287
|
@ -77,6 +77,7 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print " <p>\n" if !
|
||||||
<tr><td><a href="#basicaa">-basicaa</a></td><td>Basic Alias Analysis (stateless AA impl)</td></tr>
|
<tr><td><a href="#basicaa">-basicaa</a></td><td>Basic Alias Analysis (stateless AA impl)</td></tr>
|
||||||
<tr><td><a href="#basiccg">-basiccg</a></td><td>Basic CallGraph Construction</td></tr>
|
<tr><td><a href="#basiccg">-basiccg</a></td><td>Basic CallGraph Construction</td></tr>
|
||||||
<tr><td><a href="#count-aa">-count-aa</a></td><td>Count Alias Analysis Query Responses</td></tr>
|
<tr><td><a href="#count-aa">-count-aa</a></td><td>Count Alias Analysis Query Responses</td></tr>
|
||||||
|
<tr><td><a href="#da">-da</a></td><td>Dependence Analysis</td></tr>
|
||||||
<tr><td><a href="#debug-aa">-debug-aa</a></td><td>AA use debugger</td></tr>
|
<tr><td><a href="#debug-aa">-debug-aa</a></td><td>AA use debugger</td></tr>
|
||||||
<tr><td><a href="#domfrontier">-domfrontier</a></td><td>Dominance Frontier Construction</td></tr>
|
<tr><td><a href="#domfrontier">-domfrontier</a></td><td>Dominance Frontier Construction</td></tr>
|
||||||
<tr><td><a href="#domtree">-domtree</a></td><td>Dominator Tree Construction</td></tr>
|
<tr><td><a href="#domtree">-domtree</a></td><td>Dominator Tree Construction</td></tr>
|
||||||
|
@ -92,7 +93,6 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print " <p>\n" if !
|
||||||
<tr><td><a href="#intervals">-intervals</a></td><td>Interval Partition Construction</td></tr>
|
<tr><td><a href="#intervals">-intervals</a></td><td>Interval Partition Construction</td></tr>
|
||||||
<tr><td><a href="#iv-users">-iv-users</a></td><td>Induction Variable Users</td></tr>
|
<tr><td><a href="#iv-users">-iv-users</a></td><td>Induction Variable Users</td></tr>
|
||||||
<tr><td><a href="#lazy-value-info">-lazy-value-info</a></td><td>Lazy Value Information Analysis</td></tr>
|
<tr><td><a href="#lazy-value-info">-lazy-value-info</a></td><td>Lazy Value Information Analysis</td></tr>
|
||||||
<tr><td><a href="#lda">-lda</a></td><td>Loop Dependence Analysis</td></tr>
|
|
||||||
<tr><td><a href="#libcall-aa">-libcall-aa</a></td><td>LibCall Alias Analysis</td></tr>
|
<tr><td><a href="#libcall-aa">-libcall-aa</a></td><td>LibCall Alias Analysis</td></tr>
|
||||||
<tr><td><a href="#lint">-lint</a></td><td>Statically lint-checks LLVM IR</td></tr>
|
<tr><td><a href="#lint">-lint</a></td><td>Statically lint-checks LLVM IR</td></tr>
|
||||||
<tr><td><a href="#loops">-loops</a></td><td>Natural Loop Information</td></tr>
|
<tr><td><a href="#loops">-loops</a></td><td>Natural Loop Information</td></tr>
|
||||||
|
@ -249,6 +249,15 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print " <p>\n" if !
|
||||||
</p>
|
</p>
|
||||||
</div>
|
</div>
|
||||||
|
|
||||||
|
<!-------------------------------------------------------------------------- -->
|
||||||
|
<h3>
|
||||||
|
<a name="da">-da: Dependence Analysis</a>
|
||||||
|
</h3>
|
||||||
|
<div>
|
||||||
|
<p>Dependence analysis framework, which is used to detect dependences in
|
||||||
|
memory accesses.</p>
|
||||||
|
</div>
|
||||||
|
|
||||||
<!-------------------------------------------------------------------------- -->
|
<!-------------------------------------------------------------------------- -->
|
||||||
<h3>
|
<h3>
|
||||||
<a name="debug-aa">-debug-aa: AA use debugger</a>
|
<a name="debug-aa">-debug-aa: AA use debugger</a>
|
||||||
|
@ -431,15 +440,6 @@ perl -e '$/ = undef; for (split(/\n/, <>)) { s:^ *///? ?::; print " <p>\n" if !
|
||||||
<p>Interface for lazy computation of value constraint information.</p>
|
<p>Interface for lazy computation of value constraint information.</p>
|
||||||
</div>
|
</div>
|
||||||
|
|
||||||
<!-------------------------------------------------------------------------- -->
|
|
||||||
<h3>
|
|
||||||
<a name="lda">-lda: Loop Dependence Analysis</a>
|
|
||||||
</h3>
|
|
||||||
<div>
|
|
||||||
<p>Loop dependence analysis framework, which is used to detect dependences in
|
|
||||||
memory accesses in loops.</p>
|
|
||||||
</div>
|
|
||||||
|
|
||||||
<!-------------------------------------------------------------------------- -->
|
<!-------------------------------------------------------------------------- -->
|
||||||
<h3>
|
<h3>
|
||||||
<a name="libcall-aa">-libcall-aa: LibCall Alias Analysis</a>
|
<a name="libcall-aa">-libcall-aa: LibCall Alias Analysis</a>
|
||||||
|
|
|
@ -1,124 +0,0 @@
|
||||||
//===- llvm/Analysis/LoopDependenceAnalysis.h --------------- -*- C++ -*---===//
|
|
||||||
//
|
|
||||||
// The LLVM Compiler Infrastructure
|
|
||||||
//
|
|
||||||
// This file is distributed under the University of Illinois Open Source
|
|
||||||
// License. See LICENSE.TXT for details.
|
|
||||||
//
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
//
|
|
||||||
// LoopDependenceAnalysis is an LLVM pass that analyses dependences in memory
|
|
||||||
// accesses in loops.
|
|
||||||
//
|
|
||||||
// Please note that this is work in progress and the interface is subject to
|
|
||||||
// change.
|
|
||||||
//
|
|
||||||
// TODO: adapt as interface progresses
|
|
||||||
//
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
|
|
||||||
#ifndef LLVM_ANALYSIS_LOOP_DEPENDENCE_ANALYSIS_H
|
|
||||||
#define LLVM_ANALYSIS_LOOP_DEPENDENCE_ANALYSIS_H
|
|
||||||
|
|
||||||
#include "llvm/ADT/DenseSet.h"
|
|
||||||
#include "llvm/ADT/FoldingSet.h"
|
|
||||||
#include "llvm/ADT/SmallVector.h"
|
|
||||||
#include "llvm/Analysis/LoopPass.h"
|
|
||||||
#include "llvm/Support/Allocator.h"
|
|
||||||
|
|
||||||
namespace llvm {
|
|
||||||
|
|
||||||
class AliasAnalysis;
|
|
||||||
class AnalysisUsage;
|
|
||||||
class ScalarEvolution;
|
|
||||||
class SCEV;
|
|
||||||
class Value;
|
|
||||||
class raw_ostream;
|
|
||||||
|
|
||||||
class LoopDependenceAnalysis : public LoopPass {
|
|
||||||
AliasAnalysis *AA;
|
|
||||||
ScalarEvolution *SE;
|
|
||||||
|
|
||||||
/// L - The loop we are currently analysing.
|
|
||||||
Loop *L;
|
|
||||||
|
|
||||||
/// TODO: doc
|
|
||||||
enum DependenceResult { Independent = 0, Dependent = 1, Unknown = 2 };
|
|
||||||
|
|
||||||
/// TODO: doc
|
|
||||||
struct Subscript {
|
|
||||||
/// TODO: Add distance, direction, breaking conditions, ...
|
|
||||||
};
|
|
||||||
|
|
||||||
/// DependencePair - Represents a data dependence relation between to memory
|
|
||||||
/// reference instructions.
|
|
||||||
struct DependencePair : public FastFoldingSetNode {
|
|
||||||
Value *A;
|
|
||||||
Value *B;
|
|
||||||
DependenceResult Result;
|
|
||||||
SmallVector<Subscript, 4> Subscripts;
|
|
||||||
|
|
||||||
DependencePair(const FoldingSetNodeID &ID, Value *a, Value *b) :
|
|
||||||
FastFoldingSetNode(ID), A(a), B(b), Result(Unknown), Subscripts() {}
|
|
||||||
};
|
|
||||||
|
|
||||||
/// findOrInsertDependencePair - Return true if a DependencePair for the
|
|
||||||
/// given Values already exists, false if a new DependencePair had to be
|
|
||||||
/// created. The third argument is set to the pair found or created.
|
|
||||||
bool findOrInsertDependencePair(Value*, Value*, DependencePair*&);
|
|
||||||
|
|
||||||
/// getLoops - Collect all loops of the loop nest L in which
|
|
||||||
/// a given SCEV is variant.
|
|
||||||
void getLoops(const SCEV*, DenseSet<const Loop*>*) const;
|
|
||||||
|
|
||||||
/// isLoopInvariant - True if a given SCEV is invariant in all loops of the
|
|
||||||
/// loop nest starting at the innermost loop L.
|
|
||||||
bool isLoopInvariant(const SCEV*) const;
|
|
||||||
|
|
||||||
/// isAffine - An SCEV is affine with respect to the loop nest starting at
|
|
||||||
/// the innermost loop L if it is of the form A+B*X where A, B are invariant
|
|
||||||
/// in the loop nest and X is a induction variable in the loop nest.
|
|
||||||
bool isAffine(const SCEV*) const;
|
|
||||||
|
|
||||||
/// TODO: doc
|
|
||||||
bool isZIVPair(const SCEV*, const SCEV*) const;
|
|
||||||
bool isSIVPair(const SCEV*, const SCEV*) const;
|
|
||||||
DependenceResult analyseZIV(const SCEV*, const SCEV*, Subscript*) const;
|
|
||||||
DependenceResult analyseSIV(const SCEV*, const SCEV*, Subscript*) const;
|
|
||||||
DependenceResult analyseMIV(const SCEV*, const SCEV*, Subscript*) const;
|
|
||||||
DependenceResult analyseSubscript(const SCEV*, const SCEV*, Subscript*) const;
|
|
||||||
DependenceResult analysePair(DependencePair*) const;
|
|
||||||
|
|
||||||
public:
|
|
||||||
static char ID; // Class identification, replacement for typeinfo
|
|
||||||
LoopDependenceAnalysis() : LoopPass(ID) {
|
|
||||||
initializeLoopDependenceAnalysisPass(*PassRegistry::getPassRegistry());
|
|
||||||
}
|
|
||||||
|
|
||||||
/// isDependencePair - Check whether two values can possibly give rise to
|
|
||||||
/// a data dependence: that is the case if both are instructions accessing
|
|
||||||
/// memory and at least one of those accesses is a write.
|
|
||||||
bool isDependencePair(const Value*, const Value*) const;
|
|
||||||
|
|
||||||
/// depends - Return a boolean indicating if there is a data dependence
|
|
||||||
/// between two instructions.
|
|
||||||
bool depends(Value*, Value*);
|
|
||||||
|
|
||||||
bool runOnLoop(Loop*, LPPassManager&);
|
|
||||||
virtual void releaseMemory();
|
|
||||||
virtual void getAnalysisUsage(AnalysisUsage&) const;
|
|
||||||
void print(raw_ostream&, const Module* = 0) const;
|
|
||||||
|
|
||||||
private:
|
|
||||||
FoldingSet<DependencePair> Pairs;
|
|
||||||
BumpPtrAllocator PairAllocator;
|
|
||||||
}; // class LoopDependenceAnalysis
|
|
||||||
|
|
||||||
// createLoopDependenceAnalysisPass - This creates an instance of the
|
|
||||||
// LoopDependenceAnalysis pass.
|
|
||||||
//
|
|
||||||
LoopPass *createLoopDependenceAnalysisPass();
|
|
||||||
|
|
||||||
} // namespace llvm
|
|
||||||
|
|
||||||
#endif /* LLVM_ANALYSIS_LOOP_DEPENDENCE_ANALYSIS_H */
|
|
|
@ -185,13 +185,6 @@ namespace llvm {
|
||||||
//
|
//
|
||||||
FunctionPass *createDependenceAnalysisPass();
|
FunctionPass *createDependenceAnalysisPass();
|
||||||
|
|
||||||
//===--------------------------------------------------------------------===//
|
|
||||||
//
|
|
||||||
// createLoopDependenceAnalysisPass - This creates an instance of the
|
|
||||||
// LoopDependenceAnalysis pass.
|
|
||||||
//
|
|
||||||
LoopPass *createLoopDependenceAnalysisPass();
|
|
||||||
|
|
||||||
//===--------------------------------------------------------------------===//
|
//===--------------------------------------------------------------------===//
|
||||||
//
|
//
|
||||||
// Minor pass prototypes, allowing us to expose them through bugpoint and
|
// Minor pass prototypes, allowing us to expose them through bugpoint and
|
||||||
|
|
|
@ -147,7 +147,6 @@ void initializeProfileMetadataLoaderPassPass(PassRegistry&);
|
||||||
void initializePathProfileLoaderPassPass(PassRegistry&);
|
void initializePathProfileLoaderPassPass(PassRegistry&);
|
||||||
void initializeLocalStackSlotPassPass(PassRegistry&);
|
void initializeLocalStackSlotPassPass(PassRegistry&);
|
||||||
void initializeLoopDeletionPass(PassRegistry&);
|
void initializeLoopDeletionPass(PassRegistry&);
|
||||||
void initializeLoopDependenceAnalysisPass(PassRegistry&);
|
|
||||||
void initializeLoopExtractorPass(PassRegistry&);
|
void initializeLoopExtractorPass(PassRegistry&);
|
||||||
void initializeLoopInfoPass(PassRegistry&);
|
void initializeLoopInfoPass(PassRegistry&);
|
||||||
void initializeLoopInstSimplifyPass(PassRegistry&);
|
void initializeLoopInstSimplifyPass(PassRegistry&);
|
||||||
|
|
|
@ -86,7 +86,6 @@ namespace {
|
||||||
(void) llvm::createLCSSAPass();
|
(void) llvm::createLCSSAPass();
|
||||||
(void) llvm::createLICMPass();
|
(void) llvm::createLICMPass();
|
||||||
(void) llvm::createLazyValueInfoPass();
|
(void) llvm::createLazyValueInfoPass();
|
||||||
(void) llvm::createLoopDependenceAnalysisPass();
|
|
||||||
(void) llvm::createLoopExtractorPass();
|
(void) llvm::createLoopExtractorPass();
|
||||||
(void) llvm::createLoopSimplifyPass();
|
(void) llvm::createLoopSimplifyPass();
|
||||||
(void) llvm::createLoopStrengthReducePass();
|
(void) llvm::createLoopStrengthReducePass();
|
||||||
|
|
|
@ -47,7 +47,6 @@ void llvm::initializeAnalysis(PassRegistry &Registry) {
|
||||||
initializeLazyValueInfoPass(Registry);
|
initializeLazyValueInfoPass(Registry);
|
||||||
initializeLibCallAliasAnalysisPass(Registry);
|
initializeLibCallAliasAnalysisPass(Registry);
|
||||||
initializeLintPass(Registry);
|
initializeLintPass(Registry);
|
||||||
initializeLoopDependenceAnalysisPass(Registry);
|
|
||||||
initializeLoopInfoPass(Registry);
|
initializeLoopInfoPass(Registry);
|
||||||
initializeMemDepPrinterPass(Registry);
|
initializeMemDepPrinterPass(Registry);
|
||||||
initializeMemoryDependenceAnalysisPass(Registry);
|
initializeMemoryDependenceAnalysisPass(Registry);
|
||||||
|
|
|
@ -27,7 +27,6 @@ add_llvm_library(LLVMAnalysis
|
||||||
LibCallSemantics.cpp
|
LibCallSemantics.cpp
|
||||||
Lint.cpp
|
Lint.cpp
|
||||||
Loads.cpp
|
Loads.cpp
|
||||||
LoopDependenceAnalysis.cpp
|
|
||||||
LoopInfo.cpp
|
LoopInfo.cpp
|
||||||
LoopPass.cpp
|
LoopPass.cpp
|
||||||
MemDepPrinter.cpp
|
MemDepPrinter.cpp
|
||||||
|
|
|
@ -1,362 +0,0 @@
|
||||||
//===- LoopDependenceAnalysis.cpp - LDA Implementation ----------*- C++ -*-===//
|
|
||||||
//
|
|
||||||
// The LLVM Compiler Infrastructure
|
|
||||||
//
|
|
||||||
// This file is distributed under the University of Illinois Open Source
|
|
||||||
// License. See LICENSE.TXT for details.
|
|
||||||
//
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
//
|
|
||||||
// This is the (beginning) of an implementation of a loop dependence analysis
|
|
||||||
// framework, which is used to detect dependences in memory accesses in loops.
|
|
||||||
//
|
|
||||||
// Please note that this is work in progress and the interface is subject to
|
|
||||||
// change.
|
|
||||||
//
|
|
||||||
// TODO: adapt as implementation progresses.
|
|
||||||
//
|
|
||||||
// TODO: document lingo (pair, subscript, index)
|
|
||||||
//
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
|
|
||||||
#define DEBUG_TYPE "lda"
|
|
||||||
#include "llvm/ADT/DenseSet.h"
|
|
||||||
#include "llvm/ADT/Statistic.h"
|
|
||||||
#include "llvm/Analysis/AliasAnalysis.h"
|
|
||||||
#include "llvm/Analysis/LoopDependenceAnalysis.h"
|
|
||||||
#include "llvm/Analysis/LoopPass.h"
|
|
||||||
#include "llvm/Analysis/ScalarEvolution.h"
|
|
||||||
#include "llvm/Analysis/ScalarEvolutionExpressions.h"
|
|
||||||
#include "llvm/Analysis/ValueTracking.h"
|
|
||||||
#include "llvm/Assembly/Writer.h"
|
|
||||||
#include "llvm/Instructions.h"
|
|
||||||
#include "llvm/Operator.h"
|
|
||||||
#include "llvm/Support/Allocator.h"
|
|
||||||
#include "llvm/Support/Debug.h"
|
|
||||||
#include "llvm/Support/ErrorHandling.h"
|
|
||||||
#include "llvm/Support/raw_ostream.h"
|
|
||||||
#include "llvm/DataLayout.h"
|
|
||||||
using namespace llvm;
|
|
||||||
|
|
||||||
STATISTIC(NumAnswered, "Number of dependence queries answered");
|
|
||||||
STATISTIC(NumAnalysed, "Number of distinct dependence pairs analysed");
|
|
||||||
STATISTIC(NumDependent, "Number of pairs with dependent accesses");
|
|
||||||
STATISTIC(NumIndependent, "Number of pairs with independent accesses");
|
|
||||||
STATISTIC(NumUnknown, "Number of pairs with unknown accesses");
|
|
||||||
|
|
||||||
LoopPass *llvm::createLoopDependenceAnalysisPass() {
|
|
||||||
return new LoopDependenceAnalysis();
|
|
||||||
}
|
|
||||||
|
|
||||||
INITIALIZE_PASS_BEGIN(LoopDependenceAnalysis, "lda",
|
|
||||||
"Loop Dependence Analysis", false, true)
|
|
||||||
INITIALIZE_PASS_DEPENDENCY(ScalarEvolution)
|
|
||||||
INITIALIZE_AG_DEPENDENCY(AliasAnalysis)
|
|
||||||
INITIALIZE_PASS_END(LoopDependenceAnalysis, "lda",
|
|
||||||
"Loop Dependence Analysis", false, true)
|
|
||||||
char LoopDependenceAnalysis::ID = 0;
|
|
||||||
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
// Utility Functions
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
|
|
||||||
static inline bool IsMemRefInstr(const Value *V) {
|
|
||||||
const Instruction *I = dyn_cast<const Instruction>(V);
|
|
||||||
return I && (I->mayReadFromMemory() || I->mayWriteToMemory());
|
|
||||||
}
|
|
||||||
|
|
||||||
static void GetMemRefInstrs(const Loop *L,
|
|
||||||
SmallVectorImpl<Instruction*> &Memrefs) {
|
|
||||||
for (Loop::block_iterator b = L->block_begin(), be = L->block_end();
|
|
||||||
b != be; ++b)
|
|
||||||
for (BasicBlock::iterator i = (*b)->begin(), ie = (*b)->end();
|
|
||||||
i != ie; ++i)
|
|
||||||
if (IsMemRefInstr(i))
|
|
||||||
Memrefs.push_back(i);
|
|
||||||
}
|
|
||||||
|
|
||||||
static bool IsLoadOrStoreInst(Value *I) {
|
|
||||||
// Returns true if the load or store can be analyzed. Atomic and volatile
|
|
||||||
// operations have properties which this analysis does not understand.
|
|
||||||
if (LoadInst *LI = dyn_cast<LoadInst>(I))
|
|
||||||
return LI->isUnordered();
|
|
||||||
else if (StoreInst *SI = dyn_cast<StoreInst>(I))
|
|
||||||
return SI->isUnordered();
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
static Value *GetPointerOperand(Value *I) {
|
|
||||||
if (LoadInst *i = dyn_cast<LoadInst>(I))
|
|
||||||
return i->getPointerOperand();
|
|
||||||
if (StoreInst *i = dyn_cast<StoreInst>(I))
|
|
||||||
return i->getPointerOperand();
|
|
||||||
llvm_unreachable("Value is no load or store instruction!");
|
|
||||||
}
|
|
||||||
|
|
||||||
static AliasAnalysis::AliasResult UnderlyingObjectsAlias(AliasAnalysis *AA,
|
|
||||||
const Value *A,
|
|
||||||
const Value *B) {
|
|
||||||
const Value *aObj = GetUnderlyingObject(A);
|
|
||||||
const Value *bObj = GetUnderlyingObject(B);
|
|
||||||
return AA->alias(aObj, AA->getTypeStoreSize(aObj->getType()),
|
|
||||||
bObj, AA->getTypeStoreSize(bObj->getType()));
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline const SCEV *GetZeroSCEV(ScalarEvolution *SE) {
|
|
||||||
return SE->getConstant(Type::getInt32Ty(SE->getContext()), 0L);
|
|
||||||
}
|
|
||||||
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
// Dependence Testing
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::isDependencePair(const Value *A,
|
|
||||||
const Value *B) const {
|
|
||||||
return IsMemRefInstr(A) &&
|
|
||||||
IsMemRefInstr(B) &&
|
|
||||||
(cast<const Instruction>(A)->mayWriteToMemory() ||
|
|
||||||
cast<const Instruction>(B)->mayWriteToMemory());
|
|
||||||
}
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::findOrInsertDependencePair(Value *A,
|
|
||||||
Value *B,
|
|
||||||
DependencePair *&P) {
|
|
||||||
void *insertPos = 0;
|
|
||||||
FoldingSetNodeID id;
|
|
||||||
id.AddPointer(A);
|
|
||||||
id.AddPointer(B);
|
|
||||||
|
|
||||||
P = Pairs.FindNodeOrInsertPos(id, insertPos);
|
|
||||||
if (P) return true;
|
|
||||||
|
|
||||||
P = new (PairAllocator) DependencePair(id, A, B);
|
|
||||||
Pairs.InsertNode(P, insertPos);
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
void LoopDependenceAnalysis::getLoops(const SCEV *S,
|
|
||||||
DenseSet<const Loop*>* Loops) const {
|
|
||||||
// Refactor this into an SCEVVisitor, if efficiency becomes a concern.
|
|
||||||
for (const Loop *L = this->L; L != 0; L = L->getParentLoop())
|
|
||||||
if (!SE->isLoopInvariant(S, L))
|
|
||||||
Loops->insert(L);
|
|
||||||
}
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::isLoopInvariant(const SCEV *S) const {
|
|
||||||
DenseSet<const Loop*> loops;
|
|
||||||
getLoops(S, &loops);
|
|
||||||
return loops.empty();
|
|
||||||
}
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::isAffine(const SCEV *S) const {
|
|
||||||
const SCEVAddRecExpr *rec = dyn_cast<SCEVAddRecExpr>(S);
|
|
||||||
return isLoopInvariant(S) || (rec && rec->isAffine());
|
|
||||||
}
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::isZIVPair(const SCEV *A, const SCEV *B) const {
|
|
||||||
return isLoopInvariant(A) && isLoopInvariant(B);
|
|
||||||
}
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::isSIVPair(const SCEV *A, const SCEV *B) const {
|
|
||||||
DenseSet<const Loop*> loops;
|
|
||||||
getLoops(A, &loops);
|
|
||||||
getLoops(B, &loops);
|
|
||||||
return loops.size() == 1;
|
|
||||||
}
|
|
||||||
|
|
||||||
LoopDependenceAnalysis::DependenceResult
|
|
||||||
LoopDependenceAnalysis::analyseZIV(const SCEV *A,
|
|
||||||
const SCEV *B,
|
|
||||||
Subscript *S) const {
|
|
||||||
assert(isZIVPair(A, B) && "Attempted to ZIV-test non-ZIV SCEVs!");
|
|
||||||
return A == B ? Dependent : Independent;
|
|
||||||
}
|
|
||||||
|
|
||||||
LoopDependenceAnalysis::DependenceResult
|
|
||||||
LoopDependenceAnalysis::analyseSIV(const SCEV *A,
|
|
||||||
const SCEV *B,
|
|
||||||
Subscript *S) const {
|
|
||||||
return Unknown; // TODO: Implement.
|
|
||||||
}
|
|
||||||
|
|
||||||
LoopDependenceAnalysis::DependenceResult
|
|
||||||
LoopDependenceAnalysis::analyseMIV(const SCEV *A,
|
|
||||||
const SCEV *B,
|
|
||||||
Subscript *S) const {
|
|
||||||
return Unknown; // TODO: Implement.
|
|
||||||
}
|
|
||||||
|
|
||||||
LoopDependenceAnalysis::DependenceResult
|
|
||||||
LoopDependenceAnalysis::analyseSubscript(const SCEV *A,
|
|
||||||
const SCEV *B,
|
|
||||||
Subscript *S) const {
|
|
||||||
DEBUG(dbgs() << " Testing subscript: " << *A << ", " << *B << "\n");
|
|
||||||
|
|
||||||
if (A == B) {
|
|
||||||
DEBUG(dbgs() << " -> [D] same SCEV\n");
|
|
||||||
return Dependent;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (!isAffine(A) || !isAffine(B)) {
|
|
||||||
DEBUG(dbgs() << " -> [?] not affine\n");
|
|
||||||
return Unknown;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (isZIVPair(A, B))
|
|
||||||
return analyseZIV(A, B, S);
|
|
||||||
|
|
||||||
if (isSIVPair(A, B))
|
|
||||||
return analyseSIV(A, B, S);
|
|
||||||
|
|
||||||
return analyseMIV(A, B, S);
|
|
||||||
}
|
|
||||||
|
|
||||||
LoopDependenceAnalysis::DependenceResult
|
|
||||||
LoopDependenceAnalysis::analysePair(DependencePair *P) const {
|
|
||||||
DEBUG(dbgs() << "Analysing:\n" << *P->A << "\n" << *P->B << "\n");
|
|
||||||
|
|
||||||
// We only analyse loads and stores but no possible memory accesses by e.g.
|
|
||||||
// free, call, or invoke instructions.
|
|
||||||
if (!IsLoadOrStoreInst(P->A) || !IsLoadOrStoreInst(P->B)) {
|
|
||||||
DEBUG(dbgs() << "--> [?] no load/store\n");
|
|
||||||
return Unknown;
|
|
||||||
}
|
|
||||||
|
|
||||||
Value *aPtr = GetPointerOperand(P->A);
|
|
||||||
Value *bPtr = GetPointerOperand(P->B);
|
|
||||||
|
|
||||||
switch (UnderlyingObjectsAlias(AA, aPtr, bPtr)) {
|
|
||||||
case AliasAnalysis::MayAlias:
|
|
||||||
case AliasAnalysis::PartialAlias:
|
|
||||||
// We can not analyse objects if we do not know about their aliasing.
|
|
||||||
DEBUG(dbgs() << "---> [?] may alias\n");
|
|
||||||
return Unknown;
|
|
||||||
|
|
||||||
case AliasAnalysis::NoAlias:
|
|
||||||
// If the objects noalias, they are distinct, accesses are independent.
|
|
||||||
DEBUG(dbgs() << "---> [I] no alias\n");
|
|
||||||
return Independent;
|
|
||||||
|
|
||||||
case AliasAnalysis::MustAlias:
|
|
||||||
break; // The underlying objects alias, test accesses for dependence.
|
|
||||||
}
|
|
||||||
|
|
||||||
const GEPOperator *aGEP = dyn_cast<GEPOperator>(aPtr);
|
|
||||||
const GEPOperator *bGEP = dyn_cast<GEPOperator>(bPtr);
|
|
||||||
|
|
||||||
if (!aGEP || !bGEP)
|
|
||||||
return Unknown;
|
|
||||||
|
|
||||||
// FIXME: Is filtering coupled subscripts necessary?
|
|
||||||
|
|
||||||
// Collect GEP operand pairs (FIXME: use GetGEPOperands from BasicAA), adding
|
|
||||||
// trailing zeroes to the smaller GEP, if needed.
|
|
||||||
typedef SmallVector<std::pair<const SCEV*, const SCEV*>, 4> GEPOpdPairsTy;
|
|
||||||
GEPOpdPairsTy opds;
|
|
||||||
for(GEPOperator::const_op_iterator aIdx = aGEP->idx_begin(),
|
|
||||||
aEnd = aGEP->idx_end(),
|
|
||||||
bIdx = bGEP->idx_begin(),
|
|
||||||
bEnd = bGEP->idx_end();
|
|
||||||
aIdx != aEnd && bIdx != bEnd;
|
|
||||||
aIdx += (aIdx != aEnd), bIdx += (bIdx != bEnd)) {
|
|
||||||
const SCEV* aSCEV = (aIdx != aEnd) ? SE->getSCEV(*aIdx) : GetZeroSCEV(SE);
|
|
||||||
const SCEV* bSCEV = (bIdx != bEnd) ? SE->getSCEV(*bIdx) : GetZeroSCEV(SE);
|
|
||||||
opds.push_back(std::make_pair(aSCEV, bSCEV));
|
|
||||||
}
|
|
||||||
|
|
||||||
if (!opds.empty() && opds[0].first != opds[0].second) {
|
|
||||||
// We cannot (yet) handle arbitrary GEP pointer offsets. By limiting
|
|
||||||
//
|
|
||||||
// TODO: this could be relaxed by adding the size of the underlying object
|
|
||||||
// to the first subscript. If we have e.g. (GEP x,0,i; GEP x,2,-i) and we
|
|
||||||
// know that x is a [100 x i8]*, we could modify the first subscript to be
|
|
||||||
// (i, 200-i) instead of (i, -i).
|
|
||||||
return Unknown;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Now analyse the collected operand pairs (skipping the GEP ptr offsets).
|
|
||||||
for (GEPOpdPairsTy::const_iterator i = opds.begin() + 1, end = opds.end();
|
|
||||||
i != end; ++i) {
|
|
||||||
Subscript subscript;
|
|
||||||
DependenceResult result = analyseSubscript(i->first, i->second, &subscript);
|
|
||||||
if (result != Dependent) {
|
|
||||||
// We either proved independence or failed to analyse this subscript.
|
|
||||||
// Further subscripts will not improve the situation, so abort early.
|
|
||||||
return result;
|
|
||||||
}
|
|
||||||
P->Subscripts.push_back(subscript);
|
|
||||||
}
|
|
||||||
// We successfully analysed all subscripts but failed to prove independence.
|
|
||||||
return Dependent;
|
|
||||||
}
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::depends(Value *A, Value *B) {
|
|
||||||
assert(isDependencePair(A, B) && "Values form no dependence pair!");
|
|
||||||
++NumAnswered;
|
|
||||||
|
|
||||||
DependencePair *p;
|
|
||||||
if (!findOrInsertDependencePair(A, B, p)) {
|
|
||||||
// The pair is not cached, so analyse it.
|
|
||||||
++NumAnalysed;
|
|
||||||
switch (p->Result = analysePair(p)) {
|
|
||||||
case Dependent: ++NumDependent; break;
|
|
||||||
case Independent: ++NumIndependent; break;
|
|
||||||
case Unknown: ++NumUnknown; break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return p->Result != Independent;
|
|
||||||
}
|
|
||||||
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
// LoopDependenceAnalysis Implementation
|
|
||||||
//===----------------------------------------------------------------------===//
|
|
||||||
|
|
||||||
bool LoopDependenceAnalysis::runOnLoop(Loop *L, LPPassManager &) {
|
|
||||||
this->L = L;
|
|
||||||
AA = &getAnalysis<AliasAnalysis>();
|
|
||||||
SE = &getAnalysis<ScalarEvolution>();
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
void LoopDependenceAnalysis::releaseMemory() {
|
|
||||||
Pairs.clear();
|
|
||||||
PairAllocator.Reset();
|
|
||||||
}
|
|
||||||
|
|
||||||
void LoopDependenceAnalysis::getAnalysisUsage(AnalysisUsage &AU) const {
|
|
||||||
AU.setPreservesAll();
|
|
||||||
AU.addRequiredTransitive<AliasAnalysis>();
|
|
||||||
AU.addRequiredTransitive<ScalarEvolution>();
|
|
||||||
}
|
|
||||||
|
|
||||||
static void PrintLoopInfo(raw_ostream &OS,
|
|
||||||
LoopDependenceAnalysis *LDA, const Loop *L) {
|
|
||||||
if (!L->empty()) return; // ignore non-innermost loops
|
|
||||||
|
|
||||||
SmallVector<Instruction*, 8> memrefs;
|
|
||||||
GetMemRefInstrs(L, memrefs);
|
|
||||||
|
|
||||||
OS << "Loop at depth " << L->getLoopDepth() << ", header block: ";
|
|
||||||
WriteAsOperand(OS, L->getHeader(), false);
|
|
||||||
OS << "\n";
|
|
||||||
|
|
||||||
OS << " Load/store instructions: " << memrefs.size() << "\n";
|
|
||||||
for (SmallVector<Instruction*, 8>::const_iterator x = memrefs.begin(),
|
|
||||||
end = memrefs.end(); x != end; ++x)
|
|
||||||
OS << "\t" << (x - memrefs.begin()) << ": " << **x << "\n";
|
|
||||||
|
|
||||||
OS << " Pairwise dependence results:\n";
|
|
||||||
for (SmallVector<Instruction*, 8>::const_iterator x = memrefs.begin(),
|
|
||||||
end = memrefs.end(); x != end; ++x)
|
|
||||||
for (SmallVector<Instruction*, 8>::const_iterator y = x + 1;
|
|
||||||
y != end; ++y)
|
|
||||||
if (LDA->isDependencePair(*x, *y))
|
|
||||||
OS << "\t" << (x - memrefs.begin()) << "," << (y - memrefs.begin())
|
|
||||||
<< ": " << (LDA->depends(*x, *y) ? "dependent" : "independent")
|
|
||||||
<< "\n";
|
|
||||||
}
|
|
||||||
|
|
||||||
void LoopDependenceAnalysis::print(raw_ostream &OS, const Module*) const {
|
|
||||||
// TODO: doc why const_cast is safe
|
|
||||||
PrintLoopInfo(OS, const_cast<LoopDependenceAnalysis*>(this), this->L);
|
|
||||||
}
|
|
|
@ -1,44 +0,0 @@
|
||||||
; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s
|
|
||||||
|
|
||||||
;; x[5] = x[6] // with x being a pointer passed as argument
|
|
||||||
|
|
||||||
define void @f1(i32* nocapture %xptr) nounwind {
|
|
||||||
entry:
|
|
||||||
%x.ld.addr = getelementptr i32* %xptr, i64 6
|
|
||||||
%x.st.addr = getelementptr i32* %xptr, i64 5
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x = load i32* %x.ld.addr
|
|
||||||
store i32 %x, i32* %x.st.addr
|
|
||||||
; CHECK: 0,1: dep
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; x[5] = x[6] // with x being an array on the stack
|
|
||||||
|
|
||||||
define void @foo(...) nounwind {
|
|
||||||
entry:
|
|
||||||
%xptr = alloca [256 x i32], align 4
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* %xptr, i64 0, i64 6
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* %xptr, i64 0, i64 5
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x = load i32* %x.ld.addr
|
|
||||||
store i32 %x, i32* %x.st.addr
|
|
||||||
; CHECK: 0,1: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
|
@ -1 +0,0 @@
|
||||||
config.suffixes = ['.ll', '.c', '.cpp']
|
|
|
@ -1,110 +0,0 @@
|
||||||
; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s
|
|
||||||
|
|
||||||
@x = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
@y = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
|
|
||||||
;; for (i = 0; i < 256; i++)
|
|
||||||
;; x[i] = x[i] + y[i]
|
|
||||||
|
|
||||||
define void @f1(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%y.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%x = load i32* %x.addr ; 0
|
|
||||||
%y = load i32* %y.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; for (i = 0; i < 256; i++)
|
|
||||||
;; x[i+1] = x[i] + y[i]
|
|
||||||
|
|
||||||
define void @f2(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.next
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; for (i = 0; i < 10; i++)
|
|
||||||
;; x[i+20] = x[i] + y[i]
|
|
||||||
|
|
||||||
define void @f3(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%i.20 = add i64 %i, 20
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.20
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 10
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; for (i = 0; i < 10; i++)
|
|
||||||
;; x[10*i+1] = x[10*i] + y[i]
|
|
||||||
|
|
||||||
define void @f4(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%i.10 = mul i64 %i, 10
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i.10
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.10
|
|
||||||
%i.10.1 = add i64 %i.10, 1
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.10.1
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 10
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
|
@ -1,118 +0,0 @@
|
||||||
; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s
|
|
||||||
|
|
||||||
@x = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
@y = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
|
|
||||||
;; for (i = 0; i < 256; i++)
|
|
||||||
;; x[i] = x[255 - i] + y[i]
|
|
||||||
|
|
||||||
define void @f1(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%i.255 = sub i64 255, %i
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.255
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; for (i = 0; i < 100; i++)
|
|
||||||
;; x[i] = x[255 - i] + y[i]
|
|
||||||
|
|
||||||
define void @f2(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%i.255 = sub i64 255, %i
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.255
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 100
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; // the first iteration (i=0) leads to an out-of-bounds access of x. as the
|
|
||||||
;; // result of this access is undefined, _any_ dependence result is safe.
|
|
||||||
;; for (i = 0; i < 256; i++)
|
|
||||||
;; x[i] = x[256 - i] + y[i]
|
|
||||||
|
|
||||||
define void @f3(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%i.256 = sub i64 0, %i
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 1, i64 %i.256
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2:
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; // slightly contrived but valid IR for the following loop, where all
|
|
||||||
;; // accesses in all iterations are within bounds. while this example's first
|
|
||||||
;; // (ZIV-)subscript is (0, 1), accesses are dependent.
|
|
||||||
;; for (i = 1; i < 256; i++)
|
|
||||||
;; x[i] = x[256 - i] + y[i]
|
|
||||||
|
|
||||||
define void @f4(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%i.1 = add i64 1, %i
|
|
||||||
%i.256 = sub i64 -1, %i
|
|
||||||
%y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i.1
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 1, i64 %i.256
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.1
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.ld.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.st.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
|
@ -1,56 +0,0 @@
|
||||||
; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s
|
|
||||||
|
|
||||||
@x = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
@y = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
|
|
||||||
;; for (i = 0; i < 256; i++)
|
|
||||||
;; x[i] = x[42] + y[i]
|
|
||||||
|
|
||||||
define void @f1(...) nounwind {
|
|
||||||
entry:
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 42
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%y.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; for (i = 0; i < 250; i++)
|
|
||||||
;; x[i] = x[255] + y[i]
|
|
||||||
|
|
||||||
define void @f2(...) nounwind {
|
|
||||||
entry:
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 255
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i
|
|
||||||
%y.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
|
|
||||||
%x = load i32* %x.ld.addr ; 0
|
|
||||||
%y = load i32* %y.addr ; 1
|
|
||||||
%r = add i32 %y, %x
|
|
||||||
store i32 %r, i32* %x.addr ; 2
|
|
||||||
; CHECK: 0,2: dep
|
|
||||||
; CHECK: 1,2: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 250
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
|
@ -1,63 +0,0 @@
|
||||||
; RUN: opt < %s -analyze -basicaa -lda | FileCheck %s
|
|
||||||
|
|
||||||
@x = common global [256 x i32] zeroinitializer, align 4
|
|
||||||
|
|
||||||
;; x[5] = x[6]
|
|
||||||
|
|
||||||
define void @f1(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x = load i32* getelementptr ([256 x i32]* @x, i32 0, i64 6)
|
|
||||||
store i32 %x, i32* getelementptr ([256 x i32]* @x, i32 0, i64 5)
|
|
||||||
; CHECK: 0,1: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; x[c] = x[c+1] // with c being a loop-invariant constant
|
|
||||||
|
|
||||||
define void @f2(i64 %c0) nounwind {
|
|
||||||
entry:
|
|
||||||
%c1 = add i64 %c0, 1
|
|
||||||
%x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %c0
|
|
||||||
%x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %c1
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x = load i32* %x.ld.addr
|
|
||||||
store i32 %x, i32* %x.st.addr
|
|
||||||
; CHECK: 0,1: ind
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
||||||
|
|
||||||
;; x[6] = x[6]
|
|
||||||
|
|
||||||
define void @f3(...) nounwind {
|
|
||||||
entry:
|
|
||||||
br label %for.body
|
|
||||||
|
|
||||||
for.body:
|
|
||||||
%i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
|
|
||||||
%x = load i32* getelementptr ([256 x i32]* @x, i32 0, i64 6)
|
|
||||||
store i32 %x, i32* getelementptr ([256 x i32]* @x, i32 0, i64 6)
|
|
||||||
; CHECK: 0,1: dep
|
|
||||||
%i.next = add i64 %i, 1
|
|
||||||
%exitcond = icmp eq i64 %i.next, 256
|
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
|
||||||
|
|
||||||
for.end:
|
|
||||||
ret void
|
|
||||||
}
|
|
Loading…
Reference in New Issue