Rename AddReadAttrs to FunctionAttrs, and teach it how

to work out (in a very simplistic way) which function
arguments (pointer arguments only) are only dereferenced
and so do not escape.  Mark such arguments 'nocapture'.

llvm-svn: 61525
This commit is contained in:
Duncan Sands 2008-12-31 16:14:43 +00:00
parent 2cc3ce0002
commit 44c8cd97a5
14 changed files with 175 additions and 25 deletions

View File

@ -122,7 +122,7 @@ namespace {
(void) llvm::createPostDomFrontier(); (void) llvm::createPostDomFrontier();
(void) llvm::createInstructionNamerPass(); (void) llvm::createInstructionNamerPass();
(void) llvm::createPartialSpecializationPass(); (void) llvm::createPartialSpecializationPass();
(void) llvm::createAddReadAttrsPass(); (void) llvm::createFunctionAttrsPass();
(void) llvm::createMergeFunctionsPass(); (void) llvm::createMergeFunctionsPass();
(void) llvm::createPrintModulePass(0); (void) llvm::createPrintModulePass(0);
(void) llvm::createPrintFunctionPass("", 0); (void) llvm::createPrintFunctionPass("", 0);

View File

@ -196,10 +196,12 @@ ModulePass *createStripDeadPrototypesPass();
ModulePass *createPartialSpecializationPass(); ModulePass *createPartialSpecializationPass();
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
/// createAddReadAttrsPass - This pass discovers functions that do not access /// createFunctionAttrsPass - This pass discovers functions that do not access
/// memory, or only read memory, and gives them the readnone/readonly attribute. /// memory, or only read memory, and gives them the readnone/readonly attribute.
/// It also discovers function arguments that are not captured by the function
/// and marks them with the nocapture attribute.
/// ///
Pass *createAddReadAttrsPass(); Pass *createFunctionAttrsPass();
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
/// createMergeFunctionsPass - This pass discovers identical functions and /// createMergeFunctionsPass - This pass discovers identical functions and

View File

@ -1,5 +1,5 @@
add_llvm_library(LLVMipo add_llvm_library(LLVMipo
AddReadAttrs.cpp FunctionAttrs.cpp
ArgumentPromotion.cpp ArgumentPromotion.cpp
ConstantMerge.cpp ConstantMerge.cpp
DeadArgumentElimination.cpp DeadArgumentElimination.cpp

View File

@ -1,4 +1,4 @@
//===- AddReadAttrs.cpp - Pass which marks functions readnone or readonly -===// //===- FunctionAttrs.cpp - Pass which marks functions readnone or readonly ===//
// //
// The LLVM Compiler Infrastructure // The LLVM Compiler Infrastructure
// //
@ -14,7 +14,7 @@
// //
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
#define DEBUG_TYPE "addreadattrs" #define DEBUG_TYPE "functionattrs"
#include "llvm/Transforms/IPO.h" #include "llvm/Transforms/IPO.h"
#include "llvm/CallGraphSCCPass.h" #include "llvm/CallGraphSCCPass.h"
#include "llvm/GlobalVariable.h" #include "llvm/GlobalVariable.h"
@ -28,15 +28,25 @@ using namespace llvm;
STATISTIC(NumReadNone, "Number of functions marked readnone"); STATISTIC(NumReadNone, "Number of functions marked readnone");
STATISTIC(NumReadOnly, "Number of functions marked readonly"); STATISTIC(NumReadOnly, "Number of functions marked readonly");
STATISTIC(NumNoCapture, "Number of arguments marked nocapture");
namespace { namespace {
struct VISIBILITY_HIDDEN AddReadAttrs : public CallGraphSCCPass { struct VISIBILITY_HIDDEN FunctionAttrs : public CallGraphSCCPass {
static char ID; // Pass identification, replacement for typeid static char ID; // Pass identification, replacement for typeid
AddReadAttrs() : CallGraphSCCPass(&ID) {} FunctionAttrs() : CallGraphSCCPass(&ID) {}
// runOnSCC - Analyze the SCC, performing the transformation if possible. // runOnSCC - Analyze the SCC, performing the transformation if possible.
bool runOnSCC(const std::vector<CallGraphNode *> &SCC); bool runOnSCC(const std::vector<CallGraphNode *> &SCC);
// AddReadAttrs - Deduce readonly/readnone attributes for the SCC.
bool AddReadAttrs(const std::vector<CallGraphNode *> &SCC);
// AddNoCaptureAttrs - Deduce nocapture attributes for the SCC.
bool AddNoCaptureAttrs(const std::vector<CallGraphNode *> &SCC);
// isCaptured - Returns whether this pointer value is captured.
bool isCaptured(Function &F, Value *V);
virtual void getAnalysisUsage(AnalysisUsage &AU) const { virtual void getAnalysisUsage(AnalysisUsage &AU) const {
AU.setPreservesCFG(); AU.setPreservesCFG();
CallGraphSCCPass::getAnalysisUsage(AU); CallGraphSCCPass::getAnalysisUsage(AU);
@ -46,17 +56,17 @@ namespace {
}; };
} }
char AddReadAttrs::ID = 0; char FunctionAttrs::ID = 0;
static RegisterPass<AddReadAttrs> static RegisterPass<FunctionAttrs>
X("addreadattrs", "Mark functions readnone/readonly"); X("functionattrs", "Deduce function attributes");
Pass *llvm::createAddReadAttrsPass() { return new AddReadAttrs(); } Pass *llvm::createFunctionAttrsPass() { return new FunctionAttrs(); }
/// PointsToLocalMemory - Returns whether the given pointer value points to /// PointsToLocalMemory - Returns whether the given pointer value points to
/// memory that is local to the function. Global constants are considered /// memory that is local to the function. Global constants are considered
/// local to all functions. /// local to all functions.
bool AddReadAttrs::PointsToLocalMemory(Value *V) { bool FunctionAttrs::PointsToLocalMemory(Value *V) {
V = V->getUnderlyingObject(); V = V->getUnderlyingObject();
// An alloca instruction defines local memory. // An alloca instruction defines local memory.
if (isa<AllocaInst>(V)) if (isa<AllocaInst>(V))
@ -69,8 +79,9 @@ bool AddReadAttrs::PointsToLocalMemory(Value *V) {
return false; return false;
} }
bool AddReadAttrs::runOnSCC(const std::vector<CallGraphNode *> &SCC) { /// AddReadAttrs - Deduce readonly/readnone attributes for the SCC.
SmallPtrSet<CallGraphNode *, 8> SCCNodes; bool FunctionAttrs::AddReadAttrs(const std::vector<CallGraphNode *> &SCC) {
SmallPtrSet<CallGraphNode*, 8> SCCNodes;
CallGraph &CG = getAnalysis<CallGraph>(); CallGraph &CG = getAnalysis<CallGraph>();
// Fill SCCNodes with the elements of the SCC. Used for quickly // Fill SCCNodes with the elements of the SCC. Used for quickly
@ -154,7 +165,7 @@ bool AddReadAttrs::runOnSCC(const std::vector<CallGraphNode *> &SCC) {
F->removeAttribute(~0, Attribute::ReadOnly | Attribute::ReadNone); F->removeAttribute(~0, Attribute::ReadOnly | Attribute::ReadNone);
// Add in the new attribute. // Add in the new attribute.
F->addAttribute(~0, ReadsMemory ? Attribute::ReadOnly : Attribute::ReadNone); F->addAttribute(~0, ReadsMemory? Attribute::ReadOnly : Attribute::ReadNone);
if (ReadsMemory) if (ReadsMemory)
NumReadOnly++; NumReadOnly++;
@ -164,3 +175,106 @@ bool AddReadAttrs::runOnSCC(const std::vector<CallGraphNode *> &SCC) {
return MadeChange; return MadeChange;
} }
/// isCaptured - Returns whether this pointer value is captured.
bool FunctionAttrs::isCaptured(Function &F, Value *V) {
SmallVector<Use*, 16> Worklist;
SmallPtrSet<Use*, 16> Visited;
for (Value::use_iterator UI = V->use_begin(), UE = V->use_end(); UI != UE;
++UI) {
Use *U = &UI.getUse();
Visited.insert(U);
Worklist.push_back(U);
}
while (!Worklist.empty()) {
Use *U = Worklist.pop_back_val();
Instruction *I = cast<Instruction>(U->getUser());
V = U->get();
if (isa<LoadInst>(I)) {
// Loading a pointer does not cause it to escape.
continue;
}
if (isa<StoreInst>(I)) {
if (V == I->getOperand(0))
// Stored the pointer - escapes. TODO: improve this.
return true;
// Storing to the pointee does not cause the pointer to escape.
continue;
}
CallSite CS = CallSite::get(I);
if (CS.getInstruction()) {
// Does not escape if only passed via 'nocapture' arguments. Note
// that calling a function pointer does not in itself cause that
// function pointer to escape. This is a subtle point considering
// that (for example) the callee might return its own address. It
// is analogous to saying that loading a value from a pointer does
// not cause the pointer to escape, even though the loaded value
// might be the pointer itself (think of self-referential objects).
CallSite::arg_iterator B = CS.arg_begin(), E = CS.arg_end();
for (CallSite::arg_iterator A = B; A != E; ++A)
if (A->get() == V && !CS.paramHasAttr(A-B+1, Attribute::NoCapture))
// The parameter is not marked 'nocapture' - escapes.
return true;
// Only passed via 'nocapture' arguments, or is the called function.
// Does not escape.
continue;
}
if (isa<BitCastInst>(I) || isa<GetElementPtrInst>(I)) {
// Type conversion or calculating an offset. Does not escape if the new
// value doesn't.
for (Instruction::use_iterator UI = I->use_begin(), UE = I->use_end();
UI != UE; ++UI) {
Use *U = &UI.getUse();
if (Visited.insert(U))
Worklist.push_back(U);
}
continue;
}
// Something else - be conservative and say it escapes.
return true;
}
return false;
}
/// AddNoCaptureAttrs - Deduce nocapture attributes for the SCC.
bool FunctionAttrs::AddNoCaptureAttrs(const std::vector<CallGraphNode *> &SCC) {
bool Changed = false;
// Check each function in turn, determining which pointer arguments are not
// captured.
for (unsigned i = 0, e = SCC.size(); i != e; ++i) {
Function *F = SCC[i]->getFunction();
if (F == 0)
// External node - skip it;
continue;
// Definitions with weak linkage may be overridden at linktime with
// something that writes memory, so treat them like declarations.
if (F->isDeclaration() || F->mayBeOverridden())
continue;
for (Function::arg_iterator A = F->arg_begin(), E = F->arg_end(); A!=E; ++A)
if (isa<PointerType>(A->getType()) && !isCaptured(*F, A)) {
A->addAttr(Attribute::NoCapture);
NumNoCapture++;
Changed = true;
}
}
return Changed;
}
bool FunctionAttrs::runOnSCC(const std::vector<CallGraphNode *> &SCC) {
bool Changed = AddReadAttrs(SCC);
Changed |= AddNoCaptureAttrs(SCC);
return Changed;
}

View File

@ -1,4 +1,4 @@
; RUN: llvm-as < %s | opt -addreadattrs | llvm-dis | grep readnone ; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | grep readnone
define i32 @a() { define i32 @a() {
%tmp = call i32 @b( ) ; <i32> [#uses=1] %tmp = call i32 @b( ) ; <i32> [#uses=1]

View File

@ -1,4 +1,4 @@
; RUN: llvm-as < %s | opt -addreadattrs | llvm-dis | grep readnone | count 4 ; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | grep readnone | count 4
@x = global i32 0 @x = global i32 0
declare i32 @e() readnone declare i32 @e() readnone

View File

@ -1,4 +1,4 @@
; RUN: llvm-as < %s | opt -addreadattrs | llvm-dis | grep readonly | count 2 ; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | grep readonly | count 2
define i32 @f() { define i32 @f() {
entry: entry:

View File

@ -1,4 +1,4 @@
; RUN: llvm-as < %s | opt -addreadattrs | llvm-dis | not grep read ; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | not grep read
; PR2792 ; PR2792
@g = global i32 0 ; <i32*> [#uses=1] @g = global i32 0 ; <i32*> [#uses=1]

View File

@ -1,4 +1,4 @@
; RUN: llvm-as < %s | opt -addreadattrs | llvm-dis | grep readnone | count 2 ; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | grep readnone | count 2
declare i32 @g(i32*) readnone declare i32 @g(i32*) readnone

View File

@ -1,4 +1,4 @@
; RUN: llvm-as < %s | opt -addreadattrs | llvm-dis | grep readnone ; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | grep readnone
@s = external constant i8 ; <i8*> [#uses=1] @s = external constant i8 ; <i8*> [#uses=1]

View File

@ -0,0 +1,34 @@
; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | not grep {@c.*nocapture}
; RUN: llvm-as < %s | opt -functionattrs | llvm-dis | grep nocapture | count 3
@g = global i32* null ; <i32**> [#uses=1]
define i32* @c1(i32* %p) {
ret i32* %p
}
define void @c2(i32* %p) {
store i32* %p, i32** @g
ret void
}
define void @c3(i32* %p) {
call void @c2(i32* %p)
ret void
}
define i32 @nc1(i32* %p) {
%tmp = bitcast i32* %p to i32* ; <i32*> [#uses=2]
%val = load i32* %tmp ; <i32> [#uses=1]
store i32 0, i32* %tmp
ret i32 %val
}
define void @nc2(i32* %p) {
%1 = call i32 @nc1(i32* %p) ; <i32> [#uses=0]
ret void
}
define void @nc3(void ()* %f) {
call void %f()
ret void
}

View File

@ -291,7 +291,7 @@ void AddOptimizationPasses(PassManager &MPM, FunctionPassManager &FPM,
MPM.add(createCFGSimplificationPass()); // Clean up after IPCP & DAE MPM.add(createCFGSimplificationPass()); // Clean up after IPCP & DAE
if (UnitAtATime) { if (UnitAtATime) {
MPM.add(createPruneEHPass()); // Remove dead EH info MPM.add(createPruneEHPass()); // Remove dead EH info
MPM.add(createAddReadAttrsPass()); // Set readonly/readnone attrs MPM.add(createFunctionAttrsPass()); // Deduce function attrs
} }
if (OptLevel > 1) if (OptLevel > 1)
MPM.add(createFunctionInliningPass()); // Inline small functions MPM.add(createFunctionInliningPass()); // Inline small functions
@ -363,7 +363,7 @@ void AddStandardCompilePasses(PassManager &PM) {
addPass(PM, createCFGSimplificationPass()); // Clean up after IPCP & DAE addPass(PM, createCFGSimplificationPass()); // Clean up after IPCP & DAE
addPass(PM, createPruneEHPass()); // Remove dead EH info addPass(PM, createPruneEHPass()); // Remove dead EH info
addPass(PM, createAddReadAttrsPass()); // Set readonly/readnone attrs addPass(PM, createFunctionAttrsPass()); // Deduce function attrs
if (!DisableInline) if (!DisableInline)
addPass(PM, createFunctionInliningPass()); // Inline small functions addPass(PM, createFunctionInliningPass()); // Inline small functions

View File

@ -344,7 +344,7 @@
Name="IPO" Name="IPO"
> >
<File <File
RelativePath="..\..\lib\Transforms\IPO\AddReadAttrs.cpp" RelativePath="..\..\lib\Transforms\IPO\FunctionAttrs.cpp"
> >
</File> </File>
<File <File