forked from OSchip/llvm-project
609 lines
19 KiB
C++
609 lines
19 KiB
C++
//===--- CFG.cpp - Classes for representing and building CFGs----*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file was developed by Ted Kremenek and is distributed under
|
|
// the University of Illinois Open Source License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file defines the CFG and CFGBuilder classes for representing and
|
|
// building Control-Flow Graphs (CFGs) from ASTs.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "clang/AST/CFG.h"
|
|
#include "clang/AST/Expr.h"
|
|
#include "clang/AST/StmtVisitor.h"
|
|
#include "llvm/ADT/DenseMap.h"
|
|
#include <iostream>
|
|
#include <iomanip>
|
|
#include <algorithm>
|
|
using namespace clang;
|
|
|
|
namespace {
|
|
|
|
// SaveAndRestore - A utility class that uses RIIA to save and restore
|
|
// the value of a variable.
|
|
template<typename T>
|
|
struct SaveAndRestore {
|
|
SaveAndRestore(T& x) : X(x), old_value(x) {}
|
|
~SaveAndRestore() { X = old_value; }
|
|
|
|
T& X;
|
|
T old_value;
|
|
};
|
|
}
|
|
|
|
/// CFGBuilder - This class is implements CFG construction from an AST.
|
|
/// The builder is stateful: an instance of the builder should be used to only
|
|
/// construct a single CFG.
|
|
///
|
|
/// Example usage:
|
|
///
|
|
/// CFGBuilder builder;
|
|
/// CFG* cfg = builder.BuildAST(stmt1);
|
|
///
|
|
/// CFG construction is done via a recursive walk of an AST.
|
|
/// We actually parse the AST in reverse order so that the successor
|
|
/// of a basic block is constructed prior to its predecessor. This
|
|
/// allows us to nicely capture implicit fall-throughs without extra
|
|
/// basic blocks.
|
|
///
|
|
class CFGBuilder : public StmtVisitor<CFGBuilder,CFGBlock*> {
|
|
CFG* cfg;
|
|
CFGBlock* Block;
|
|
CFGBlock* Exit;
|
|
CFGBlock* Succ;
|
|
CFGBlock* ContinueTargetBlock;
|
|
CFGBlock* BreakTargetBlock;
|
|
unsigned NumBlocks;
|
|
|
|
typedef llvm::DenseMap<LabelStmt*,CFGBlock*> LabelMapTy;
|
|
LabelMapTy LabelMap;
|
|
|
|
typedef std::vector<CFGBlock*> BackpatchBlocksTy;
|
|
BackpatchBlocksTy BackpatchBlocks;
|
|
|
|
public:
|
|
explicit CFGBuilder() : cfg(NULL), Block(NULL), Exit(NULL), Succ(NULL),
|
|
ContinueTargetBlock(NULL), BreakTargetBlock(NULL),
|
|
NumBlocks(0) {
|
|
// Create an empty CFG.
|
|
cfg = new CFG();
|
|
}
|
|
|
|
~CFGBuilder() { delete cfg; }
|
|
|
|
/// BuildCFG - Constructs a CFG from an AST (a Stmt*). The AST can
|
|
/// represent an arbitrary statement. Examples include a single expression
|
|
/// or a function body (compound statement). The ownership of the returned
|
|
/// CFG is transferred to the caller. If CFG construction fails, this method
|
|
/// returns NULL.
|
|
CFG* BuildCFG(Stmt* Statement) {
|
|
if (!Statement) return NULL;
|
|
|
|
assert (!Exit && "CFGBuilder should only be used to construct one CFG");
|
|
|
|
// Create the exit block.
|
|
Block = createBlock();
|
|
Exit = Block;
|
|
|
|
// Visit the statements and create the CFG.
|
|
if (CFGBlock* B = Visit(Statement)) {
|
|
// Finalize the last constructed block. This usually involves
|
|
// reversing the order of the statements in the block.
|
|
FinishBlock(B);
|
|
cfg->setEntry(B);
|
|
|
|
// Backpatch the gotos whose label -> block mappings we didn't know
|
|
// when we encountered them.
|
|
for (BackpatchBlocksTy::iterator I = BackpatchBlocks.begin(),
|
|
E = BackpatchBlocks.end(); I != E; ++I ) {
|
|
|
|
CFGBlock* B = *I;
|
|
GotoStmt* G = cast<GotoStmt>(B->getTerminator());
|
|
LabelMapTy::iterator LI = LabelMap.find(G->getLabel());
|
|
|
|
if (LI == LabelMap.end())
|
|
return NULL; // No matching label. Bad CFG.
|
|
|
|
B->addSuccessor(LI->second);
|
|
}
|
|
|
|
// NULL out cfg so that repeated calls
|
|
CFG* t = cfg;
|
|
cfg = NULL;
|
|
return t;
|
|
}
|
|
else return NULL;
|
|
}
|
|
|
|
// createBlock - Used to lazily create blocks that are connected
|
|
// to the current (global) succcessor.
|
|
CFGBlock* createBlock( bool add_successor = true ) {
|
|
CFGBlock* B = cfg->createBlock(NumBlocks++);
|
|
if (add_successor && Succ) B->addSuccessor(Succ);
|
|
return B;
|
|
}
|
|
|
|
// FinishBlock - When the last statement has been added to the block,
|
|
// usually we must reverse the statements because they have been inserted
|
|
// in reverse order. When processing labels, however, there are cases
|
|
// in the recursion where we may have already reversed the statements
|
|
// in a block. This method safely tidies up a block: if the block
|
|
// has a label at the front, it has already been reversed. Otherwise,
|
|
// we reverse it.
|
|
void FinishBlock(CFGBlock* B) {
|
|
assert (B);
|
|
CFGBlock::iterator I = B->begin();
|
|
if (I != B->end()) {
|
|
Stmt* S = *I;
|
|
if (S->getStmtClass() != Stmt::LabelStmtClass)
|
|
B->reverseStmts();
|
|
}
|
|
}
|
|
|
|
/// Here we handle statements with no branching control flow.
|
|
CFGBlock* VisitStmt(Stmt* Statement) {
|
|
// We cannot assume that we are in the middle of a basic block, since
|
|
// the CFG might only be constructed for this single statement. If
|
|
// we have no current basic block, just create one lazily.
|
|
if (!Block) Block = createBlock();
|
|
|
|
// Simply add the statement to the current block. We actually
|
|
// insert statements in reverse order; this order is reversed later
|
|
// when processing the containing element in the AST.
|
|
Block->appendStmt(Statement);
|
|
|
|
return Block;
|
|
}
|
|
|
|
CFGBlock* VisitNullStmt(NullStmt* Statement) {
|
|
return Block;
|
|
}
|
|
|
|
CFGBlock* VisitCompoundStmt(CompoundStmt* C) {
|
|
// The value returned from this function is the last created CFGBlock
|
|
// that represents the "entry" point for the translated AST node.
|
|
CFGBlock* LastBlock;
|
|
|
|
for (CompoundStmt::reverse_body_iterator I = C->body_rbegin(),
|
|
E = C->body_rend(); I != E; ++I )
|
|
// Add the statement to the current block.
|
|
if (!(LastBlock=Visit(*I)))
|
|
return NULL;
|
|
|
|
return LastBlock;
|
|
}
|
|
|
|
CFGBlock* VisitIfStmt(IfStmt* I) {
|
|
|
|
// We may see an if statement in the middle of a basic block, or
|
|
// it may be the first statement we are processing. In either case,
|
|
// we create a new basic block. First, we create the blocks for
|
|
// the then...else statements, and then we create the block containing
|
|
// the if statement. If we were in the middle of a block, we
|
|
// stop processing that block and reverse its statements. That block
|
|
// is then the implicit successor for the "then" and "else" clauses.
|
|
|
|
// The block we were proccessing is now finished. Make it the
|
|
// successor block.
|
|
if (Block) {
|
|
Succ = Block;
|
|
FinishBlock(Block);
|
|
}
|
|
|
|
// Process the false branch. NULL out Block so that the recursive
|
|
// call to Visit will create a new basic block.
|
|
// Null out Block so that all successor
|
|
CFGBlock* ElseBlock = Succ;
|
|
|
|
if (Stmt* Else = I->getElse()) {
|
|
SaveAndRestore<CFGBlock*> sv(Succ);
|
|
|
|
// NULL out Block so that the recursive call to Visit will
|
|
// create a new basic block.
|
|
Block = NULL;
|
|
ElseBlock = Visit(Else);
|
|
if (!ElseBlock) return NULL;
|
|
FinishBlock(ElseBlock);
|
|
}
|
|
|
|
// Process the true branch. NULL out Block so that the recursive
|
|
// call to Visit will create a new basic block.
|
|
// Null out Block so that all successor
|
|
CFGBlock* ThenBlock;
|
|
{
|
|
Stmt* Then = I->getThen();
|
|
assert (Then);
|
|
SaveAndRestore<CFGBlock*> sv(Succ);
|
|
Block = NULL;
|
|
ThenBlock = Visit(Then);
|
|
if (!ThenBlock) return NULL;
|
|
FinishBlock(ThenBlock);
|
|
}
|
|
|
|
// Now create a new block containing the if statement.
|
|
Block = createBlock(false);
|
|
|
|
// Add the condition as the last statement in the new block.
|
|
Block->appendStmt(I->getCond());
|
|
|
|
// Set the terminator of the new block to the If statement.
|
|
Block->setTerminator(I);
|
|
|
|
// Now add the successors.
|
|
Block->addSuccessor(ThenBlock);
|
|
Block->addSuccessor(ElseBlock);
|
|
|
|
return Block;
|
|
}
|
|
|
|
CFGBlock* VisitReturnStmt(ReturnStmt* R) {
|
|
// If we were in the middle of a block we stop processing that block
|
|
// and reverse its statements.
|
|
//
|
|
// NOTE: If a "return" appears in the middle of a block, this means
|
|
// that the code afterwards is DEAD (unreachable). We still
|
|
// keep a basic block for that code; a simple "mark-and-sweep"
|
|
// from the entry block will be able to report such dead
|
|
// blocks.
|
|
if (Block) FinishBlock(Block);
|
|
|
|
// Create the new block.
|
|
Block = createBlock(false);
|
|
|
|
// The Exit block is the only successor.
|
|
Block->addSuccessor(Exit);
|
|
|
|
// Add the return expression to the block.
|
|
Block->appendStmt(R);
|
|
|
|
// Add the return statement itself to the block.
|
|
if (R->getRetValue()) Block->appendStmt(R->getRetValue());
|
|
|
|
return Block;
|
|
}
|
|
|
|
CFGBlock* VisitLabelStmt(LabelStmt* L) {
|
|
// Get the block of the labeled statement. Add it to our map.
|
|
CFGBlock* LabelBlock = Visit(L->getSubStmt());
|
|
assert (LabelBlock);
|
|
|
|
assert (LabelMap.find(L) == LabelMap.end() && "label already in map");
|
|
LabelMap[ L ] = LabelBlock;
|
|
|
|
// Labels partition blocks, so this is the end of the basic block
|
|
// we were processing (the label is the first statement).
|
|
LabelBlock->appendStmt(L);
|
|
FinishBlock(LabelBlock);
|
|
|
|
// We set Block to NULL to allow lazy creation of a new block
|
|
// (if necessary);
|
|
Block = NULL;
|
|
|
|
// This block is now the implicit successor of other blocks.
|
|
Succ = LabelBlock;
|
|
|
|
return LabelBlock;
|
|
}
|
|
|
|
CFGBlock* VisitGotoStmt(GotoStmt* G) {
|
|
// Goto is a control-flow statement. Thus we stop processing the
|
|
// current block and create a new one.
|
|
if (Block) FinishBlock(Block);
|
|
Block = createBlock(false);
|
|
Block->setTerminator(G);
|
|
|
|
// If we already know the mapping to the label block add the
|
|
// successor now.
|
|
LabelMapTy::iterator I = LabelMap.find(G->getLabel());
|
|
|
|
if (I == LabelMap.end())
|
|
// We will need to backpatch this block later.
|
|
BackpatchBlocks.push_back(Block);
|
|
else
|
|
Block->addSuccessor(I->second);
|
|
|
|
return Block;
|
|
}
|
|
|
|
CFGBlock* VisitForStmt(ForStmt* F) {
|
|
// "for" is a control-flow statement. Thus we stop processing the
|
|
// current block.
|
|
|
|
CFGBlock* LoopSuccessor = NULL;
|
|
|
|
if (Block) {
|
|
FinishBlock(Block);
|
|
LoopSuccessor = Block;
|
|
}
|
|
else LoopSuccessor = Succ;
|
|
|
|
// Create the condition block.
|
|
CFGBlock* ConditionBlock = createBlock(false);
|
|
ConditionBlock->setTerminator(F);
|
|
if (Stmt* C = F->getCond()) ConditionBlock->appendStmt(C);
|
|
|
|
// The condition block is the implicit successor for the loop body as
|
|
// well as any code above the loop.
|
|
Succ = ConditionBlock;
|
|
|
|
// Now create the loop body.
|
|
{
|
|
assert (F->getBody());
|
|
|
|
// Save the current values for Block, Succ, and continue and break targets
|
|
SaveAndRestore<CFGBlock*> save_Block(Block), save_Succ(Succ),
|
|
save_continue(ContinueTargetBlock),
|
|
save_break(BreakTargetBlock);
|
|
|
|
// All continues within this loop should go to the condition block
|
|
ContinueTargetBlock = ConditionBlock;
|
|
|
|
// All breaks should go to the code following the loop.
|
|
BreakTargetBlock = LoopSuccessor;
|
|
|
|
// Create a new block to contain the (bottom) of the loop body.
|
|
Block = createBlock();
|
|
|
|
// If we have increment code, insert it at the end of the body block.
|
|
if (Stmt* I = F->getInc()) Block->appendStmt(I);
|
|
|
|
// Now populate the body block, and in the process create new blocks
|
|
// as we walk the body of the loop.
|
|
CFGBlock* BodyBlock = Visit(F->getBody());
|
|
assert (BodyBlock);
|
|
FinishBlock(BodyBlock);
|
|
|
|
// This new body block is a successor to our condition block.
|
|
ConditionBlock->addSuccessor(BodyBlock);
|
|
}
|
|
|
|
// Link up the condition block with the code that follows the loop.
|
|
// (the false branch).
|
|
ConditionBlock->addSuccessor(LoopSuccessor);
|
|
|
|
// If the loop contains initialization, create a new block for those
|
|
// statements. This block can also contain statements that precede
|
|
// the loop.
|
|
if (Stmt* I = F->getInit()) {
|
|
Block = createBlock();
|
|
Block->appendStmt(I);
|
|
return Block;
|
|
}
|
|
else {
|
|
// There is no loop initialization. We are thus basically a while
|
|
// loop. NULL out Block to force lazy block construction.
|
|
Block = NULL;
|
|
return ConditionBlock;
|
|
}
|
|
}
|
|
|
|
CFGBlock* VisitWhileStmt(WhileStmt* W) {
|
|
// "while" is a control-flow statement. Thus we stop processing the
|
|
// current block.
|
|
|
|
CFGBlock* LoopSuccessor = NULL;
|
|
|
|
if (Block) {
|
|
FinishBlock(Block);
|
|
LoopSuccessor = Block;
|
|
}
|
|
else LoopSuccessor = Succ;
|
|
|
|
// Create the condition block.
|
|
CFGBlock* ConditionBlock = createBlock(false);
|
|
ConditionBlock->setTerminator(W);
|
|
if (Stmt* C = W->getCond()) ConditionBlock->appendStmt(C);
|
|
|
|
// The condition block is the implicit successor for the loop body as
|
|
// well as any code above the loop.
|
|
Succ = ConditionBlock;
|
|
|
|
// Process the loop body.
|
|
{
|
|
assert (W->getBody());
|
|
|
|
// Save the current values for Block, Succ, and continue and break targets
|
|
SaveAndRestore<CFGBlock*> save_Block(Block), save_Succ(Succ),
|
|
save_continue(ContinueTargetBlock),
|
|
save_break(BreakTargetBlock);
|
|
|
|
// All continues within this loop should go to the condition block
|
|
ContinueTargetBlock = ConditionBlock;
|
|
|
|
// All breaks should go to the code following the loop.
|
|
BreakTargetBlock = LoopSuccessor;
|
|
|
|
// NULL out Block to force lazy instantiation of blocks for the body.
|
|
Block = NULL;
|
|
|
|
// Create the body. The returned block is the entry to the loop body.
|
|
CFGBlock* BodyBlock = Visit(W->getBody());
|
|
assert (BodyBlock);
|
|
FinishBlock(BodyBlock);
|
|
|
|
// Add the loop body entry as a successor to the condition.
|
|
ConditionBlock->addSuccessor(BodyBlock);
|
|
}
|
|
|
|
// Link up the condition block with the code that follows the loop.
|
|
// (the false branch).
|
|
ConditionBlock->addSuccessor(LoopSuccessor);
|
|
|
|
// There can be no more statements in the condition block
|
|
// since we loop back to this block. NULL out Block to force
|
|
// lazy creation of another block.
|
|
Block = NULL;
|
|
|
|
// Return the condition block, which is the dominating block for the loop.
|
|
return ConditionBlock;
|
|
}
|
|
|
|
CFGBlock* VisitContinueStmt(ContinueStmt* C) {
|
|
// "continue" is a control-flow statement. Thus we stop processing the
|
|
// current block.
|
|
if (Block) FinishBlock(Block);
|
|
|
|
// Now create a new block that ends with the continue statement.
|
|
Block = createBlock(false);
|
|
Block->setTerminator(C);
|
|
|
|
// FIXME: We should gracefully handle continues without resolved targets.
|
|
assert (ContinueTargetBlock);
|
|
|
|
Block->addSuccessor(ContinueTargetBlock);
|
|
return Block;
|
|
}
|
|
|
|
CFGBlock* VisitBreakStmt(BreakStmt* B) {
|
|
// "break" is a control-flow statement. Thus we stop processing the
|
|
// current block.
|
|
if (Block) FinishBlock(Block);
|
|
|
|
// Now create a new block that ends with the continue statement.
|
|
Block = createBlock(false);
|
|
Block->setTerminator(B);
|
|
|
|
// FIXME: We should gracefully handle breaks without resolved targets.
|
|
assert (BreakTargetBlock);
|
|
|
|
Block->addSuccessor(BreakTargetBlock);
|
|
return Block;
|
|
}
|
|
|
|
};
|
|
|
|
// BuildCFG - A helper function that builds CFGs from ASTS.
|
|
CFG* CFG::BuildCFG(Stmt* Statement) {
|
|
CFGBuilder Builder;
|
|
return Builder.BuildCFG(Statement);
|
|
}
|
|
|
|
// reverseStmts - A method that reverses the order of the statements within
|
|
// a CFGBlock.
|
|
void CFGBlock::reverseStmts() { std::reverse(Stmts.begin(),Stmts.end()); }
|
|
|
|
// dump - A simple pretty printer of a CFG that outputs to stderr.
|
|
void CFG::dump() { print(std::cerr); }
|
|
|
|
// print - A simple pretty printer of a CFG that outputs to an ostream.
|
|
void CFG::print(std::ostream& OS) {
|
|
// First print out the Entry block, which may not be the first block
|
|
// in our list of blocks
|
|
if (begin() != end()) {
|
|
CFGBlock& Entry = getEntry();
|
|
OS << "\n [ B" << Entry.getBlockID() << " (ENTRY) ]\n";
|
|
Entry.print(OS);
|
|
}
|
|
|
|
// Iterate through the CFGBlocks and print them one by one. Specially
|
|
// designate the Entry and Exit blocks.
|
|
for (iterator I = Blocks.begin(), E = Blocks.end() ; I != E ; ++I) {
|
|
// Skip the entry block, because we already printed it.
|
|
if (&(*I) == &getEntry())
|
|
continue;
|
|
|
|
OS << "\n [ B" << I->getBlockID();
|
|
|
|
if (&(*I) == &getExit()) OS << " (EXIT) ]\n";
|
|
else OS << " ]\n";
|
|
|
|
I->print(OS);
|
|
}
|
|
OS << "\n";
|
|
}
|
|
|
|
|
|
namespace {
|
|
|
|
class CFGBlockTerminatorPrint : public StmtVisitor<CFGBlockTerminatorPrint,
|
|
void > {
|
|
std::ostream& OS;
|
|
public:
|
|
CFGBlockTerminatorPrint(std::ostream& os) : OS(os) {}
|
|
|
|
void VisitIfStmt(IfStmt* I) {
|
|
OS << "if ";
|
|
I->getCond()->printPretty(std::cerr);
|
|
OS << "\n";
|
|
}
|
|
|
|
// Default case.
|
|
void VisitStmt(Stmt* S) { S->printPretty(OS); }
|
|
|
|
void VisitForStmt(ForStmt* F) {
|
|
OS << "for (" ;
|
|
if (Stmt* I = F->getInit()) I->printPretty(OS);
|
|
OS << " ; ";
|
|
if (Stmt* C = F->getCond()) C->printPretty(OS);
|
|
OS << " ; ";
|
|
if (Stmt* I = F->getInc()) I->printPretty(OS);
|
|
OS << ")\n";
|
|
}
|
|
|
|
void VisitWhileStmt(WhileStmt* W) {
|
|
OS << "while " ;
|
|
if (Stmt* C = W->getCond()) C->printPretty(OS);
|
|
OS << "\n";
|
|
}
|
|
};
|
|
}
|
|
|
|
// dump - A simply pretty printer of a CFGBlock that outputs to stderr.
|
|
void CFGBlock::dump() { print(std::cerr); }
|
|
|
|
// print - A simple pretty printer of a CFGBlock that outputs to an ostream.
|
|
// Generally this will only be called from CFG::print.
|
|
void CFGBlock::print(std::ostream& OS) {
|
|
|
|
// Iterate through the statements in the block and print them.
|
|
OS << " ------------------------\n";
|
|
unsigned j = 1;
|
|
for (iterator I = Stmts.begin(), E = Stmts.end() ; I != E ; ++I, ++j ) {
|
|
// Print the statement # in the basic block.
|
|
OS << " " << std::setw(3) << j << ": ";
|
|
|
|
// Print the statement/expression.
|
|
Stmt* S = *I;
|
|
|
|
if (LabelStmt* L = dyn_cast<LabelStmt>(S))
|
|
OS << L->getName() << ": (LABEL)\n";
|
|
else
|
|
(*I)->printPretty(OS);
|
|
|
|
// Expressions need a newline.
|
|
if (isa<Expr>(*I)) OS << '\n';
|
|
}
|
|
OS << " ------------------------\n";
|
|
|
|
// Print the predecessors of this block.
|
|
OS << " Predecessors (" << pred_size() << "):";
|
|
unsigned i = 0;
|
|
for (pred_iterator I = pred_begin(), E = pred_end(); I != E; ++I, ++i ) {
|
|
if (i == 8 || (i-8) == 0) {
|
|
OS << "\n ";
|
|
}
|
|
OS << " B" << (*I)->getBlockID();
|
|
}
|
|
|
|
// Print the terminator of this block.
|
|
OS << "\n Terminator: ";
|
|
if (ControlFlowStmt)
|
|
CFGBlockTerminatorPrint(OS).Visit(ControlFlowStmt);
|
|
else
|
|
OS << "<NULL>\n";
|
|
|
|
// Print the successors of this block.
|
|
OS << " Successors (" << succ_size() << "):";
|
|
i = 0;
|
|
for (succ_iterator I = succ_begin(), E = succ_end(); I != E; ++I, ++i ) {
|
|
if (i == 8 || (i-8) % 10 == 0) {
|
|
OS << "\n ";
|
|
}
|
|
OS << " B" << (*I)->getBlockID();
|
|
}
|
|
OS << '\n';
|
|
} |