//===- CallGraph.cpp - Build a Module's call graph ------------------------===//
//
-// This interface is used to build and manipulate a call graph, which is a very
-// useful tool for interprocedural optimization.
+// The LLVM Compiler Infrastructure
//
-// Every method in a module is represented as a node in the call graph. The
-// callgraph node keeps track of which methods the are called by the method
-// corresponding to the node.
-//
-// A call graph will contain nodes where the method that they correspond to is
-// null. This 'external' node is used to represent control flow that is not
-// represented (or analyzable) in the module. As such, the external node will
-// have edges to methods with the following properties:
-// 1. All methods in the module without internal linkage, since they could
-// be called by methods outside of the our analysis capability.
-// 2. All methods whose address is used for something more than a direct call,
-// for example being stored into a memory location. Since they may be
-// called by an unknown caller later, they must be tracked as such.
-//
-// Similarly, methods have a call edge to the external node iff:
-// 1. The method is external, reflecting the fact that they could call
-// anything without internal linkage or that has its address taken.
-// 2. The method contains an indirect method call.
-//
-// As an extension in the future, there may be multiple nodes with a null
-// method. These will be used when we can prove (through pointer analysis) that
-// an indirect call site can call only a specific set of methods.
-//
-// Because of these properties, the CallGraph captures a conservative superset
-// of all of the caller-callee relationships, which is useful for
-// transformations.
-//
-// The CallGraph class also attempts to figure out what the root of the
-// CallGraph is, which is currently does by looking for a method named 'main'.
-// If no method named 'main' is found, the external node is used as the entry
-// node, reflecting the fact that any method without internal linkage could
-// be called into (which is common for libraries).
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
#include "llvm/Analysis/CallGraph.h"
-#include "llvm/Module.h"
-#include "llvm/Function.h"
-#include "llvm/iOther.h"
-#include "llvm/iTerminators.h"
-#include "Support/STLExtras.h"
-#include <algorithm>
-#include <iostream>
-
-AnalysisID CallGraph::ID(AnalysisID::create<CallGraph>());
-
-// getNodeFor - Return the node for the specified method or create one if it
-// does not already exist.
+#include "llvm/IR/CallSite.h"
+#include "llvm/IR/Instructions.h"
+#include "llvm/IR/IntrinsicInst.h"
+#include "llvm/IR/Module.h"
+#include "llvm/Support/Debug.h"
+#include "llvm/Support/raw_ostream.h"
+using namespace llvm;
+
+//===----------------------------------------------------------------------===//
+// Implementations of the CallGraph class methods.
//
-CallGraphNode *CallGraph::getNodeFor(Function *F) {
- CallGraphNode *&CGN = MethodMap[F];
- if (CGN) return CGN;
- assert((!F || F->getParent() == Mod) && "Function not in current module!");
- return CGN = new CallGraphNode(F);
+CallGraph::CallGraph(Module &M)
+ : M(M), Root(nullptr), ExternalCallingNode(getOrInsertFunction(nullptr)),
+ CallsExternalNode(llvm::make_unique<CallGraphNode>(nullptr)) {
+ // Add every function to the call graph.
+ for (Function &F : M)
+ addToCallGraph(&F);
+
+ // If we didn't find a main function, use the external call graph node
+ if (!Root)
+ Root = ExternalCallingNode;
}
-// addToCallGraph - Add a method to the call graph, and link the node to all of
-// the methods that it calls.
-//
-void CallGraph::addToCallGraph(Function *M) {
- CallGraphNode *Node = getNodeFor(M);
+CallGraph::~CallGraph() {
+ // CallsExternalNode is not in the function map; drop its references here.
+ if (CallsExternalNode)
+ CallsExternalNode->allReferencesDropped();
+
+// Reset every node's use count to zero before the nodes are deleted, to
+// prevent an assertion from firing.
+#ifndef NDEBUG
+ for (auto &I : FunctionMap)
+ I.second->allReferencesDropped();
+#endif
+}
+
+void CallGraph::addToCallGraph(Function *F) {
+ CallGraphNode *Node = getOrInsertFunction(F);
- // If this method has external linkage,
- if (!M->hasInternalLinkage()) {
- ExternalNode->addCalledMethod(Node);
+ // If this function has external linkage, anything could call it.
+ if (!F->hasLocalLinkage()) {
+ ExternalCallingNode->addCalledFunction(CallSite(), Node);
// Found the entry point?
- if (M->getName() == "main") {
- if (Root)
- Root = ExternalNode; // Found multiple external mains? Don't pick one.
+ if (F->getName() == "main") {
+ if (Root) // Found multiple external mains? Don't pick one.
+ Root = ExternalCallingNode;
else
- Root = Node; // Found a main, keep track of it!
+ Root = Node; // Found a main, keep track of it!
}
- } else if (M->isExternal()) { // Not defined in this xlation unit?
- Node->addCalledMethod(ExternalNode); // It could call anything...
}
- // Loop over all of the users of the method... looking for callers...
- //
- for (Value::use_iterator I = M->use_begin(), E = M->use_end(); I != E; ++I) {
- User *U = *I;
- if (CallInst *CI = dyn_cast<CallInst>(U))
- getNodeFor(CI->getParent()->getParent())->addCalledMethod(Node);
- else if (InvokeInst *II = dyn_cast<InvokeInst>(U))
- getNodeFor(II->getParent()->getParent())->addCalledMethod(Node);
- else // Can't classify the user!
- ExternalNode->addCalledMethod(Node);
- }
+ // If this function has its address taken, anything could call it.
+ if (F->hasAddressTaken())
+ ExternalCallingNode->addCalledFunction(CallSite(), Node);
+
+ // If this function is not defined in this translation unit, it could call
+ // anything.
+ if (F->isDeclaration() && !F->isIntrinsic())
+ Node->addCalledFunction(CallSite(), CallsExternalNode.get());
- // Look for an indirect method call...
- for (Function::iterator BBI = M->begin(), BBE = M->end(); BBI != BBE; ++BBI) {
- BasicBlock *BB = *BBI;
- for (BasicBlock::iterator II = BB->begin(), IE = BB->end(); II != IE; ++II){
- Instruction *I = *II;
-
- if (CallInst *CI = dyn_cast<CallInst>(I)) {
- if (CI->getCalledFunction() == 0)
- Node->addCalledMethod(ExternalNode);
- } else if (InvokeInst *II = dyn_cast<InvokeInst>(I)) {
- if (II->getCalledFunction() == 0)
- Node->addCalledMethod(ExternalNode);
+ // Look for calls by this function.
+ for (Function::iterator BB = F->begin(), BBE = F->end(); BB != BBE; ++BB)
+ for (BasicBlock::iterator II = BB->begin(), IE = BB->end(); II != IE;
+ ++II) {
+ CallSite CS(cast<Value>(II));
+ if (CS) {
+ const Function *Callee = CS.getCalledFunction();
+ if (!Callee || !Intrinsic::isLeaf(Callee->getIntrinsicID()))
+ // Indirect calls of intrinsics are not allowed so no need to check.
+ // We can be more precise here by using TargetArg returned by
+ // Intrinsic::isLeaf.
+ Node->addCalledFunction(CS, CallsExternalNode.get());
+ else if (!Callee->isIntrinsic())
+ Node->addCalledFunction(CS, getOrInsertFunction(Callee));
}
}
+}
+
+void CallGraph::print(raw_ostream &OS) const {
+ OS << "CallGraph Root is: ";
+ if (Function *F = Root->getFunction())
+ OS << F->getName() << "\n";
+ else {
+ OS << "<<null function: 0x" << Root << ">>\n";
}
+
+ // Print in a deterministic order by sorting CallGraphNodes by name. We do
+ // this here to avoid slowing down the non-printing fast path.
+
+ SmallVector<CallGraphNode *, 16> Nodes;
+ Nodes.reserve(FunctionMap.size());
+
+ for (auto I = begin(), E = end(); I != E; ++I)
+ Nodes.push_back(I->second.get());
+
+ std::sort(Nodes.begin(), Nodes.end(),
+ [](CallGraphNode *LHS, CallGraphNode *RHS) {
+ if (Function *LF = LHS->getFunction())
+ if (Function *RF = RHS->getFunction())
+ return LF->getName() < RF->getName();
+
+ return RHS->getFunction() != nullptr;
+ });
+
+ for (CallGraphNode *CN : Nodes)
+ CN->print(OS);
}
-bool CallGraph::run(Module *TheModule) {
- destroy();
+#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
+void CallGraph::dump() const { print(dbgs()); }
+#endif
- Mod = TheModule;
- ExternalNode = getNodeFor(0);
- Root = 0;
+// removeFunctionFromModule - Unlink the function from this module, returning
+// it. Because this removes the function from the module, the call graph node
+// is destroyed. This is only valid if the function does not call any other
+// functions (i.e., there are no edges in its CGN). The easiest way to do this
+// is to dropAllReferences before calling this.
+//
+Function *CallGraph::removeFunctionFromModule(CallGraphNode *CGN) {
+ assert(CGN->empty() && "Cannot remove function from call "
+ "graph if it references other functions!");
+ Function *F = CGN->getFunction(); // Get the function for the call graph node
+ FunctionMap.erase(F); // Remove the call graph node from the map
- // Add every method to the call graph...
- for_each(Mod->begin(), Mod->end(), bind_obj(this,&CallGraph::addToCallGraph));
+ M.getFunctionList().remove(F);
+ return F;
+}
- // If we didn't find a main method, use the external call graph node
- if (Root == 0) Root = ExternalNode;
-
- return false;
+/// spliceFunction - Replace the function represented by this node by another.
+/// This does not rescan the body of the function, so it is suitable when
+/// splicing the body of the old function to the new while also updating all
+/// callers from old to new.
+///
+void CallGraph::spliceFunction(const Function *From, const Function *To) {
+ assert(FunctionMap.count(From) && "No CallGraphNode for function!");
+ assert(!FunctionMap.count(To) &&
+ "Pointing CallGraphNode at a function that already exists");
+ FunctionMapTy::iterator I = FunctionMap.find(From);
+ I->second->F = const_cast<Function*>(To);
+ FunctionMap[To] = std::move(I->second);
+ FunctionMap.erase(I);
}
-void CallGraph::destroy() {
- for (MethodMapTy::iterator I = MethodMap.begin(), E = MethodMap.end();
- I != E; ++I)
- delete I->second;
- MethodMap.clear();
+// getOrInsertFunction - This method is identical to calling operator[], but
+// it will insert a new CallGraphNode for the specified function if one does
+// not already exist.
+CallGraphNode *CallGraph::getOrInsertFunction(const Function *F) {
+ auto &CGN = FunctionMap[F];
+ if (CGN)
+ return CGN.get();
+
+ assert((!F || F->getParent() == &M) && "Function not in current module!");
+ CGN = llvm::make_unique<CallGraphNode>(const_cast<Function *>(F));
+ return CGN.get();
}
+//===----------------------------------------------------------------------===//
+// Implementations of the CallGraphNode class methods.
+//
-void WriteToOutput(const CallGraphNode *CGN, std::ostream &o) {
- if (CGN->getMethod())
- o << "Call graph node for method: '" << CGN->getMethod()->getName() <<"'\n";
+void CallGraphNode::print(raw_ostream &OS) const {
+ if (Function *F = getFunction())
+ OS << "Call graph node for function: '" << F->getName() << "'";
else
- o << "Call graph node null method:\n";
+ OS << "Call graph node <<null function>>";
+
+ OS << "<<" << this << ">> #uses=" << getNumReferences() << '\n';
- for (unsigned i = 0; i < CGN->size(); ++i)
- if ((*CGN)[i]->getMethod())
- o << " Calls method '" << (*CGN)[i]->getMethod()->getName() << "'\n";
+ for (const_iterator I = begin(), E = end(); I != E; ++I) {
+ OS << " CS<" << I->first << "> calls ";
+ if (Function *FI = I->second->getFunction())
+ OS << "function '" << FI->getName() <<"'\n";
else
- o << " Calls external node\n";
- o << "\n";
+ OS << "external node\n";
+ }
+ OS << '\n';
}
-void WriteToOutput(const CallGraph &CG, std::ostream &o) {
- for (CallGraph::const_iterator I = CG.begin(), E = CG.end(); I != E; ++I)
- o << I->second;
+#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
+void CallGraphNode::dump() const { print(dbgs()); }
+#endif
+
+/// removeCallEdgeFor - This method removes the edge in the node for the
+/// specified call site. Note that this method takes linear time, so it
+/// should be used sparingly.
+void CallGraphNode::removeCallEdgeFor(CallSite CS) {
+ for (CalledFunctionsVector::iterator I = CalledFunctions.begin(); ; ++I) {
+ assert(I != CalledFunctions.end() && "Cannot find callsite to remove!");
+ if (I->first == CS.getInstruction()) {
+ I->second->DropRef();
+ *I = CalledFunctions.back();
+ CalledFunctions.pop_back();
+ return;
+ }
+ }
}
+// removeAnyCallEdgeTo - This method removes any call edges from this node to
+// the specified callee function. This takes more time to execute than
+// removeCallEdgeTo, so it should not be used unless necessary.
+void CallGraphNode::removeAnyCallEdgeTo(CallGraphNode *Callee) {
+ for (unsigned i = 0, e = CalledFunctions.size(); i != e; ++i)
+ if (CalledFunctions[i].second == Callee) {
+ Callee->DropRef();
+ CalledFunctions[i] = CalledFunctions.back();
+ CalledFunctions.pop_back();
+ --i; --e;
+ }
+}
+
+/// removeOneAbstractEdgeTo - Remove one edge associated with a null callsite
+/// from this node to the specified callee function.
+void CallGraphNode::removeOneAbstractEdgeTo(CallGraphNode *Callee) {
+ for (CalledFunctionsVector::iterator I = CalledFunctions.begin(); ; ++I) {
+ assert(I != CalledFunctions.end() && "Cannot find callee to remove!");
+ CallRecord &CR = *I;
+ if (CR.second == Callee && CR.first == nullptr) {
+ Callee->DropRef();
+ *I = CalledFunctions.back();
+ CalledFunctions.pop_back();
+ return;
+ }
+ }
+}
+
+/// replaceCallEdge - This method replaces the edge in the node for the
+/// specified call site with a new one. Note that this method takes linear
+/// time, so it should be used sparingly.
+void CallGraphNode::replaceCallEdge(CallSite CS,
+ CallSite NewCS, CallGraphNode *NewNode){
+ for (CalledFunctionsVector::iterator I = CalledFunctions.begin(); ; ++I) {
+ assert(I != CalledFunctions.end() && "Cannot find callsite to remove!");
+ if (I->first == CS.getInstruction()) {
+ I->second->DropRef();
+ I->first = NewCS.getInstruction();
+ I->second = NewNode;
+ NewNode->AddRef();
+ return;
+ }
+ }
+}
//===----------------------------------------------------------------------===//
-// Implementations of public modification methods
+// Implementations of the CallGraphWrapperPass class methods.
//
-// Methods to keep a call graph up to date with a method that has been
-// modified
-//
-void CallGraph::addMethodToModule(Function *Meth) {
- assert(0 && "not implemented");
- abort();
+CallGraphWrapperPass::CallGraphWrapperPass() : ModulePass(ID) {
+ initializeCallGraphWrapperPassPass(*PassRegistry::getPassRegistry());
}
-// removeMethodFromModule - Unlink the method from this module, returning it.
-// Because this removes the method from the module, the call graph node is
-// destroyed. This is only valid if the method does not call any other
-// methods (ie, there are no edges in it's CGN). The easiest way to do this
-// is to dropAllReferences before calling this.
-//
-Function *CallGraph::removeMethodFromModule(CallGraphNode *CGN) {
- assert(CGN->CalledMethods.empty() && "Cannot remove method from call graph"
- " if it references other methods!");
- Function *M = CGN->getMethod(); // Get the function for the call graph node
- delete CGN; // Delete the call graph node for this func
- MethodMap.erase(M); // Remove the call graph node from the map
+CallGraphWrapperPass::~CallGraphWrapperPass() {}
+
+void CallGraphWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {
+ AU.setPreservesAll();
+}
+
+bool CallGraphWrapperPass::runOnModule(Module &M) {
+ // All the real work is done in the constructor for the CallGraph.
+ G.reset(new CallGraph(M));
+ return false;
+}
+
+INITIALIZE_PASS(CallGraphWrapperPass, "basiccg", "CallGraph Construction",
+ false, true)
+
+char CallGraphWrapperPass::ID = 0;
+
+void CallGraphWrapperPass::releaseMemory() { G.reset(); }
+
+void CallGraphWrapperPass::print(raw_ostream &OS, const Module *) const {
+ if (!G) {
+ OS << "No call graph has been built!\n";
+ return;
+ }
- Mod->getFunctionList().remove(M);
- return M;
+ // Just delegate.
+ G->print(OS);
}
+#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
+void CallGraphWrapperPass::dump() const { print(dbgs(), nullptr); }
+#endif