-//===- DataStructure.h - Build a Module's call graph -------------*- C++ -*--=//
+//===- DataStructure.h - Build data structure graphs ------------*- C++ -*-===//
//
// Implement the LLVM data structure analysis library.
//
#ifndef LLVM_ANALYSIS_DATA_STRUCTURE_H
#define LLVM_ANALYSIS_DATA_STRUCTURE_H
+#include "llvm/Analysis/DSSupport.h"
#include "llvm/Pass.h"
-#include <string>
+#include <set>
class Type;
-class CallInst;
-class AllocationInst;
-class FunctionArgument;
+class DSGraph;
class DSNode;
-class FunctionRepBuilder;
-class GlobalValue;
-class FunctionDSGraph;
-class DataStructure;
-
-// FIXME: move this somewhere private
-unsigned countPointerFields(const Type *Ty);
-
-// PointerVal - Represent a pointer to a datastructure. The pointer points to
-// a node, and can index into it. This is used for getelementptr instructions,
-// which do not affect which node a pointer points to, but does change the field
-// index
-//
-struct PointerVal {
- DSNode *Node;
- unsigned Index; // Index into Node->FieldLinks[]
-public:
- PointerVal(DSNode *N, unsigned Idx = 0) : Node(N), Index(Idx) {}
-
- DSNode *getNode() const { return Node; }
- unsigned getIndex() const { return Index; }
-
- inline bool operator==(DSNode *N) const { return Node == N; }
- inline bool operator!=(DSNode *N) const { return Node != N; }
-
- // operator< - Allow insertion into a map...
- bool operator<(const PointerVal &PV) const {
- return Node < PV.Node || (Node == PV.Node && Index < PV.Index);
- }
-
- inline bool operator==(const PointerVal &PV) const {
- return Node == PV.Node && Index == PV.Index;
- }
- inline bool operator!=(const PointerVal &PV) const { return !operator==(PV); }
-
- void print(std::ostream &O) const;
-};
-
-
-// PointerValSet - This class represents a list of pointer values. The add
-// method is used to add values to the set, and ensures that duplicates cannot
-// happen.
-//
-class PointerValSet {
- std::vector<PointerVal> Vals;
- void dropRefs();
- void addRefs();
-public:
- PointerValSet() {}
- PointerValSet(const PointerValSet &PVS) : Vals(PVS.Vals) { addRefs(); }
- ~PointerValSet() { dropRefs(); }
- const PointerValSet &operator=(const PointerValSet &PVS);
-
- // operator< - Allow insertion into a map...
- bool operator<(const PointerValSet &PVS) const;
- bool operator==(const PointerValSet &PVS) const;
-
- const PointerVal &operator[](unsigned i) const { return Vals[i]; }
-
- unsigned size() const { return Vals.size(); }
- bool empty() const { return Vals.empty(); }
- void clear() { dropRefs(); Vals.clear(); }
-
- // add - Add the specified pointer, or contents of the specified PVS to this
- // pointer set. If a 'Pointer' value is provided, notify the underlying data
- // structure node that the pointer is pointing to it, so that it can be
- // invalidated if neccesary later. True is returned if the value is new to
- // this pointer.
+class LocalDataStructures; // A collection of local graphs for a program
+class BUDataStructures; // A collection of bu graphs for a program
+class TDDataStructures; // A collection of td graphs for a program
+
+// FIXME: move this stuff to a private header
+namespace DataStructureAnalysis {
+ // isPointerType - Return true if this first class type is big enough to hold
+ // a pointer.
//
- bool add(const PointerVal &PV, Value *Pointer = 0);
- bool add(const PointerValSet &PVS, Value *Pointer = 0) {
- bool Changed = false;
- for (unsigned i = 0, e = PVS.size(); i != e; ++i)
- Changed |= add(PVS[i], Pointer);
- return Changed;
- }
-
- // removePointerTo - Remove a single pointer val that points to the specified
- // node...
- void removePointerTo(DSNode *Node);
-
- void print(std::ostream &O) const;
-};
+ bool isPointerType(const Type *Ty);
+}
-//===----------------------------------------------------------------------===//
-// DSNode - Base class for all data structure nodes...
+// LocalDataStructures - The analysis that computes the local data structure
+// graphs for all of the functions in the program.
//
-// This class keeps track of its type, the pointer fields in the data structure,
-// and a list of LLVM values that are pointing to this node.
+// FIXME: This should be a Function pass that can be USED by a Pass, and would
+// be automatically preserved. Until we can do that, this is a Pass.
//
-class DSNode {
- friend class FunctionDSGraph;
- const Type *Ty;
- std::vector<PointerValSet> FieldLinks;
- std::vector<Value*> Pointers; // Values pointing to me...
- std::vector<PointerValSet*> Referrers;
-
- DSNode(const DSNode &); // DO NOT IMPLEMENT
- void operator=(const DSNode &); // DO NOT IMPLEMENT
+class LocalDataStructures : public Pass {
+ // DSInfo, one graph for each function
+ std::map<const Function*, DSGraph*> DSInfo;
public:
- enum NodeTy {
- NewNode, CallNode, ShadowNode, ArgNode, GlobalNode
- } NodeType;
+ ~LocalDataStructures() { releaseMemory(); }
- DSNode(enum NodeTy NT, const Type *T);
- virtual ~DSNode() {
- dropAllReferences();
- assert(Referrers.empty() && "Referrers to dead node exist!");
- }
+ virtual bool run(Module &M);
- unsigned getNumLinks() const { return FieldLinks.size(); }
- PointerValSet &getLink(unsigned i) {
- assert(i < getNumLinks() && "Field links access out of range...");
- return FieldLinks[i];
+ // getDSGraph - Return the data structure graph for the specified function.
+ DSGraph &getDSGraph(const Function &F) const {
+ std::map<const Function*, DSGraph*>::const_iterator I = DSInfo.find(&F);
+ assert(I != DSInfo.end() && "Function not in module!");
+ return *I->second;
}
- // addReferrer - Keep the referrer set up to date...
- void addReferrer(PointerValSet *PVS) { Referrers.push_back(PVS); }
- void removeReferrer(PointerValSet *PVS);
- const std::vector<PointerValSet*> &getReferrers() const { return Referrers; }
-
- // removeAllIncomingEdges - Erase all edges in the graph that point to
- // this node
- void removeAllIncomingEdges();
-
- void addPointer(Value *V) { Pointers.push_back(V); }
- const std::vector<Value*> &getPointers() const { return Pointers; }
-
- const Type *getType() const { return Ty; }
-
- void print(std::ostream &O) const;
-
- virtual std::string getCaption() const = 0;
- virtual const std::vector<PointerValSet> *getAuxLinks() const {
- return 0; // Default to nothing...
- }
-
- // isEquivalentTo - Return true if the nodes should be merged...
- virtual bool isEquivalentTo(DSNode *Node) const = 0;
-
- DSNode *clone() const {
- DSNode *New = cloneImpl();
- // Add all of the pointers to the new node...
- for (unsigned pn = 0, pe = Pointers.size(); pn != pe; ++pn)
- New->addPointer(Pointers[pn]);
- return New;
- }
+ // print - Print out the analysis results...
+ void print(std::ostream &O, const Module *M) const;
+ // If the pass pipeline is done with this pass, we can release our memory...
+ virtual void releaseMemory();
- virtual void dropAllReferences() {
- FieldLinks.clear();
+ // getAnalysisUsage - This obviously provides a data structure graph.
+ virtual void getAnalysisUsage(AnalysisUsage &AU) const {
+ AU.setPreservesAll();
}
-
- static bool classof(const DSNode *N) { return true; }
-protected:
- virtual DSNode *cloneImpl() const = 0;
- virtual void mapNode(std::map<const DSNode*, DSNode*> &NodeMap,
- const DSNode *Old);
-};
-
-
-// AllocDSNode - Represent all allocation (malloc or alloca) in the program.
-//
-class AllocDSNode : public DSNode {
- AllocationInst *Allocation;
-public:
- AllocDSNode(AllocationInst *V);
-
- virtual std::string getCaption() const;
-
- bool isAllocaNode() const;
- bool isMallocNode() const { return !isAllocaNode(); }
-
- AllocationInst *getAllocation() const { return Allocation; }
-
- // isEquivalentTo - Return true if the nodes should be merged...
- virtual bool isEquivalentTo(DSNode *Node) const;
-
- // Support type inquiry through isa, cast, and dyn_cast...
- static bool classof(const AllocDSNode *) { return true; }
- static bool classof(const DSNode *N) { return N->NodeType == NewNode; }
-protected:
- virtual AllocDSNode *cloneImpl() const { return new AllocDSNode(Allocation); }
};
-
-// GlobalDSNode - Represent the memory location that a global variable occupies
-//
-class GlobalDSNode : public DSNode {
- GlobalValue *Val;
-public:
- GlobalDSNode(GlobalValue *V);
-
- GlobalValue *getGlobal() const { return Val; }
-
- virtual std::string getCaption() const;
-
- // isEquivalentTo - Return true if the nodes should be merged...
- virtual bool isEquivalentTo(DSNode *Node) const;
-
- // Support type inquiry through isa, cast, and dyn_cast...
- static bool classof(const GlobalDSNode *) { return true; }
- static bool classof(const DSNode *N) { return N->NodeType == GlobalNode; }
-private:
- virtual GlobalDSNode *cloneImpl() const { return new GlobalDSNode(Val); }
-};
-
-
-// CallDSNode - Represent a call instruction in the program...
+// BUDataStructures - The analysis that computes the interprocedurally closed
+// data structure graphs for all of the functions in the program. This pass
+// only performs a "Bottom Up" propagation (hence the name).
//
-class CallDSNode : public DSNode {
- friend class FunctionDSGraph;
- CallInst *CI;
- std::vector<PointerValSet> ArgLinks;
+class BUDataStructures : public Pass {
+ // DSInfo, one graph for each function
+ std::map<const Function*, DSGraph*> DSInfo;
public:
- CallDSNode(CallInst *CI);
+ ~BUDataStructures() { releaseMemory(); }
- CallInst *getCall() const { return CI; }
+ virtual bool run(Module &M);
- const std::vector<PointerValSet> *getAuxLinks() const { return &ArgLinks; }
- virtual std::string getCaption() const;
-
- bool addArgValue(unsigned ArgNo, const PointerValSet &PVS) {
- return ArgLinks[ArgNo].add(PVS);
- }
-
- unsigned getNumArgs() const { return ArgLinks.size(); }
- const PointerValSet &getArgValues(unsigned ArgNo) const {
- assert(ArgNo < ArgLinks.size() && "Arg # out of range!");
- return ArgLinks[ArgNo];
- }
- const std::vector<PointerValSet> &getArgs() const { return ArgLinks; }
-
- virtual void dropAllReferences() {
- DSNode::dropAllReferences();
- ArgLinks.clear();
+ // getDSGraph - Return the data structure graph for the specified function.
+ DSGraph &getDSGraph(const Function &F) const {
+ std::map<const Function*, DSGraph*>::const_iterator I = DSInfo.find(&F);
+ assert(I != DSInfo.end() && "Function not in module!");
+ return *I->second;
}
- // isEquivalentTo - Return true if the nodes should be merged...
- virtual bool isEquivalentTo(DSNode *Node) const;
-
- // Support type inquiry through isa, cast, and dyn_cast...
- static bool classof(const CallDSNode *) { return true; }
- static bool classof(const DSNode *N) { return N->NodeType == CallNode; }
-private:
- virtual CallDSNode *cloneImpl() const { return new CallDSNode(CI); }
- virtual void mapNode(std::map<const DSNode*, DSNode*> &NodeMap,
- const DSNode *Old);
-};
-
+ // print - Print out the analysis results...
+ void print(std::ostream &O, const Module *M) const;
-// ArgDSNode - Represent an incoming argument to the current function...
-//
-class ArgDSNode : public DSNode {
- FunctionArgument *FuncArg;
-public:
- ArgDSNode(FunctionArgument *MA);
- virtual std::string getCaption() const;
-
- // isEquivalentTo - Return true if the nodes should be merged...
- virtual bool isEquivalentTo(DSNode *Node) const;
+ // If the pass pipeline is done with this pass, we can release our memory...
+ virtual void releaseMemory();
- // Support type inquiry through isa, cast, and dyn_cast...
- static bool classof(const ArgDSNode *) { return true; }
- static bool classof(const DSNode *N) { return N->NodeType == ArgNode; }
+ virtual void getAnalysisUsage(AnalysisUsage &AU) const {
+ AU.setPreservesAll();
+ AU.addRequired<LocalDataStructures>();
+ }
private:
- virtual ArgDSNode *cloneImpl() const { return new ArgDSNode(FuncArg); }
+ DSGraph &calculateGraph(Function &F);
};
-
-// ShadowDSNode - Represent a chunk of memory that we need to be able to
-// address. These are generated due to (for example) pointer type method
-// arguments... if the pointer is dereferenced, we need to have a node to point
-// to. When functions are integrated into each other, shadow nodes are
-// resolved.
-//
-// Shadow nodes may be marked as "critical" nodes when they are created. This
-// mark indicates that the node is the result of a function call, the value
-// pointed to by an incoming argument, or the value pointed to by a global
-// variable [fixme todo]. Since it is not possible to know what these nodes
-// point to, given just the current context, they are marked "Critical" to avoid
-// having the shadow node merger eliminate them.
+// TDDataStructures - Analysis that computes new data structure graphs
+// for each function using the closed graphs for the callers computed
+// by the bottom-up pass.
//
-class ShadowDSNode : public DSNode {
- friend class FunctionDSGraph;
- DSNode *Parent;
- Module *Mod;
- ShadowDSNode *ShadowParent; // Nonnull if this is a synthesized node...
- std::vector<std::pair<const Type *, ShadowDSNode *> > SynthNodes;
- bool CriticalNode;
+class TDDataStructures : public Pass {
+ // DSInfo, one graph for each function
+ std::map<const Function*, DSGraph*> DSInfo;
+ std::set<const Function*> GraphDone;
public:
- ShadowDSNode(DSNode *Parent, Module *M, bool Critical = false);
- virtual std::string getCaption() const;
+ ~TDDataStructures() { releaseMemory(); }
- // synthesizeNode - Create a new shadow node that is to be linked into this
- // chain..
- //
- ShadowDSNode *synthesizeNode(const Type *Ty, FunctionRepBuilder *Rep);
-
- bool isCriticalNode() const { return CriticalNode; }
- void resetCriticalMark() { CriticalNode = false; }
-
- // isEquivalentTo - Return true if the nodes should be merged...
- virtual bool isEquivalentTo(DSNode *Node) const;
-
- // Support type inquiry through isa, cast, and dyn_cast...
- static bool classof(const ShadowDSNode *) { return true; }
- static bool classof(const DSNode *N) { return N->NodeType == ShadowNode; }
+ virtual bool run(Module &M);
-private:
- ShadowDSNode(const Type *Ty, Module *M, ShadowDSNode *ShadParent);
-protected:
- virtual void mapNode(std::map<const DSNode*, DSNode*> &NodeMap,
- const DSNode *Old);
- virtual ShadowDSNode *cloneImpl() const {
- if (ShadowParent)
- return new ShadowDSNode(getType(), Mod, ShadowParent);
- else
- return new ShadowDSNode(Parent, Mod, CriticalNode);
+ // getDSGraph - Return the data structure graph for the specified function.
+ DSGraph &getDSGraph(const Function &F) const {
+ std::map<const Function*, DSGraph*>::const_iterator I = DSInfo.find(&F);
+ assert(I != DSInfo.end() && "Function not in module!");
+ return *I->second;
}
-};
+ // print - Print out the analysis results...
+ void print(std::ostream &O, const Module *M) const;
-// FunctionDSGraph - The graph that represents a method.
-//
-class FunctionDSGraph {
- Function *Func;
- std::vector<ArgDSNode*> ArgNodes;
- std::vector<AllocDSNode*> AllocNodes;
- std::vector<ShadowDSNode*> ShadowNodes;
- std::vector<GlobalDSNode*> GlobalNodes;
- std::vector<CallDSNode*> CallNodes;
- PointerValSet RetNode; // Node that gets returned...
- std::map<Value*, PointerValSet> ValueMap;
-
- // cloneFunctionIntoSelf - Clone the specified method graph into the current
- // method graph, returning the Return's set of the graph. If ValueMap is set
- // to true, the ValueMap of the function is cloned into this function as well
- // as the data structure graph itself.
- //
- PointerValSet cloneFunctionIntoSelf(const FunctionDSGraph &G, bool ValueMap);
- bool RemoveUnreachableNodes();
- bool UnlinkUndistinguishableNodes();
- void MarkEscapeableNodesReachable(std::vector<bool> &RSN,
- std::vector<bool> &RAN);
+ // If the pass pipeline is done with this pass, we can release our memory...
+ virtual void releaseMemory();
+ // getAnalysisUsage - This obviously provides a data structure graph.
+ virtual void getAnalysisUsage(AnalysisUsage &AU) const {
+ AU.setPreservesAll();
+ AU.addRequired<BUDataStructures>();
+ }
private:
- // Define the interface only accessable to DataStructure
- friend class DataStructure;
- FunctionDSGraph(Function *F);
- FunctionDSGraph(const FunctionDSGraph &DSG);
- ~FunctionDSGraph();
-
- void computeClosure(const DataStructure &DS);
-public:
+ void calculateGraph(Function &F);
+ DSGraph &getOrCreateDSGraph(Function &F);
- Function *getFunction() const { return Func; }
-
- // getEscapingAllocations - Add all allocations that escape the current
- // function to the specified vector.
- //
- void getEscapingAllocations(std::vector<AllocDSNode*> &Allocs);
-
- // getNonEscapingAllocations - Add all allocations that do not escape the
- // current function to the specified vector.
- //
- void getNonEscapingAllocations(std::vector<AllocDSNode*> &Allocs);
-
- // getValueMap - Get a map that describes what the nodes the scalars in this
- // function point to...
- //
- std::map<Value*, PointerValSet> &getValueMap() { return ValueMap; }
-
-
-
- void printFunction(std::ostream &O, const char *Label) const;
+ void ResolveCallSite(DSGraph &Graph, const DSCallSite &CallSite);
};
+#if 0
+// GlobalDSGraph - A common graph for all the globals and their outgoing links
+// to externally visible nodes. This includes GlobalValues, New nodes,
+// Cast nodes, and Calls. This graph can only be used by one of the
+// individual function graphs, and it goes away when they all go away.
+//
+class GlobalDSGraph : public DSGraph {
+ hash_set<const DSGraph*> Referrers;
+ void addReference(const DSGraph* referrer);
+ void removeReference(const DSGraph* referrer);
+ friend class DSGraph; // give access to Referrers
+
+ GlobalDSGraph(const GlobalDSGraph &GlobalDSG); // Do not implement
-// FIXME: This should be a FunctionPass. When the pass framework sees a 'Pass'
-// that uses the output of a FunctionPass, it should automatically build a map
-// of output from the method pass that the pass can use.
-//
-class DataStructure : public Pass {
- // DSInfo, one intraprocedural and one closed graph for each method...
- typedef std::map<Function*, std::pair<FunctionDSGraph*,
- FunctionDSGraph*> > InfoMap;
- mutable InfoMap DSInfo;
-public:
- static AnalysisID ID; // DataStructure Analysis ID
-
- DataStructure(AnalysisID id) { assert(id == ID); }
- ~DataStructure() { releaseMemory(); }
-
- // run - Do nothing, because methods are analyzed lazily
- virtual bool run(Module *TheModule) { return false; }
-
- // getDSGraph - Return the data structure graph for the specified method.
- // Since method graphs are lazily computed, we may have to create one on the
- // fly here.
- //
- FunctionDSGraph &getDSGraph(Function *F) const {
- std::pair<FunctionDSGraph*, FunctionDSGraph*> &N = DSInfo[F];
- if (N.first) return *N.first;
- return *(N.first = new FunctionDSGraph(F));
- }
-
- // getClosedDSGraph - Return the data structure graph for the specified
- // method. Since method graphs are lazily computed, we may have to create one
- // on the fly here. This is different than the normal DSGraph for the method
- // because any function calls that are resolvable will have the data structure
- // graphs of the called function incorporated into this function as well.
- //
- FunctionDSGraph &getClosedDSGraph(Function *F) const {
- std::pair<FunctionDSGraph*, FunctionDSGraph*> &N = DSInfo[F];
- if (N.second) return *N.second;
- N.second = new FunctionDSGraph(getDSGraph(F));
- N.second->computeClosure(*this);
- return *N.second;
- }
-
- // invalidateFunction - Inform this analysis that you changed the specified
- // function, so the graphs that depend on it are out of date.
- //
- void invalidateFunction(Function *F) const {
- // FIXME: THis should invalidate all functions who have inlined the
- // specified graph!
- //
- std::pair<FunctionDSGraph*, FunctionDSGraph*> &N = DSInfo[F];
- delete N.first;
- delete N.second;
- N.first = N.second = 0;
- }
-
- // print - Print out the analysis results...
- void print(std::ostream &O, Module *M) const;
+ // Helper function for cloneGlobals and cloneCalls
+ DSNode* cloneNodeInto(DSNode *OldNode,
+ std::map<const DSNode*, DSNode*> &NodeCache,
+ bool GlobalsAreFinal = false);
- // If the pass pipeline is done with this pass, we can release our memory...
- virtual void releaseMemory();
+public:
+ GlobalDSGraph(); // Create an empty DSGraph
+ virtual ~GlobalDSGraph();
- // getAnalysisUsageInfo - This obviously provides a call graph
- virtual void getAnalysisUsageInfo(AnalysisSet &Required,
- AnalysisSet &Destroyed,
- AnalysisSet &Provided) {
- Provided.push_back(ID);
- }
+ void cloneGlobals(DSGraph& Graph, bool CloneCalls = false);
+ void cloneCalls (DSGraph& Graph);
};
+#endif
#endif