1 //=-- ExplodedGraph.h - Local, Path-Sens. "Exploded Graph" -*- C++ -*-------==// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file defines the template classes ExplodedNode and ExplodedGraph, 11 // which represent a path-sensitive, intra-procedural "exploded graph." 12 // See "Precise interprocedural dataflow analysis via graph reachability" 13 // by Reps, Horwitz, and Sagiv 14 // (http://portal.acm.org/citation.cfm?id=199462) for the definition of an 15 // exploded graph. 16 // 17 //===----------------------------------------------------------------------===// 18 19 #ifndef LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H 20 #define LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H 21 22 #include "clang/AST/Decl.h" 23 #include "clang/Analysis/AnalysisDeclContext.h" 24 #include "clang/Analysis/ProgramPoint.h" 25 #include "clang/Analysis/Support/BumpVector.h" 26 #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState.h" 27 #include "llvm/ADT/DepthFirstIterator.h" 28 #include "llvm/ADT/FoldingSet.h" 29 #include "llvm/ADT/GraphTraits.h" 30 #include "llvm/ADT/SetVector.h" 31 #include "llvm/Support/Allocator.h" 32 #include "llvm/Support/Casting.h" 33 #include <memory> 34 #include <utility> 35 #include <vector> 36 37 namespace clang { 38 39 class CFG; 40 41 namespace ento { 42 43 class ExplodedGraph; 44 45 //===----------------------------------------------------------------------===// 46 // ExplodedGraph "implementation" classes. These classes are not typed to 47 // contain a specific kind of state. Typed-specialized versions are defined 48 // on top of these classes. 49 //===----------------------------------------------------------------------===// 50 51 // ExplodedNode is not constified all over the engine because we need to add 52 // successors to it at any time after creating it. 53 54 class ExplodedNode : public llvm::FoldingSetNode { 55 friend class ExplodedGraph; 56 friend class CoreEngine; 57 friend class NodeBuilder; 58 friend class BranchNodeBuilder; 59 friend class IndirectGotoNodeBuilder; 60 friend class SwitchNodeBuilder; 61 friend class EndOfFunctionNodeBuilder; 62 63 /// Efficiently stores a list of ExplodedNodes, or an optional flag. 64 /// 65 /// NodeGroup provides opaque storage for a list of ExplodedNodes, optimizing 66 /// for the case when there is only one node in the group. This is a fairly 67 /// common case in an ExplodedGraph, where most nodes have only one 68 /// predecessor and many have only one successor. It can also be used to 69 /// store a flag rather than a node list, which ExplodedNode uses to mark 70 /// whether a node is a sink. If the flag is set, the group is implicitly 71 /// empty and no nodes may be added. 72 class NodeGroup { 73 // Conceptually a discriminated union. If the low bit is set, the node is 74 // a sink. If the low bit is not set, the pointer refers to the storage 75 // for the nodes in the group. 76 // This is not a PointerIntPair in order to keep the storage type opaque. 77 uintptr_t P; 78 79 public: 80 NodeGroup(bool Flag = false) : P(Flag) { 81 assert(getFlag() == Flag); 82 } 83 84 ExplodedNode * const *begin() const; 85 86 ExplodedNode * const *end() const; 87 88 unsigned size() const; 89 90 bool empty() const { return P == 0 || getFlag() != 0; } 91 92 /// Adds a node to the list. 93 /// 94 /// The group must not have been created with its flag set. 95 void addNode(ExplodedNode *N, ExplodedGraph &G); 96 97 /// Replaces the single node in this group with a new node. 98 /// 99 /// Note that this should only be used when you know the group was not 100 /// created with its flag set, and that the group is empty or contains 101 /// only a single node. 102 void replaceNode(ExplodedNode *node); 103 104 /// Returns whether this group was created with its flag set. 105 bool getFlag() const { 106 return (P & 1); 107 } 108 }; 109 110 /// Location - The program location (within a function body) associated 111 /// with this node. 112 const ProgramPoint Location; 113 114 /// State - The state associated with this node. 115 ProgramStateRef State; 116 117 /// Preds - The predecessors of this node. 118 NodeGroup Preds; 119 120 /// Succs - The successors of this node. 121 NodeGroup Succs; 122 123 public: 124 explicit ExplodedNode(const ProgramPoint &loc, ProgramStateRef state, 125 bool IsSink) 126 : Location(loc), State(std::move(state)), Succs(IsSink) { 127 assert(isSink() == IsSink); 128 } 129 130 /// getLocation - Returns the edge associated with the given node. 131 ProgramPoint getLocation() const { return Location; } 132 133 const LocationContext *getLocationContext() const { 134 return getLocation().getLocationContext(); 135 } 136 137 const StackFrameContext *getStackFrame() const { 138 return getLocationContext()->getCurrentStackFrame(); 139 } 140 141 const Decl &getCodeDecl() const { return *getLocationContext()->getDecl(); } 142 143 CFG &getCFG() const { return *getLocationContext()->getCFG(); } 144 145 ParentMap &getParentMap() const {return getLocationContext()->getParentMap();} 146 147 template <typename T> 148 T &getAnalysis() const { 149 return *getLocationContext()->getAnalysis<T>(); 150 } 151 152 const ProgramStateRef &getState() const { return State; } 153 154 template <typename T> 155 Optional<T> getLocationAs() const LLVM_LVALUE_FUNCTION { 156 return Location.getAs<T>(); 157 } 158 159 /// Get the value of an arbitrary expression at this node. 160 SVal getSVal(const Stmt *S) const { 161 return getState()->getSVal(S, getLocationContext()); 162 } 163 164 static void Profile(llvm::FoldingSetNodeID &ID, 165 const ProgramPoint &Loc, 166 const ProgramStateRef &state, 167 bool IsSink) { 168 ID.Add(Loc); 169 ID.AddPointer(state.get()); 170 ID.AddBoolean(IsSink); 171 } 172 173 void Profile(llvm::FoldingSetNodeID& ID) const { 174 // We avoid copy constructors by not using accessors. 175 Profile(ID, Location, State, isSink()); 176 } 177 178 /// addPredeccessor - Adds a predecessor to the current node, and 179 /// in tandem add this node as a successor of the other node. 180 void addPredecessor(ExplodedNode *V, ExplodedGraph &G); 181 182 unsigned succ_size() const { return Succs.size(); } 183 unsigned pred_size() const { return Preds.size(); } 184 bool succ_empty() const { return Succs.empty(); } 185 bool pred_empty() const { return Preds.empty(); } 186 187 bool isSink() const { return Succs.getFlag(); } 188 189 bool hasSinglePred() const { 190 return (pred_size() == 1); 191 } 192 193 ExplodedNode *getFirstPred() { 194 return pred_empty() ? nullptr : *(pred_begin()); 195 } 196 197 const ExplodedNode *getFirstPred() const { 198 return const_cast<ExplodedNode*>(this)->getFirstPred(); 199 } 200 201 const ExplodedNode *getFirstSucc() const { 202 return succ_empty() ? nullptr : *(succ_begin()); 203 } 204 205 // Iterators over successor and predecessor vertices. 206 typedef ExplodedNode* const * succ_iterator; 207 typedef const ExplodedNode* const * const_succ_iterator; 208 typedef ExplodedNode* const * pred_iterator; 209 typedef const ExplodedNode* const * const_pred_iterator; 210 211 pred_iterator pred_begin() { return Preds.begin(); } 212 pred_iterator pred_end() { return Preds.end(); } 213 214 const_pred_iterator pred_begin() const { 215 return const_cast<ExplodedNode*>(this)->pred_begin(); 216 } 217 const_pred_iterator pred_end() const { 218 return const_cast<ExplodedNode*>(this)->pred_end(); 219 } 220 221 succ_iterator succ_begin() { return Succs.begin(); } 222 succ_iterator succ_end() { return Succs.end(); } 223 224 const_succ_iterator succ_begin() const { 225 return const_cast<ExplodedNode*>(this)->succ_begin(); 226 } 227 const_succ_iterator succ_end() const { 228 return const_cast<ExplodedNode*>(this)->succ_end(); 229 } 230 231 // For debugging. 232 233 public: 234 235 class Auditor { 236 public: 237 virtual ~Auditor(); 238 virtual void AddEdge(ExplodedNode *Src, ExplodedNode *Dst) = 0; 239 }; 240 241 static void SetAuditor(Auditor* A); 242 243 private: 244 void replaceSuccessor(ExplodedNode *node) { Succs.replaceNode(node); } 245 void replacePredecessor(ExplodedNode *node) { Preds.replaceNode(node); } 246 }; 247 248 typedef llvm::DenseMap<const ExplodedNode *, const ExplodedNode *> 249 InterExplodedGraphMap; 250 251 class ExplodedGraph { 252 protected: 253 friend class CoreEngine; 254 255 // Type definitions. 256 typedef std::vector<ExplodedNode *> NodeVector; 257 258 /// The roots of the simulation graph. Usually there will be only 259 /// one, but clients are free to establish multiple subgraphs within a single 260 /// SimulGraph. Moreover, these subgraphs can often merge when paths from 261 /// different roots reach the same state at the same program location. 262 NodeVector Roots; 263 264 /// The nodes in the simulation graph which have been 265 /// specially marked as the endpoint of an abstract simulation path. 266 NodeVector EndNodes; 267 268 /// Nodes - The nodes in the graph. 269 llvm::FoldingSet<ExplodedNode> Nodes; 270 271 /// BVC - Allocator and context for allocating nodes and their predecessor 272 /// and successor groups. 273 BumpVectorContext BVC; 274 275 /// NumNodes - The number of nodes in the graph. 276 unsigned NumNodes; 277 278 /// A list of recently allocated nodes that can potentially be recycled. 279 NodeVector ChangedNodes; 280 281 /// A list of nodes that can be reused. 282 NodeVector FreeNodes; 283 284 /// Determines how often nodes are reclaimed. 285 /// 286 /// If this is 0, nodes will never be reclaimed. 287 unsigned ReclaimNodeInterval; 288 289 /// Counter to determine when to reclaim nodes. 290 unsigned ReclaimCounter; 291 292 public: 293 294 /// \brief Retrieve the node associated with a (Location,State) pair, 295 /// where the 'Location' is a ProgramPoint in the CFG. If no node for 296 /// this pair exists, it is created. IsNew is set to true if 297 /// the node was freshly created. 298 ExplodedNode *getNode(const ProgramPoint &L, ProgramStateRef State, 299 bool IsSink = false, 300 bool* IsNew = nullptr); 301 302 /// \brief Create a node for a (Location, State) pair, 303 /// but don't store it for deduplication later. This 304 /// is useful when copying an already completed 305 /// ExplodedGraph for further processing. 306 ExplodedNode *createUncachedNode(const ProgramPoint &L, 307 ProgramStateRef State, 308 bool IsSink = false); 309 310 std::unique_ptr<ExplodedGraph> MakeEmptyGraph() const { 311 return llvm::make_unique<ExplodedGraph>(); 312 } 313 314 /// addRoot - Add an untyped node to the set of roots. 315 ExplodedNode *addRoot(ExplodedNode *V) { 316 Roots.push_back(V); 317 return V; 318 } 319 320 /// addEndOfPath - Add an untyped node to the set of EOP nodes. 321 ExplodedNode *addEndOfPath(ExplodedNode *V) { 322 EndNodes.push_back(V); 323 return V; 324 } 325 326 ExplodedGraph(); 327 328 ~ExplodedGraph(); 329 330 unsigned num_roots() const { return Roots.size(); } 331 unsigned num_eops() const { return EndNodes.size(); } 332 333 bool empty() const { return NumNodes == 0; } 334 unsigned size() const { return NumNodes; } 335 336 void reserve(unsigned NodeCount) { Nodes.reserve(NodeCount); } 337 338 // Iterators. 339 typedef ExplodedNode NodeTy; 340 typedef llvm::FoldingSet<ExplodedNode> AllNodesTy; 341 typedef NodeVector::iterator roots_iterator; 342 typedef NodeVector::const_iterator const_roots_iterator; 343 typedef NodeVector::iterator eop_iterator; 344 typedef NodeVector::const_iterator const_eop_iterator; 345 typedef AllNodesTy::iterator node_iterator; 346 typedef AllNodesTy::const_iterator const_node_iterator; 347 348 node_iterator nodes_begin() { return Nodes.begin(); } 349 350 node_iterator nodes_end() { return Nodes.end(); } 351 352 const_node_iterator nodes_begin() const { return Nodes.begin(); } 353 354 const_node_iterator nodes_end() const { return Nodes.end(); } 355 356 roots_iterator roots_begin() { return Roots.begin(); } 357 358 roots_iterator roots_end() { return Roots.end(); } 359 360 const_roots_iterator roots_begin() const { return Roots.begin(); } 361 362 const_roots_iterator roots_end() const { return Roots.end(); } 363 364 eop_iterator eop_begin() { return EndNodes.begin(); } 365 366 eop_iterator eop_end() { return EndNodes.end(); } 367 368 const_eop_iterator eop_begin() const { return EndNodes.begin(); } 369 370 const_eop_iterator eop_end() const { return EndNodes.end(); } 371 372 llvm::BumpPtrAllocator & getAllocator() { return BVC.getAllocator(); } 373 BumpVectorContext &getNodeAllocator() { return BVC; } 374 375 typedef llvm::DenseMap<const ExplodedNode*, ExplodedNode*> NodeMap; 376 377 /// Creates a trimmed version of the graph that only contains paths leading 378 /// to the given nodes. 379 /// 380 /// \param Nodes The nodes which must appear in the final graph. Presumably 381 /// these are end-of-path nodes (i.e. they have no successors). 382 /// \param[out] ForwardMap A optional map from nodes in this graph to nodes in 383 /// the returned graph. 384 /// \param[out] InverseMap An optional map from nodes in the returned graph to 385 /// nodes in this graph. 386 /// \returns The trimmed graph 387 std::unique_ptr<ExplodedGraph> 388 trim(ArrayRef<const NodeTy *> Nodes, 389 InterExplodedGraphMap *ForwardMap = nullptr, 390 InterExplodedGraphMap *InverseMap = nullptr) const; 391 392 /// Enable tracking of recently allocated nodes for potential reclamation 393 /// when calling reclaimRecentlyAllocatedNodes(). 394 void enableNodeReclamation(unsigned Interval) { 395 ReclaimCounter = ReclaimNodeInterval = Interval; 396 } 397 398 /// Reclaim "uninteresting" nodes created since the last time this method 399 /// was called. 400 void reclaimRecentlyAllocatedNodes(); 401 402 /// \brief Returns true if nodes for the given expression kind are always 403 /// kept around. 404 static bool isInterestingLValueExpr(const Expr *Ex); 405 406 private: 407 bool shouldCollect(const ExplodedNode *node); 408 void collectNode(ExplodedNode *node); 409 }; 410 411 class ExplodedNodeSet { 412 typedef llvm::SmallSetVector<ExplodedNode*, 4> ImplTy; 413 ImplTy Impl; 414 415 public: 416 ExplodedNodeSet(ExplodedNode *N) { 417 assert (N && !static_cast<ExplodedNode*>(N)->isSink()); 418 Impl.insert(N); 419 } 420 421 ExplodedNodeSet() {} 422 423 inline void Add(ExplodedNode *N) { 424 if (N && !static_cast<ExplodedNode*>(N)->isSink()) Impl.insert(N); 425 } 426 427 typedef ImplTy::iterator iterator; 428 typedef ImplTy::const_iterator const_iterator; 429 430 unsigned size() const { return Impl.size(); } 431 bool empty() const { return Impl.empty(); } 432 bool erase(ExplodedNode *N) { return Impl.remove(N); } 433 434 void clear() { Impl.clear(); } 435 void insert(const ExplodedNodeSet &S) { 436 assert(&S != this); 437 if (empty()) 438 Impl = S.Impl; 439 else 440 Impl.insert(S.begin(), S.end()); 441 } 442 443 inline iterator begin() { return Impl.begin(); } 444 inline iterator end() { return Impl.end(); } 445 446 inline const_iterator begin() const { return Impl.begin(); } 447 inline const_iterator end() const { return Impl.end(); } 448 }; 449 450 } // end GR namespace 451 452 } // end clang namespace 453 454 // GraphTraits 455 456 namespace llvm { 457 template<> struct GraphTraits<clang::ento::ExplodedNode*> { 458 typedef clang::ento::ExplodedNode *NodeRef; 459 typedef clang::ento::ExplodedNode::succ_iterator ChildIteratorType; 460 typedef llvm::df_iterator<NodeRef> nodes_iterator; 461 462 static NodeRef getEntryNode(NodeRef N) { return N; } 463 464 static ChildIteratorType child_begin(NodeRef N) { return N->succ_begin(); } 465 466 static ChildIteratorType child_end(NodeRef N) { return N->succ_end(); } 467 468 static nodes_iterator nodes_begin(NodeRef N) { return df_begin(N); } 469 470 static nodes_iterator nodes_end(NodeRef N) { return df_end(N); } 471 }; 472 473 template<> struct GraphTraits<const clang::ento::ExplodedNode*> { 474 typedef const clang::ento::ExplodedNode *NodeRef; 475 typedef clang::ento::ExplodedNode::const_succ_iterator ChildIteratorType; 476 typedef llvm::df_iterator<NodeRef> nodes_iterator; 477 478 static NodeRef getEntryNode(NodeRef N) { return N; } 479 480 static ChildIteratorType child_begin(NodeRef N) { return N->succ_begin(); } 481 482 static ChildIteratorType child_end(NodeRef N) { return N->succ_end(); } 483 484 static nodes_iterator nodes_begin(NodeRef N) { return df_begin(N); } 485 486 static nodes_iterator nodes_end(NodeRef N) { return df_end(N); } 487 }; 488 489 } // end llvm namespace 490 491 #endif 492