clang 23.0.0git
ExplodedGraph.h
Go to the documentation of this file.
1//===- ExplodedGraph.h - Local, Path-Sens. "Exploded Graph" -----*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the template classes ExplodedNode and ExplodedGraph,
10// which represent a path-sensitive, intra-procedural "exploded graph".
11// See "Precise interprocedural dataflow analysis via graph reachability"
12// by Reps, Horwitz, and Sagiv
13// (http://portal.acm.org/citation.cfm?id=199462) for the definition of an
14// exploded graph.
15//
16//===----------------------------------------------------------------------===//
17
18#ifndef LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H
19#define LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H
20
24#include "clang/Basic/LLVM.h"
28#include "llvm/ADT/ArrayRef.h"
29#include "llvm/ADT/DenseMap.h"
30#include "llvm/ADT/DepthFirstIterator.h"
31#include "llvm/ADT/FoldingSet.h"
32#include "llvm/ADT/GraphTraits.h"
33#include "llvm/ADT/STLExtras.h"
34#include "llvm/ADT/SetVector.h"
35#include "llvm/ADT/iterator_range.h"
36#include "llvm/Support/Allocator.h"
37#include "llvm/Support/Compiler.h"
38#include <cassert>
39#include <cstdint>
40#include <memory>
41#include <optional>
42#include <utility>
43#include <vector>
44
45namespace clang {
46
47class CFG;
48class Decl;
49class Expr;
50class ParentMap;
51class Stmt;
52
53namespace ento {
54
55class ExplodedGraph;
56
57//===----------------------------------------------------------------------===//
58// ExplodedGraph "implementation" classes. These classes are not typed to
59// contain a specific kind of state. Typed-specialized versions are defined
60// on top of these classes.
61//===----------------------------------------------------------------------===//
62
63// ExplodedNode is not constified all over the engine because we need to add
64// successors to it at any time after creating it.
65
66class ExplodedNode : public llvm::FoldingSetNode {
67 friend class CoreEngine;
68 friend class ExplodedGraph;
69 friend class NodeBuilder;
70
71 /// Efficiently stores a list of ExplodedNodes, or an optional flag.
72 ///
73 /// NodeGroup provides opaque storage for a list of ExplodedNodes, optimizing
74 /// for the case when there is only one node in the group. This is a fairly
75 /// common case in an ExplodedGraph, where most nodes have only one
76 /// predecessor and many have only one successor. It can also be used to
77 /// store a flag rather than a node list, which ExplodedNode uses to mark
78 /// whether a node is a sink. If the flag is set, the group is implicitly
79 /// empty and no nodes may be added.
80 class NodeGroup {
81 // Conceptually a discriminated union. If the low bit is set, the node is
82 // a sink. If the low bit is not set, the pointer refers to the storage
83 // for the nodes in the group.
84 // This is not a PointerIntPair in order to keep the storage type opaque.
85 uintptr_t P;
86
87 public:
88 NodeGroup(bool Flag = false) : P(Flag) {
89 assert(getFlag() == Flag);
90 }
91
92 ExplodedNode * const *begin() const;
93
94 ExplodedNode * const *end() const;
95
96 unsigned size() const;
97
98 bool empty() const { return P == 0 || getFlag() != 0; }
99
100 /// Adds a node to the list.
101 ///
102 /// The group must not have been created with its flag set.
103 void addNode(ExplodedNode *N, ExplodedGraph &G);
104
105 /// Replaces the single node in this group with a new node.
106 ///
107 /// Note that this should only be used when you know the group was not
108 /// created with its flag set, and that the group is empty or contains
109 /// only a single node.
110 void replaceNode(ExplodedNode *node);
111
112 /// Returns whether this group was created with its flag set.
113 bool getFlag() const {
114 return (P & 1);
115 }
116 };
117
118 /// Location - The program location (within a function body) associated
119 /// with this node.
120 const ProgramPoint Location;
121
122 /// State - The state associated with this node.
123 ProgramStateRef State;
124
125 /// Preds - The predecessors of this node.
126 NodeGroup Preds;
127
128 /// Succs - The successors of this node.
129 NodeGroup Succs;
130
131 int64_t Id;
132
133public:
135 int64_t Id, bool IsSink)
136 : Location(loc), State(std::move(state)), Succs(IsSink), Id(Id) {
137 assert(isSink() == IsSink);
138 }
139
140 /// getLocation - Returns the edge associated with the given node.
141 ProgramPoint getLocation() const { return Location; }
142
145 }
146
148 return getLocation().getStackFrame();
149 }
150
151 const Decl &getCodeDecl() const { return *getLocationContext()->getDecl(); }
152
153 CFG &getCFG() const { return *getLocationContext()->getCFG(); }
154
155 const CFGBlock *getCFGBlock() const;
156
157 const ParentMap &getParentMap() const {
159 }
160
161 template <typename T> T &getAnalysis() const {
162 return *getLocationContext()->getAnalysis<T>();
163 }
164
165 const ProgramStateRef &getState() const { return State; }
166
167 template <typename T> std::optional<T> getLocationAs() const & {
168 return Location.getAs<T>();
169 }
170
171 /// Get the value of an arbitrary expression at this node.
172 SVal getSVal(const Stmt *S) const {
173 return getState()->getSVal(S, getLocationContext());
174 }
175
176 static void Profile(llvm::FoldingSetNodeID &ID,
177 const ProgramPoint &Loc,
178 const ProgramStateRef &state,
179 bool IsSink) {
180 ID.Add(Loc);
181 ID.AddPointer(state.get());
182 ID.AddBoolean(IsSink);
183 }
184
185 void Profile(llvm::FoldingSetNodeID& ID) const {
186 // We avoid copy constructors by not using accessors.
187 Profile(ID, Location, State, isSink());
188 }
189
190 /// addPredeccessor - Adds a predecessor to the current node, and
191 /// in tandem add this node as a successor of the other node.
193
194 unsigned succ_size() const { return Succs.size(); }
195 unsigned pred_size() const { return Preds.size(); }
196 bool succ_empty() const { return Succs.empty(); }
197 bool pred_empty() const { return Preds.empty(); }
198
199 bool isSink() const { return Succs.getFlag(); }
200
201 bool hasSinglePred() const {
202 return (pred_size() == 1);
203 }
204
206 return pred_empty() ? nullptr : *(pred_begin());
207 }
208
209 const ExplodedNode *getFirstPred() const {
210 return const_cast<ExplodedNode*>(this)->getFirstPred();
211 }
212
214 return succ_empty() ? nullptr : *(succ_begin());
215 }
216
217 const ExplodedNode *getFirstSucc() const {
218 return const_cast<ExplodedNode*>(this)->getFirstSucc();
219 }
220
221 // Iterators over successor and predecessor vertices.
222 using succ_iterator = ExplodedNode * const *;
223 using succ_range = llvm::iterator_range<succ_iterator>;
224
225 using const_succ_iterator = const ExplodedNode * const *;
226 using const_succ_range = llvm::iterator_range<const_succ_iterator>;
227
228 using pred_iterator = ExplodedNode * const *;
229 using pred_range = llvm::iterator_range<pred_iterator>;
230
231 using const_pred_iterator = const ExplodedNode * const *;
232 using const_pred_range = llvm::iterator_range<const_pred_iterator>;
233
234 pred_iterator pred_begin() { return Preds.begin(); }
235 pred_iterator pred_end() { return Preds.end(); }
236 pred_range preds() { return {Preds.begin(), Preds.end()}; }
237
239 return const_cast<ExplodedNode*>(this)->pred_begin();
240 }
242 return const_cast<ExplodedNode*>(this)->pred_end();
243 }
244 const_pred_range preds() const { return {Preds.begin(), Preds.end()}; }
245
246 succ_iterator succ_begin() { return Succs.begin(); }
247 succ_iterator succ_end() { return Succs.end(); }
248 succ_range succs() { return {Succs.begin(), Succs.end()}; }
249
251 return const_cast<ExplodedNode*>(this)->succ_begin();
252 }
254 return const_cast<ExplodedNode*>(this)->succ_end();
255 }
256 const_succ_range succs() const { return {Succs.begin(), Succs.end()}; }
257
258 int64_t getID() const { return Id; }
259
260 /// The node is trivial if it has only one successor, only one predecessor,
261 /// it's predecessor has only one successor,
262 /// and its program state is the same as the program state of the previous
263 /// node.
264 /// Trivial nodes may be skipped while printing exploded graph.
265 bool isTrivial() const;
266
267 /// If the node's program point corresponds to a statement, retrieve that
268 /// statement. Useful for figuring out where to put a warning or a note.
269 /// If the statement belongs to a body-farmed definition,
270 /// retrieve the call site for that definition.
271 const Stmt *getStmtForDiagnostics() const;
272
273 /// Find the next statement that was executed on this node's execution path.
274 /// Useful for explaining control flow that follows the current node.
275 /// If the statement belongs to a body-farmed definition, retrieve the
276 /// call site for that definition.
277 const Stmt *getNextStmtForDiagnostics() const;
278
279 /// Find the statement that was executed immediately before this node.
280 /// Useful when the node corresponds to a CFG block entrance.
281 /// If the statement belongs to a body-farmed definition, retrieve the
282 /// call site for that definition.
283 const Stmt *getPreviousStmtForDiagnostics() const;
284
285 /// Find the statement that was executed at or immediately before this node.
286 /// Useful when any nearby statement will do.
287 /// If the statement belongs to a body-farmed definition, retrieve the
288 /// call site for that definition.
290
291private:
292 void replaceSuccessor(ExplodedNode *node) { Succs.replaceNode(node); }
293 void replacePredecessor(ExplodedNode *node) { Preds.replaceNode(node); }
294};
295
297 llvm::DenseMap<const ExplodedNode *, const ExplodedNode *>;
298
300protected:
301 friend class CoreEngine;
302
303 // Type definitions.
304 using NodeVector = std::vector<ExplodedNode *>;
305
306 /// The root of the simulation graph. Can be nullptr if the graph is empty or
307 /// if it was populated by `createUncachedNode()`.
308 ExplodedNode *Root = nullptr;
309
310 /// The nodes in the simulation graph which have been
311 /// specially marked as the endpoint of an abstract simulation path.
313
314 /// Nodes - The nodes in the graph.
315 llvm::FoldingSet<ExplodedNode> Nodes;
316
317 /// BVC - Allocator and context for allocating nodes and their predecessor
318 /// and successor groups.
320
321 /// NumNodes - The number of nodes in the graph.
322 int64_t NumNodes = 0;
323
324 /// A list of recently allocated nodes that can potentially be recycled.
326
327 /// A list of nodes that can be reused.
329
330 /// Determines how often nodes are reclaimed.
331 ///
332 /// If this is 0, nodes will never be reclaimed.
334
335 /// Counter to determine when to reclaim nodes.
337
338public:
341
342 /// Get the root node of the graph. This may return nullptr if the graph is
343 /// empty or under construction.
344 ExplodedNode *getRoot() const { return Root; }
345
346 /// Retrieve the node associated with a (Location, State) pair, where the
347 /// 'Location' is a ProgramPoint in the CFG. If no node for this pair exists,
348 /// it is created. IsNew is set to true if the node was freshly created.
350 bool IsSink = false,
351 bool* IsNew = nullptr);
352
353 /// Create a node for a (Location, State) pair, but don't store it for
354 /// deduplication later. This is useful when copying some nodes from an
355 /// already completed ExplodedGraph for further processing.
357 ProgramStateRef State,
358 int64_t Id,
359 bool IsSink = false);
360
361 /// Mark a node as the root of the graph. Calling this is an error if the
362 /// graph already has a root node.
364 assert(V && "Cannot designate nullptr as root!");
365 assert(!Root && "The graph already has a root, cannot designate another!");
366 Root = V;
367 }
368
369 /// addEndOfPath - Add an untyped node to the set of EOP nodes.
371 EndNodes.push_back(V);
372 return V;
373 }
374
375 unsigned num_eops() const { return EndNodes.size(); }
376
377 bool empty() const { return NumNodes == 0; }
378 unsigned size() const { return NumNodes; }
379
380 void reserve(unsigned NodeCount) { Nodes.reserve(NodeCount); }
381
382 // Iterators.
384 using AllNodesTy = llvm::FoldingSet<ExplodedNode>;
385 using eop_iterator = NodeVector::iterator;
386 using const_eop_iterator = NodeVector::const_iterator;
387 using node_iterator = AllNodesTy::iterator;
388 using const_node_iterator = AllNodesTy::const_iterator;
389
390 llvm::iterator_range<node_iterator> nodes() { return Nodes; }
391
392 llvm::iterator_range<const_node_iterator> nodes() const { return Nodes; }
393
394 eop_iterator eop_begin() { return EndNodes.begin(); }
395
396 eop_iterator eop_end() { return EndNodes.end(); }
397
398 const_eop_iterator eop_begin() const { return EndNodes.begin(); }
399
400 const_eop_iterator eop_end() const { return EndNodes.end(); }
401
402 llvm::BumpPtrAllocator & getAllocator() { return BVC.getAllocator(); }
404
405 using NodeMap = llvm::DenseMap<const ExplodedNode *, ExplodedNode *>;
406
407 /// Creates a trimmed version of the graph that only contains paths leading
408 /// to the given nodes.
409 ///
410 /// \param Nodes The nodes which must appear in the final graph. Presumably
411 /// these are end-of-path nodes (i.e. they have no successors).
412 /// \param[out] ForwardMap An optional map from nodes in this graph to nodes
413 /// in the returned graph.
414 /// \param[out] InverseMap An optional map from nodes in the returned graph to
415 /// nodes in this graph.
416 /// \returns The trimmed graph
417 std::unique_ptr<ExplodedGraph>
419 InterExplodedGraphMap *ForwardMap = nullptr,
420 InterExplodedGraphMap *InverseMap = nullptr) const;
421
422 /// Enable tracking of recently allocated nodes for potential reclamation
423 /// when calling reclaimRecentlyAllocatedNodes().
424 void enableNodeReclamation(unsigned Interval) {
426 }
427
428 /// Reclaim "uninteresting" nodes created since the last time this method
429 /// was called.
431
432 /// Returns true if nodes for the given expression kind are always
433 /// kept around.
434 static bool isInterestingLValueExpr(const Expr *Ex);
435
436private:
437 bool shouldCollect(const ExplodedNode *node);
438 void collectNode(ExplodedNode *node);
439};
440
441/// ExplodedNodeSet is a set of `ExplodedNode *` elements with the invariant
442/// that its elements cannot be nullpointers or sink nodes. Insertion of null
443/// or sink nodes is silently ignored (which is comfortable in many use cases).
444/// Note that `ExplodedNode *` is implicitly convertible to an
445/// `ExplodedNodeSet` containing 0 or 1 elements (where null pointers and sink
446/// nodes converted to the empty set).
447/// This type has set semantics (repeated insertions are ignored), but the
448/// iteration order is always the order of (first) insertion.
451 ImplTy Impl;
452
453public:
455
456 ExplodedNodeSet() = default;
457
458 using iterator = ImplTy::iterator;
459 using const_iterator = ImplTy::const_iterator;
460
461 unsigned size() const { return Impl.size(); }
462 bool empty() const { return Impl.empty(); }
463 bool erase(ExplodedNode *N) { return Impl.remove(N); }
464
465 void clear() { Impl.clear(); }
466
468 if (N && !N->isSink())
469 Impl.insert(N);
470 }
471
472 void insert(const ExplodedNodeSet &S) {
473 if (&S == this)
474 return;
475 if (empty())
476 Impl = S.Impl;
477 else
478 Impl.insert_range(S);
479 }
480
481 iterator begin() { return Impl.begin(); }
482 iterator end() { return Impl.end(); }
483
484 const_iterator begin() const { return Impl.begin(); }
485 const_iterator end() const { return Impl.end(); }
486};
487
488} // namespace ento
489
490} // namespace clang
491
492// GraphTraits
493
494namespace llvm {
495 template <> struct GraphTraits<clang::ento::ExplodedGraph *> {
499 using nodes_iterator = llvm::df_iterator<GraphTy>;
500
501 static NodeRef getEntryNode(const GraphTy G) { return G->getRoot(); }
502
504 return N->succ_size() == 1 && N->getFirstSucc()->isTrivial();
505 }
506
509 return child_begin(*N->succ_begin());
510 return N->succ_begin();
511 }
512
515 return child_end(N->getFirstSucc());
516 return N->succ_end();
517 }
518
520 return df_begin(G);
521 }
522
524 return df_end(G);
525 }
526 };
527} // namespace llvm
528
529#endif // LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H
#define V(N, I)
This file defines AnalysisDeclContext, a class that manages the analysis context data for context sen...
Forward-declares and imports various common LLVM datatypes that clang wants to use unqualified.
Represents a single basic block in a source-level CFG.
Definition CFG.h:632
Represents a source-level, intra-procedural CFG that represents the control-flow of a Stmt.
Definition CFG.h:1250
Decl - This represents one declaration (or definition), e.g.
Definition DeclBase.h:86
This represents one expression.
Definition Expr.h:112
It wraps the AnalysisDeclContext to represent both the call stack with the help of StackFrameContext ...
const Decl * getDecl() const
const ParentMap & getParentMap() const
const StackFrameContext * getStackFrame() const
const LocationContext * getLocationContext() const
It represents a stack frame of the call stack (based on CallEvent).
Stmt - This represents one statement.
Definition Stmt.h:86
std::unique_ptr< ExplodedGraph > trim(ArrayRef< const NodeTy * > Nodes, InterExplodedGraphMap *ForwardMap=nullptr, InterExplodedGraphMap *InverseMap=nullptr) const
Creates a trimmed version of the graph that only contains paths leading to the given nodes.
BumpVectorContext & getNodeAllocator()
std::vector< ExplodedNode * > NodeVector
unsigned ReclaimCounter
Counter to determine when to reclaim nodes.
void reserve(unsigned NodeCount)
NodeVector ChangedNodes
A list of recently allocated nodes that can potentially be recycled.
int64_t NumNodes
NumNodes - The number of nodes in the graph.
void enableNodeReclamation(unsigned Interval)
Enable tracking of recently allocated nodes for potential reclamation when calling reclaimRecentlyAll...
unsigned ReclaimNodeInterval
Determines how often nodes are reclaimed.
NodeVector EndNodes
The nodes in the simulation graph which have been specially marked as the endpoint of an abstract sim...
NodeVector::iterator eop_iterator
llvm::iterator_range< const_node_iterator > nodes() const
void reclaimRecentlyAllocatedNodes()
Reclaim "uninteresting" nodes created since the last time this method was called.
static bool isInterestingLValueExpr(const Expr *Ex)
Returns true if nodes for the given expression kind are always kept around.
AllNodesTy::const_iterator const_node_iterator
llvm::BumpPtrAllocator & getAllocator()
AllNodesTy::iterator node_iterator
llvm::FoldingSet< ExplodedNode > AllNodesTy
ExplodedNode * getNode(const ProgramPoint &L, ProgramStateRef State, bool IsSink=false, bool *IsNew=nullptr)
Retrieve the node associated with a (Location, State) pair, where the 'Location' is a ProgramPoint in...
const_eop_iterator eop_begin() const
NodeVector::const_iterator const_eop_iterator
BumpVectorContext BVC
BVC - Allocator and context for allocating nodes and their predecessor and successor groups.
llvm::iterator_range< node_iterator > nodes()
ExplodedNode * getRoot() const
Get the root node of the graph.
void designateAsRoot(ExplodedNode *V)
Mark a node as the root of the graph.
ExplodedNode * createUncachedNode(const ProgramPoint &L, ProgramStateRef State, int64_t Id, bool IsSink=false)
Create a node for a (Location, State) pair, but don't store it for deduplication later.
llvm::FoldingSet< ExplodedNode > Nodes
Nodes - The nodes in the graph.
llvm::DenseMap< const ExplodedNode *, ExplodedNode * > NodeMap
ExplodedNode * Root
The root of the simulation graph.
ExplodedNode * addEndOfPath(ExplodedNode *V)
addEndOfPath - Add an untyped node to the set of EOP nodes.
NodeVector FreeNodes
A list of nodes that can be reused.
const_eop_iterator eop_end() const
void insert(ExplodedNode *N)
bool erase(ExplodedNode *N)
ExplodedNodeSet(ExplodedNode *N)
ImplTy::const_iterator const_iterator
void insert(const ExplodedNodeSet &S)
const_iterator end() const
const_iterator begin() const
const CFGBlock * getCFGBlock() const
llvm::iterator_range< pred_iterator > pred_range
const ProgramStateRef & getState() const
llvm::iterator_range< const_succ_iterator > const_succ_range
const_pred_iterator pred_begin() const
const Stmt * getStmtForDiagnostics() const
If the node's program point corresponds to a statement, retrieve that statement.
const_succ_iterator succ_begin() const
llvm::iterator_range< succ_iterator > succ_range
bool isTrivial() const
The node is trivial if it has only one successor, only one predecessor, it's predecessor has only one...
const Stmt * getPreviousStmtForDiagnostics() const
Find the statement that was executed immediately before this node.
void Profile(llvm::FoldingSetNodeID &ID) const
ProgramPoint getLocation() const
getLocation - Returns the edge associated with the given node.
void addPredecessor(ExplodedNode *V, ExplodedGraph &G)
addPredeccessor - Adds a predecessor to the current node, and in tandem add this node as a successor ...
llvm::iterator_range< const_pred_iterator > const_pred_range
ExplodedNode * getFirstSucc()
unsigned pred_size() const
static void Profile(llvm::FoldingSetNodeID &ID, const ProgramPoint &Loc, const ProgramStateRef &state, bool IsSink)
const ExplodedNode * getFirstSucc() const
ExplodedNode(const ProgramPoint &loc, ProgramStateRef state, int64_t Id, bool IsSink)
const_succ_range succs() const
const Stmt * getNextStmtForDiagnostics() const
Find the next statement that was executed on this node's execution path.
const StackFrameContext * getStackFrame() const
ExplodedNode *const * succ_iterator
const ExplodedNode * getFirstPred() const
const_pred_range preds() const
const ParentMap & getParentMap() const
SVal getSVal(const Stmt *S) const
Get the value of an arbitrary expression at this node.
const LocationContext * getLocationContext() const
std::optional< T > getLocationAs() const &
const Stmt * getCurrentOrPreviousStmtForDiagnostics() const
Find the statement that was executed at or immediately before this node.
const ExplodedNode *const * const_pred_iterator
ExplodedNode * getFirstPred()
const_succ_iterator succ_end() const
unsigned succ_size() const
ExplodedNode *const * pred_iterator
const ExplodedNode *const * const_succ_iterator
const Decl & getCodeDecl() const
const_pred_iterator pred_end() const
SVal - This represents a symbolic expression, which can be either an L-value or an R-value.
Definition SVals.h:56
llvm::DenseMap< const ExplodedNode *, const ExplodedNode * > InterExplodedGraphMap
IntrusiveRefCntPtr< const ProgramState > ProgramStateRef
const Fact * ProgramPoint
A ProgramPoint identifies a location in the CFG by pointing to a specific Fact.
Definition Facts.h:91
The JSON file list parser is used to communicate input to InstallAPI.
nullptr
This class represents a compute construct, representing a 'Kind' of ‘parallel’, 'serial',...
long int64_t
Diagnostic wrappers for TextAPI types for error reporting.
Definition Dominators.h:30
__UINTPTR_TYPE__ uintptr_t
An unsigned integer type with the property that any valid pointer to void can be converted to this ty...
static nodes_iterator nodes_end(const GraphTy G)
static nodes_iterator nodes_begin(const GraphTy G)
static ChildIteratorType child_end(NodeRef N)
clang::ento::ExplodedNode::succ_iterator ChildIteratorType
static NodeRef getEntryNode(const GraphTy G)
static ChildIteratorType child_begin(NodeRef N)