clang 23.0.0git
ExplodedGraph.h
Go to the documentation of this file.
1//===- ExplodedGraph.h - Local, Path-Sens. "Exploded Graph" -----*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the template classes ExplodedNode and ExplodedGraph,
10// which represent a path-sensitive, intra-procedural "exploded graph".
11// See "Precise interprocedural dataflow analysis via graph reachability"
12// by Reps, Horwitz, and Sagiv
13// (http://portal.acm.org/citation.cfm?id=199462) for the definition of an
14// exploded graph.
15//
16//===----------------------------------------------------------------------===//
17
18#ifndef LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H
19#define LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H
20
24#include "clang/Basic/LLVM.h"
28#include "llvm/ADT/ArrayRef.h"
29#include "llvm/ADT/DenseMap.h"
30#include "llvm/ADT/DepthFirstIterator.h"
31#include "llvm/ADT/FoldingSet.h"
32#include "llvm/ADT/GraphTraits.h"
33#include "llvm/ADT/STLExtras.h"
34#include "llvm/ADT/SetVector.h"
35#include "llvm/ADT/iterator_range.h"
36#include "llvm/Support/Allocator.h"
37#include "llvm/Support/Compiler.h"
38#include <cassert>
39#include <cstdint>
40#include <memory>
41#include <optional>
42#include <utility>
43#include <vector>
44
45namespace clang {
46
47class CFG;
48class Decl;
49class Expr;
50class ParentMap;
51class Stmt;
52
53namespace ento {
54
55class ExplodedGraph;
56
57//===----------------------------------------------------------------------===//
58// ExplodedGraph "implementation" classes. These classes are not typed to
59// contain a specific kind of state. Typed-specialized versions are defined
60// on top of these classes.
61//===----------------------------------------------------------------------===//
62
63// ExplodedNode is not constified all over the engine because we need to add
64// successors to it at any time after creating it.
65
66class ExplodedNode : public llvm::FoldingSetNode {
67 friend class BranchNodeBuilder;
68 friend class CoreEngine;
69 friend class ExplodedGraph;
71 friend class NodeBuilder;
72 friend class SwitchNodeBuilder;
73
74 /// Efficiently stores a list of ExplodedNodes, or an optional flag.
75 ///
76 /// NodeGroup provides opaque storage for a list of ExplodedNodes, optimizing
77 /// for the case when there is only one node in the group. This is a fairly
78 /// common case in an ExplodedGraph, where most nodes have only one
79 /// predecessor and many have only one successor. It can also be used to
80 /// store a flag rather than a node list, which ExplodedNode uses to mark
81 /// whether a node is a sink. If the flag is set, the group is implicitly
82 /// empty and no nodes may be added.
83 class NodeGroup {
84 // Conceptually a discriminated union. If the low bit is set, the node is
85 // a sink. If the low bit is not set, the pointer refers to the storage
86 // for the nodes in the group.
87 // This is not a PointerIntPair in order to keep the storage type opaque.
88 uintptr_t P;
89
90 public:
91 NodeGroup(bool Flag = false) : P(Flag) {
92 assert(getFlag() == Flag);
93 }
94
95 ExplodedNode * const *begin() const;
96
97 ExplodedNode * const *end() const;
98
99 unsigned size() const;
100
101 bool empty() const { return P == 0 || getFlag() != 0; }
102
103 /// Adds a node to the list.
104 ///
105 /// The group must not have been created with its flag set.
106 void addNode(ExplodedNode *N, ExplodedGraph &G);
107
108 /// Replaces the single node in this group with a new node.
109 ///
110 /// Note that this should only be used when you know the group was not
111 /// created with its flag set, and that the group is empty or contains
112 /// only a single node.
113 void replaceNode(ExplodedNode *node);
114
115 /// Returns whether this group was created with its flag set.
116 bool getFlag() const {
117 return (P & 1);
118 }
119 };
120
121 /// Location - The program location (within a function body) associated
122 /// with this node.
123 const ProgramPoint Location;
124
125 /// State - The state associated with this node.
126 ProgramStateRef State;
127
128 /// Preds - The predecessors of this node.
129 NodeGroup Preds;
130
131 /// Succs - The successors of this node.
132 NodeGroup Succs;
133
134 int64_t Id;
135
136public:
138 int64_t Id, bool IsSink)
139 : Location(loc), State(std::move(state)), Succs(IsSink), Id(Id) {
140 assert(isSink() == IsSink);
141 }
142
143 /// getLocation - Returns the edge associated with the given node.
144 ProgramPoint getLocation() const { return Location; }
145
148 }
149
151 return getLocation().getStackFrame();
152 }
153
154 const Decl &getCodeDecl() const { return *getLocationContext()->getDecl(); }
155
156 CFG &getCFG() const { return *getLocationContext()->getCFG(); }
157
158 const CFGBlock *getCFGBlock() const;
159
160 const ParentMap &getParentMap() const {
162 }
163
164 template <typename T> T &getAnalysis() const {
165 return *getLocationContext()->getAnalysis<T>();
166 }
167
168 const ProgramStateRef &getState() const { return State; }
169
170 template <typename T> std::optional<T> getLocationAs() const & {
171 return Location.getAs<T>();
172 }
173
174 /// Get the value of an arbitrary expression at this node.
175 SVal getSVal(const Stmt *S) const {
176 return getState()->getSVal(S, getLocationContext());
177 }
178
179 static void Profile(llvm::FoldingSetNodeID &ID,
180 const ProgramPoint &Loc,
181 const ProgramStateRef &state,
182 bool IsSink) {
183 ID.Add(Loc);
184 ID.AddPointer(state.get());
185 ID.AddBoolean(IsSink);
186 }
187
188 void Profile(llvm::FoldingSetNodeID& ID) const {
189 // We avoid copy constructors by not using accessors.
190 Profile(ID, Location, State, isSink());
191 }
192
193 /// addPredeccessor - Adds a predecessor to the current node, and
194 /// in tandem add this node as a successor of the other node.
196
197 unsigned succ_size() const { return Succs.size(); }
198 unsigned pred_size() const { return Preds.size(); }
199 bool succ_empty() const { return Succs.empty(); }
200 bool pred_empty() const { return Preds.empty(); }
201
202 bool isSink() const { return Succs.getFlag(); }
203
204 bool hasSinglePred() const {
205 return (pred_size() == 1);
206 }
207
209 return pred_empty() ? nullptr : *(pred_begin());
210 }
211
212 const ExplodedNode *getFirstPred() const {
213 return const_cast<ExplodedNode*>(this)->getFirstPred();
214 }
215
217 return succ_empty() ? nullptr : *(succ_begin());
218 }
219
220 const ExplodedNode *getFirstSucc() const {
221 return const_cast<ExplodedNode*>(this)->getFirstSucc();
222 }
223
224 // Iterators over successor and predecessor vertices.
225 using succ_iterator = ExplodedNode * const *;
226 using succ_range = llvm::iterator_range<succ_iterator>;
227
228 using const_succ_iterator = const ExplodedNode * const *;
229 using const_succ_range = llvm::iterator_range<const_succ_iterator>;
230
231 using pred_iterator = ExplodedNode * const *;
232 using pred_range = llvm::iterator_range<pred_iterator>;
233
234 using const_pred_iterator = const ExplodedNode * const *;
235 using const_pred_range = llvm::iterator_range<const_pred_iterator>;
236
237 pred_iterator pred_begin() { return Preds.begin(); }
238 pred_iterator pred_end() { return Preds.end(); }
239 pred_range preds() { return {Preds.begin(), Preds.end()}; }
240
242 return const_cast<ExplodedNode*>(this)->pred_begin();
243 }
245 return const_cast<ExplodedNode*>(this)->pred_end();
246 }
247 const_pred_range preds() const { return {Preds.begin(), Preds.end()}; }
248
249 succ_iterator succ_begin() { return Succs.begin(); }
250 succ_iterator succ_end() { return Succs.end(); }
251 succ_range succs() { return {Succs.begin(), Succs.end()}; }
252
254 return const_cast<ExplodedNode*>(this)->succ_begin();
255 }
257 return const_cast<ExplodedNode*>(this)->succ_end();
258 }
259 const_succ_range succs() const { return {Succs.begin(), Succs.end()}; }
260
261 int64_t getID() const { return Id; }
262
263 /// The node is trivial if it has only one successor, only one predecessor,
264 /// it's predecessor has only one successor,
265 /// and its program state is the same as the program state of the previous
266 /// node.
267 /// Trivial nodes may be skipped while printing exploded graph.
268 bool isTrivial() const;
269
270 /// If the node's program point corresponds to a statement, retrieve that
271 /// statement. Useful for figuring out where to put a warning or a note.
272 /// If the statement belongs to a body-farmed definition,
273 /// retrieve the call site for that definition.
274 const Stmt *getStmtForDiagnostics() const;
275
276 /// Find the next statement that was executed on this node's execution path.
277 /// Useful for explaining control flow that follows the current node.
278 /// If the statement belongs to a body-farmed definition, retrieve the
279 /// call site for that definition.
280 const Stmt *getNextStmtForDiagnostics() const;
281
282 /// Find the statement that was executed immediately before this node.
283 /// Useful when the node corresponds to a CFG block entrance.
284 /// If the statement belongs to a body-farmed definition, retrieve the
285 /// call site for that definition.
286 const Stmt *getPreviousStmtForDiagnostics() const;
287
288 /// Find the statement that was executed at or immediately before this node.
289 /// Useful when any nearby statement will do.
290 /// If the statement belongs to a body-farmed definition, retrieve the
291 /// call site for that definition.
293
294private:
295 void replaceSuccessor(ExplodedNode *node) { Succs.replaceNode(node); }
296 void replacePredecessor(ExplodedNode *node) { Preds.replaceNode(node); }
297};
298
300 llvm::DenseMap<const ExplodedNode *, const ExplodedNode *>;
301
303protected:
304 friend class CoreEngine;
305
306 // Type definitions.
307 using NodeVector = std::vector<ExplodedNode *>;
308
309 /// The root of the simulation graph. Can be nullptr if the graph is empty or
310 /// if it was populated by `createUncachedNode()`.
311 ExplodedNode *Root = nullptr;
312
313 /// The nodes in the simulation graph which have been
314 /// specially marked as the endpoint of an abstract simulation path.
316
317 /// Nodes - The nodes in the graph.
318 llvm::FoldingSet<ExplodedNode> Nodes;
319
320 /// BVC - Allocator and context for allocating nodes and their predecessor
321 /// and successor groups.
323
324 /// NumNodes - The number of nodes in the graph.
325 int64_t NumNodes = 0;
326
327 /// A list of recently allocated nodes that can potentially be recycled.
329
330 /// A list of nodes that can be reused.
332
333 /// Determines how often nodes are reclaimed.
334 ///
335 /// If this is 0, nodes will never be reclaimed.
337
338 /// Counter to determine when to reclaim nodes.
340
341public:
344
345 /// Get the root node of the graph. This may return nullptr if the graph is
346 /// empty or under construction.
347 ExplodedNode *getRoot() const { return Root; }
348
349 /// Retrieve the node associated with a (Location, State) pair, where the
350 /// 'Location' is a ProgramPoint in the CFG. If no node for this pair exists,
351 /// it is created. IsNew is set to true if the node was freshly created.
353 bool IsSink = false,
354 bool* IsNew = nullptr);
355
356 /// Create a node for a (Location, State) pair, but don't store it for
357 /// deduplication later. This is useful when copying some nodes from an
358 /// already completed ExplodedGraph for further processing.
360 ProgramStateRef State,
361 int64_t Id,
362 bool IsSink = false);
363
364 /// Mark a node as the root of the graph. Calling this is an error if the
365 /// graph already has a root node.
367 assert(V && "Cannot designate nullptr as root!");
368 assert(!Root && "The graph already has a root, cannot designate another!");
369 Root = V;
370 }
371
372 /// addEndOfPath - Add an untyped node to the set of EOP nodes.
374 EndNodes.push_back(V);
375 return V;
376 }
377
378 unsigned num_eops() const { return EndNodes.size(); }
379
380 bool empty() const { return NumNodes == 0; }
381 unsigned size() const { return NumNodes; }
382
383 void reserve(unsigned NodeCount) { Nodes.reserve(NodeCount); }
384
385 // Iterators.
387 using AllNodesTy = llvm::FoldingSet<ExplodedNode>;
388 using eop_iterator = NodeVector::iterator;
389 using const_eop_iterator = NodeVector::const_iterator;
390 using node_iterator = AllNodesTy::iterator;
391 using const_node_iterator = AllNodesTy::const_iterator;
392
393 llvm::iterator_range<node_iterator> nodes() { return Nodes; }
394
395 llvm::iterator_range<const_node_iterator> nodes() const { return Nodes; }
396
397 eop_iterator eop_begin() { return EndNodes.begin(); }
398
399 eop_iterator eop_end() { return EndNodes.end(); }
400
401 const_eop_iterator eop_begin() const { return EndNodes.begin(); }
402
403 const_eop_iterator eop_end() const { return EndNodes.end(); }
404
405 llvm::BumpPtrAllocator & getAllocator() { return BVC.getAllocator(); }
407
408 using NodeMap = llvm::DenseMap<const ExplodedNode *, ExplodedNode *>;
409
410 /// Creates a trimmed version of the graph that only contains paths leading
411 /// to the given nodes.
412 ///
413 /// \param Nodes The nodes which must appear in the final graph. Presumably
414 /// these are end-of-path nodes (i.e. they have no successors).
415 /// \param[out] ForwardMap An optional map from nodes in this graph to nodes
416 /// in the returned graph.
417 /// \param[out] InverseMap An optional map from nodes in the returned graph to
418 /// nodes in this graph.
419 /// \returns The trimmed graph
420 std::unique_ptr<ExplodedGraph>
422 InterExplodedGraphMap *ForwardMap = nullptr,
423 InterExplodedGraphMap *InverseMap = nullptr) const;
424
425 /// Enable tracking of recently allocated nodes for potential reclamation
426 /// when calling reclaimRecentlyAllocatedNodes().
427 void enableNodeReclamation(unsigned Interval) {
429 }
430
431 /// Reclaim "uninteresting" nodes created since the last time this method
432 /// was called.
434
435 /// Returns true if nodes for the given expression kind are always
436 /// kept around.
437 static bool isInterestingLValueExpr(const Expr *Ex);
438
439private:
440 bool shouldCollect(const ExplodedNode *node);
441 void collectNode(ExplodedNode *node);
442};
443
446 ImplTy Impl;
447
448public:
450 assert(N && !N->isSink());
451 Impl.insert(N);
452 }
453
454 ExplodedNodeSet() = default;
455
456 void Add(ExplodedNode *N) {
457 if (N && !N->isSink())
458 Impl.insert(N);
459 }
460
461 using iterator = ImplTy::iterator;
462 using const_iterator = ImplTy::const_iterator;
463
464 unsigned size() const { return Impl.size(); }
465 bool empty() const { return Impl.empty(); }
466 bool erase(ExplodedNode *N) { return Impl.remove(N); }
467
468 void clear() { Impl.clear(); }
469
470 void insert(const ExplodedNodeSet &S) {
471 assert(&S != this);
472 if (empty())
473 Impl = S.Impl;
474 else
475 Impl.insert_range(S);
476 }
477
478 iterator begin() { return Impl.begin(); }
479 iterator end() { return Impl.end(); }
480
481 const_iterator begin() const { return Impl.begin(); }
482 const_iterator end() const { return Impl.end(); }
483};
484
485} // namespace ento
486
487} // namespace clang
488
489// GraphTraits
490
491namespace llvm {
492 template <> struct GraphTraits<clang::ento::ExplodedGraph *> {
496 using nodes_iterator = llvm::df_iterator<GraphTy>;
497
498 static NodeRef getEntryNode(const GraphTy G) { return G->getRoot(); }
499
501 return N->succ_size() == 1 && N->getFirstSucc()->isTrivial();
502 }
503
506 return child_begin(*N->succ_begin());
507 return N->succ_begin();
508 }
509
512 return child_end(N->getFirstSucc());
513 return N->succ_end();
514 }
515
517 return df_begin(G);
518 }
519
521 return df_end(G);
522 }
523 };
524} // namespace llvm
525
526#endif // LLVM_CLANG_STATICANALYZER_CORE_PATHSENSITIVE_EXPLODEDGRAPH_H
#define V(N, I)
This file defines AnalysisDeclContext, a class that manages the analysis context data for context sen...
Forward-declares and imports various common LLVM datatypes that clang wants to use unqualified.
Represents a single basic block in a source-level CFG.
Definition CFG.h:632
Represents a source-level, intra-procedural CFG that represents the control-flow of a Stmt.
Definition CFG.h:1250
Decl - This represents one declaration (or definition), e.g.
Definition DeclBase.h:86
This represents one expression.
Definition Expr.h:112
It wraps the AnalysisDeclContext to represent both the call stack with the help of StackFrameContext ...
const Decl * getDecl() const
const ParentMap & getParentMap() const
const StackFrameContext * getStackFrame() const
const LocationContext * getLocationContext() const
It represents a stack frame of the call stack (based on CallEvent).
Stmt - This represents one statement.
Definition Stmt.h:86
std::unique_ptr< ExplodedGraph > trim(ArrayRef< const NodeTy * > Nodes, InterExplodedGraphMap *ForwardMap=nullptr, InterExplodedGraphMap *InverseMap=nullptr) const
Creates a trimmed version of the graph that only contains paths leading to the given nodes.
BumpVectorContext & getNodeAllocator()
std::vector< ExplodedNode * > NodeVector
unsigned ReclaimCounter
Counter to determine when to reclaim nodes.
void reserve(unsigned NodeCount)
NodeVector ChangedNodes
A list of recently allocated nodes that can potentially be recycled.
int64_t NumNodes
NumNodes - The number of nodes in the graph.
void enableNodeReclamation(unsigned Interval)
Enable tracking of recently allocated nodes for potential reclamation when calling reclaimRecentlyAll...
unsigned ReclaimNodeInterval
Determines how often nodes are reclaimed.
NodeVector EndNodes
The nodes in the simulation graph which have been specially marked as the endpoint of an abstract sim...
NodeVector::iterator eop_iterator
llvm::iterator_range< const_node_iterator > nodes() const
void reclaimRecentlyAllocatedNodes()
Reclaim "uninteresting" nodes created since the last time this method was called.
static bool isInterestingLValueExpr(const Expr *Ex)
Returns true if nodes for the given expression kind are always kept around.
AllNodesTy::const_iterator const_node_iterator
llvm::BumpPtrAllocator & getAllocator()
AllNodesTy::iterator node_iterator
llvm::FoldingSet< ExplodedNode > AllNodesTy
ExplodedNode * getNode(const ProgramPoint &L, ProgramStateRef State, bool IsSink=false, bool *IsNew=nullptr)
Retrieve the node associated with a (Location, State) pair, where the 'Location' is a ProgramPoint in...
const_eop_iterator eop_begin() const
NodeVector::const_iterator const_eop_iterator
BumpVectorContext BVC
BVC - Allocator and context for allocating nodes and their predecessor and successor groups.
llvm::iterator_range< node_iterator > nodes()
ExplodedNode * getRoot() const
Get the root node of the graph.
void designateAsRoot(ExplodedNode *V)
Mark a node as the root of the graph.
ExplodedNode * createUncachedNode(const ProgramPoint &L, ProgramStateRef State, int64_t Id, bool IsSink=false)
Create a node for a (Location, State) pair, but don't store it for deduplication later.
llvm::FoldingSet< ExplodedNode > Nodes
Nodes - The nodes in the graph.
llvm::DenseMap< const ExplodedNode *, ExplodedNode * > NodeMap
ExplodedNode * Root
The root of the simulation graph.
ExplodedNode * addEndOfPath(ExplodedNode *V)
addEndOfPath - Add an untyped node to the set of EOP nodes.
NodeVector FreeNodes
A list of nodes that can be reused.
const_eop_iterator eop_end() const
bool erase(ExplodedNode *N)
ExplodedNodeSet(ExplodedNode *N)
ImplTy::const_iterator const_iterator
void insert(const ExplodedNodeSet &S)
const_iterator end() const
void Add(ExplodedNode *N)
const_iterator begin() const
const CFGBlock * getCFGBlock() const
llvm::iterator_range< pred_iterator > pred_range
const ProgramStateRef & getState() const
llvm::iterator_range< const_succ_iterator > const_succ_range
const_pred_iterator pred_begin() const
const Stmt * getStmtForDiagnostics() const
If the node's program point corresponds to a statement, retrieve that statement.
const_succ_iterator succ_begin() const
llvm::iterator_range< succ_iterator > succ_range
bool isTrivial() const
The node is trivial if it has only one successor, only one predecessor, it's predecessor has only one...
const Stmt * getPreviousStmtForDiagnostics() const
Find the statement that was executed immediately before this node.
void Profile(llvm::FoldingSetNodeID &ID) const
ProgramPoint getLocation() const
getLocation - Returns the edge associated with the given node.
void addPredecessor(ExplodedNode *V, ExplodedGraph &G)
addPredeccessor - Adds a predecessor to the current node, and in tandem add this node as a successor ...
llvm::iterator_range< const_pred_iterator > const_pred_range
ExplodedNode * getFirstSucc()
friend class IndirectGotoNodeBuilder
unsigned pred_size() const
static void Profile(llvm::FoldingSetNodeID &ID, const ProgramPoint &Loc, const ProgramStateRef &state, bool IsSink)
const ExplodedNode * getFirstSucc() const
ExplodedNode(const ProgramPoint &loc, ProgramStateRef state, int64_t Id, bool IsSink)
const_succ_range succs() const
const Stmt * getNextStmtForDiagnostics() const
Find the next statement that was executed on this node's execution path.
const StackFrameContext * getStackFrame() const
ExplodedNode *const * succ_iterator
const ExplodedNode * getFirstPred() const
const_pred_range preds() const
const ParentMap & getParentMap() const
SVal getSVal(const Stmt *S) const
Get the value of an arbitrary expression at this node.
const LocationContext * getLocationContext() const
std::optional< T > getLocationAs() const &
const Stmt * getCurrentOrPreviousStmtForDiagnostics() const
Find the statement that was executed at or immediately before this node.
const ExplodedNode *const * const_pred_iterator
ExplodedNode * getFirstPred()
const_succ_iterator succ_end() const
unsigned succ_size() const
ExplodedNode *const * pred_iterator
const ExplodedNode *const * const_succ_iterator
const Decl & getCodeDecl() const
const_pred_iterator pred_end() const
SVal - This represents a symbolic expression, which can be either an L-value or an R-value.
Definition SVals.h:56
llvm::DenseMap< const ExplodedNode *, const ExplodedNode * > InterExplodedGraphMap
IntrusiveRefCntPtr< const ProgramState > ProgramStateRef
const Fact * ProgramPoint
A ProgramPoint identifies a location in the CFG by pointing to a specific Fact.
Definition Facts.h:87
The JSON file list parser is used to communicate input to InstallAPI.
nullptr
This class represents a compute construct, representing a 'Kind' of ‘parallel’, 'serial',...
long int64_t
Diagnostic wrappers for TextAPI types for error reporting.
Definition Dominators.h:30
__UINTPTR_TYPE__ uintptr_t
An unsigned integer type with the property that any valid pointer to void can be converted to this ty...
static nodes_iterator nodes_end(const GraphTy G)
static nodes_iterator nodes_begin(const GraphTy G)
static ChildIteratorType child_end(NodeRef N)
clang::ento::ExplodedNode::succ_iterator ChildIteratorType
static NodeRef getEntryNode(const GraphTy G)
static ChildIteratorType child_begin(NodeRef N)