clang 19.0.0git
UnreachableCodeChecker.cpp
Go to the documentation of this file.
1//==- UnreachableCodeChecker.cpp - Generalized dead code checker -*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8// This file implements a generalized unreachable code checker using a
9// path-sensitive analysis. We mark any path visited, and then walk the CFG as a
10// post-analysis to determine what was never visited.
11//
12// A similar flow-sensitive only check exists in Analysis/ReachableCode.cpp
13//===----------------------------------------------------------------------===//
14
#include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h"
#include "clang/AST/ParentMap.h"
#include "clang/Basic/Builtins.h"
#include "clang/Basic/SourceManager.h"
#include "clang/StaticAnalyzer/Core/BugReporter/BugReporter.h"
#include "clang/StaticAnalyzer/Core/Checker.h"
#include "clang/StaticAnalyzer/Core/CheckerManager.h"
#include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
#include "clang/StaticAnalyzer/Core/PathSensitive/CheckerHelpers.h"
#include "clang/StaticAnalyzer/Core/PathSensitive/ExplodedGraph.h"
#include "clang/StaticAnalyzer/Core/PathSensitive/SVals.h"
#include "llvm/ADT/SmallSet.h"
#include <optional>
28
29using namespace clang;
30using namespace ento;
31
32namespace {
33class UnreachableCodeChecker : public Checker<check::EndAnalysis> {
34public:
35 void checkEndAnalysis(ExplodedGraph &G, BugReporter &B,
36 ExprEngine &Eng) const;
37private:
38 typedef llvm::SmallSet<unsigned, 32> CFGBlocksSet;
39
40 static inline const Stmt *getUnreachableStmt(const CFGBlock *CB);
41 static void FindUnreachableEntryPoints(const CFGBlock *CB,
42 CFGBlocksSet &reachable,
43 CFGBlocksSet &visited);
44 static bool isInvalidPath(const CFGBlock *CB, const ParentMap &PM);
45 static inline bool isEmptyCFGBlock(const CFGBlock *CB);
46};
47}
48
49void UnreachableCodeChecker::checkEndAnalysis(ExplodedGraph &G,
50 BugReporter &B,
51 ExprEngine &Eng) const {
52 CFGBlocksSet reachable, visited;
53
54 if (Eng.hasWorkRemaining())
55 return;
56
57 const Decl *D = nullptr;
58 CFG *C = nullptr;
59 const ParentMap *PM = nullptr;
60 const LocationContext *LC = nullptr;
61 // Iterate over ExplodedGraph
62 for (const ExplodedNode &N : G.nodes()) {
63 const ProgramPoint &P = N.getLocation();
64 LC = P.getLocationContext();
65 if (!LC->inTopFrame())
66 continue;
67
68 if (!D)
70
71 // Save the CFG if we don't have it already
72 if (!C)
74 if (!PM)
75 PM = &LC->getParentMap();
76
77 if (std::optional<BlockEntrance> BE = P.getAs<BlockEntrance>()) {
78 const CFGBlock *CB = BE->getBlock();
79 reachable.insert(CB->getBlockID());
80 }
81 }
82
83 // Bail out if we didn't get the CFG or the ParentMap.
84 if (!D || !C || !PM)
85 return;
86
87 // Don't do anything for template instantiations. Proving that code
88 // in a template instantiation is unreachable means proving that it is
89 // unreachable in all instantiations.
90 if (const FunctionDecl *FD = dyn_cast<FunctionDecl>(D))
91 if (FD->isTemplateInstantiation())
92 return;
93
94 // Find CFGBlocks that were not covered by any node
95 for (const CFGBlock *CB : *C) {
96 // Check if the block is unreachable
97 if (reachable.count(CB->getBlockID()))
98 continue;
99
100 // Check if the block is empty (an artificial block)
101 if (isEmptyCFGBlock(CB))
102 continue;
103
104 // Find the entry points for this block
105 if (!visited.count(CB->getBlockID()))
106 FindUnreachableEntryPoints(CB, reachable, visited);
107
108 // This block may have been pruned; check if we still want to report it
109 if (reachable.count(CB->getBlockID()))
110 continue;
111
112 // Check for false positives
113 if (isInvalidPath(CB, *PM))
114 continue;
115
116 // It is good practice to always have a "default" label in a "switch", even
117 // if we should never get there. It can be used to detect errors, for
118 // instance. Unreachable code directly under a "default" label is therefore
119 // likely to be a false positive.
120 if (const Stmt *label = CB->getLabel())
121 if (label->getStmtClass() == Stmt::DefaultStmtClass)
122 continue;
123
124 // Special case for __builtin_unreachable.
125 // FIXME: This should be extended to include other unreachable markers,
126 // such as llvm_unreachable.
127 if (!CB->empty()) {
128 bool foundUnreachable = false;
129 for (CFGBlock::const_iterator ci = CB->begin(), ce = CB->end();
130 ci != ce; ++ci) {
131 if (std::optional<CFGStmt> S = (*ci).getAs<CFGStmt>())
132 if (const CallExpr *CE = dyn_cast<CallExpr>(S->getStmt())) {
133 if (CE->getBuiltinCallee() == Builtin::BI__builtin_unreachable ||
134 CE->isBuiltinAssumeFalse(Eng.getContext())) {
135 foundUnreachable = true;
136 break;
137 }
138 }
139 }
140 if (foundUnreachable)
141 continue;
142 }
143
144 // We found a block that wasn't covered - find the statement to report
145 SourceRange SR;
148 if (const Stmt *S = getUnreachableStmt(CB)) {
149 // In macros, 'do {...} while (0)' is often used. Don't warn about the
150 // condition 0 when it is unreachable.
151 if (S->getBeginLoc().isMacroID())
152 if (const auto *I = dyn_cast<IntegerLiteral>(S))
153 if (I->getValue() == 0ULL)
154 if (const Stmt *Parent = PM->getParent(S))
155 if (isa<DoStmt>(Parent))
156 continue;
157 SR = S->getSourceRange();
159 SL = DL.asLocation();
160 if (SR.isInvalid() || !SL.isValid())
161 continue;
162 }
163 else
164 continue;
165
166 // Check if the SourceLocation is in a system header
167 const SourceManager &SM = B.getSourceManager();
168 if (SM.isInSystemHeader(SL) || SM.isInExternCSystemHeader(SL))
169 continue;
170
171 B.EmitBasicReport(D, this, "Unreachable code", categories::UnusedCode,
172 "This statement is never executed", DL, SR);
173 }
174}
175
176// Recursively finds the entry point(s) for this dead CFGBlock.
177void UnreachableCodeChecker::FindUnreachableEntryPoints(const CFGBlock *CB,
178 CFGBlocksSet &reachable,
179 CFGBlocksSet &visited) {
180 visited.insert(CB->getBlockID());
181
182 for (const CFGBlock *PredBlock : CB->preds()) {
183 if (!PredBlock)
184 continue;
185
186 if (!reachable.count(PredBlock->getBlockID())) {
187 // If we find an unreachable predecessor, mark this block as reachable so
188 // we don't report this block
189 reachable.insert(CB->getBlockID());
190 if (!visited.count(PredBlock->getBlockID()))
191 // If we haven't previously visited the unreachable predecessor, recurse
192 FindUnreachableEntryPoints(PredBlock, reachable, visited);
193 }
194 }
195}
196
197// Find the Stmt* in a CFGBlock for reporting a warning
198const Stmt *UnreachableCodeChecker::getUnreachableStmt(const CFGBlock *CB) {
199 for (const CFGElement &Elem : *CB) {
200 if (std::optional<CFGStmt> S = Elem.getAs<CFGStmt>()) {
201 if (!isa<DeclStmt>(S->getStmt()))
202 return S->getStmt();
203 }
204 }
205 return CB->getTerminatorStmt();
206}
207
208// Determines if the path to this CFGBlock contained an element that infers this
209// block is a false positive. We assume that FindUnreachableEntryPoints has
210// already marked only the entry points to any dead code, so we need only to
211// find the condition that led to this block (the predecessor of this block.)
212// There will never be more than one predecessor.
213bool UnreachableCodeChecker::isInvalidPath(const CFGBlock *CB,
214 const ParentMap &PM) {
215 // We only expect a predecessor size of 0 or 1. If it is >1, then an external
216 // condition has broken our assumption (for example, a sink being placed by
217 // another check). In these cases, we choose not to report.
218 if (CB->pred_size() > 1)
219 return true;
220
221 // If there are no predecessors, then this block is trivially unreachable
222 if (CB->pred_size() == 0)
223 return false;
224
225 const CFGBlock *pred = *CB->pred_begin();
226 if (!pred)
227 return false;
228
229 // Get the predecessor block's terminator condition
230 const Stmt *cond = pred->getTerminatorCondition();
231
232 //assert(cond && "CFGBlock's predecessor has a terminator condition");
233 // The previous assertion is invalid in some cases (eg do/while). Leaving
234 // reporting of these situations on at the moment to help triage these cases.
235 if (!cond)
236 return false;
237
238 // Run each of the checks on the conditions
239 return containsMacro(cond) || containsEnum(cond) ||
241 containsStmt<UnaryExprOrTypeTraitExpr>(cond);
242}
243
244// Returns true if the given CFGBlock is empty
245bool UnreachableCodeChecker::isEmptyCFGBlock(const CFGBlock *CB) {
246 return CB->getLabel() == nullptr // No labels
247 && CB->size() == 0 // No statements
248 && !CB->getTerminatorStmt(); // No terminator
249}
250
251void ento::registerUnreachableCodeChecker(CheckerManager &mgr) {
252 mgr.registerChecker<UnreachableCodeChecker>();
253}
254
255bool ento::shouldRegisterUnreachableCodeChecker(const CheckerManager &mgr) {
256 return true;
257}
NodeId Parent
Definition: ASTDiff.cpp:191
StringRef P
#define SM(sm)
Definition: Cuda.cpp:82
Defines enum values for all the target-independent builtin functions.
Defines the SourceManager interface.
const Decl * getDecl() const
Represents a single basic block in a source-level CFG.
Definition: CFG.h:604
ElementList::const_iterator const_iterator
Definition: CFG.h:895
unsigned size() const
Definition: CFG.h:946
iterator begin()
Definition: CFG.h:904
bool empty() const
Definition: CFG.h:947
Stmt * getLabel()
Definition: CFG.h:1100
Stmt * getTerminatorStmt()
Definition: CFG.h:1081
unsigned pred_size() const
Definition: CFG.h:1005
pred_iterator pred_begin()
Definition: CFG.h:966
iterator end()
Definition: CFG.h:905
pred_range preds()
Definition: CFG.h:976
unsigned getBlockID() const
Definition: CFG.h:1105
Stmt * getTerminatorCondition(bool StripParens=true)
Definition: CFG.cpp:6263
Represents a top-level expression in a basic block.
Definition: CFG.h:55
Represents a source-level, intra-procedural CFG that represents the control-flow of a Stmt.
Definition: CFG.h:1214
CallExpr - Represents a function call (C99 6.5.2.2, C++ [expr.call]).
Definition: Expr.h:2820
Decl - This represents one declaration (or definition), e.g.
Definition: DeclBase.h:85
Represents a function declaration or definition.
Definition: Decl.h:1971
It wraps the AnalysisDeclContext to represent both the call stack with the help of StackFrameContext ...
const ParentMap & getParentMap() const
LLVM_ATTRIBUTE_RETURNS_NONNULL AnalysisDeclContext * getAnalysisDeclContext() const
virtual bool inTopFrame() const
Stmt * getParent(Stmt *) const
Definition: ParentMap.cpp:136
Encodes a location in the source.
bool isValid() const
Return true if this is a valid SourceLocation object.
This class handles loading and caching of source files into memory.
A trivial tuple used to represent a source range.
bool isInvalid() const
Stmt - This represents one statement.
Definition: Stmt.h:84
BugReporter is a utility class for generating PathDiagnostics for analysis.
Definition: BugReporter.h:585
const SourceManager & getSourceManager()
Definition: BugReporter.h:623
void EmitBasicReport(const Decl *DeclWithIssue, const CheckerBase *Checker, StringRef BugName, StringRef BugCategory, StringRef BugStr, PathDiagnosticLocation Loc, ArrayRef< SourceRange > Ranges=std::nullopt, ArrayRef< FixItHint > Fixits=std::nullopt)
CHECKER * registerChecker(AT &&... Args)
Used to register checkers.
llvm::iterator_range< node_iterator > nodes()
bool hasWorkRemaining() const
Definition: ExprEngine.h:431
ASTContext & getContext() const
getContext - Return the ASTContext associated with this analysis.
Definition: ExprEngine.h:196
static PathDiagnosticLocation createBegin(const Decl *D, const SourceManager &SM)
Create a location for the beginning of the declaration.
bool containsEnum(const Stmt *S)
bool containsStaticLocal(const Stmt *S)
bool containsBuiltinOffsetOf(const Stmt *S)
bool containsMacro(const Stmt *S)
The JSON file list parser is used to communicate input to InstallAPI.