1 //==- UnreachableCodeChecker.cpp - Generalized dead code checker -*- C++ -*-==//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 // This file implements a generalized unreachable code checker using a
10 // path-sensitive analysis. We mark any path visited, and then walk the CFG as a
11 // post-analysis to determine what was never visited.
12 //
13 // A similar flow-sensitive only check exists in Analysis/ReachableCode.cpp
14 //===----------------------------------------------------------------------===//
15
16 #include "ClangSACheckers.h"
17 #include "clang/AST/ParentMap.h"
18 #include "clang/Basic/Builtins.h"
19 #include "clang/Basic/SourceManager.h"
20 #include "clang/StaticAnalyzer/Core/BugReporter/BugReporter.h"
21 #include "clang/StaticAnalyzer/Core/Checker.h"
22 #include "clang/StaticAnalyzer/Core/CheckerManager.h"
23 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
24 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerHelpers.h"
25 #include "clang/StaticAnalyzer/Core/PathSensitive/ExplodedGraph.h"
26 #include "clang/StaticAnalyzer/Core/PathSensitive/SVals.h"
27 #include "llvm/ADT/SmallSet.h"
28
// The number of CFGBlock IDs used as the size parameter of each llvm::SmallSet
// of block IDs. Two such sets are created for each function we analyze.
31 #define DEFAULT_CFGBLOCKS 256
32
33 using namespace clang;
34 using namespace ento;
35
36 namespace {
37 class UnreachableCodeChecker : public Checker<check::EndAnalysis> {
38 public:
39 void checkEndAnalysis(ExplodedGraph &G, BugReporter &B,
40 ExprEngine &Eng) const;
41 private:
42 typedef llvm::SmallSet<unsigned, DEFAULT_CFGBLOCKS> CFGBlocksSet;
43
44 static inline const Stmt *getUnreachableStmt(const CFGBlock *CB);
45 static void FindUnreachableEntryPoints(const CFGBlock *CB,
46 CFGBlocksSet &reachable,
47 CFGBlocksSet &visited);
48 static bool isInvalidPath(const CFGBlock *CB, const ParentMap &PM);
49 static inline bool isEmptyCFGBlock(const CFGBlock *CB);
50 };
51 }
52
checkEndAnalysis(ExplodedGraph & G,BugReporter & B,ExprEngine & Eng) const53 void UnreachableCodeChecker::checkEndAnalysis(ExplodedGraph &G,
54 BugReporter &B,
55 ExprEngine &Eng) const {
56 CFGBlocksSet reachable, visited;
57
58 if (Eng.hasWorkRemaining())
59 return;
60
61 const Decl *D = nullptr;
62 CFG *C = nullptr;
63 ParentMap *PM = nullptr;
64 const LocationContext *LC = nullptr;
65 // Iterate over ExplodedGraph
66 for (ExplodedGraph::node_iterator I = G.nodes_begin(), E = G.nodes_end();
67 I != E; ++I) {
68 const ProgramPoint &P = I->getLocation();
69 LC = P.getLocationContext();
70 if (!LC->inTopFrame())
71 continue;
72
73 if (!D)
74 D = LC->getAnalysisDeclContext()->getDecl();
75
76 // Save the CFG if we don't have it already
77 if (!C)
78 C = LC->getAnalysisDeclContext()->getUnoptimizedCFG();
79 if (!PM)
80 PM = &LC->getParentMap();
81
82 if (Optional<BlockEntrance> BE = P.getAs<BlockEntrance>()) {
83 const CFGBlock *CB = BE->getBlock();
84 reachable.insert(CB->getBlockID());
85 }
86 }
87
88 // Bail out if we didn't get the CFG or the ParentMap.
89 if (!D || !C || !PM)
90 return;
91
92 // Don't do anything for template instantiations. Proving that code
93 // in a template instantiation is unreachable means proving that it is
94 // unreachable in all instantiations.
95 if (const FunctionDecl *FD = dyn_cast<FunctionDecl>(D))
96 if (FD->isTemplateInstantiation())
97 return;
98
99 // Find CFGBlocks that were not covered by any node
100 for (CFG::const_iterator I = C->begin(), E = C->end(); I != E; ++I) {
101 const CFGBlock *CB = *I;
102 // Check if the block is unreachable
103 if (reachable.count(CB->getBlockID()))
104 continue;
105
106 // Check if the block is empty (an artificial block)
107 if (isEmptyCFGBlock(CB))
108 continue;
109
110 // Find the entry points for this block
111 if (!visited.count(CB->getBlockID()))
112 FindUnreachableEntryPoints(CB, reachable, visited);
113
114 // This block may have been pruned; check if we still want to report it
115 if (reachable.count(CB->getBlockID()))
116 continue;
117
118 // Check for false positives
119 if (CB->size() > 0 && isInvalidPath(CB, *PM))
120 continue;
121
122 // It is good practice to always have a "default" label in a "switch", even
123 // if we should never get there. It can be used to detect errors, for
124 // instance. Unreachable code directly under a "default" label is therefore
125 // likely to be a false positive.
126 if (const Stmt *label = CB->getLabel())
127 if (label->getStmtClass() == Stmt::DefaultStmtClass)
128 continue;
129
130 // Special case for __builtin_unreachable.
131 // FIXME: This should be extended to include other unreachable markers,
132 // such as llvm_unreachable.
133 if (!CB->empty()) {
134 bool foundUnreachable = false;
135 for (CFGBlock::const_iterator ci = CB->begin(), ce = CB->end();
136 ci != ce; ++ci) {
137 if (Optional<CFGStmt> S = (*ci).getAs<CFGStmt>())
138 if (const CallExpr *CE = dyn_cast<CallExpr>(S->getStmt())) {
139 if (CE->getBuiltinCallee() == Builtin::BI__builtin_unreachable) {
140 foundUnreachable = true;
141 break;
142 }
143 }
144 }
145 if (foundUnreachable)
146 continue;
147 }
148
149 // We found a block that wasn't covered - find the statement to report
150 SourceRange SR;
151 PathDiagnosticLocation DL;
152 SourceLocation SL;
153 if (const Stmt *S = getUnreachableStmt(CB)) {
154 SR = S->getSourceRange();
155 DL = PathDiagnosticLocation::createBegin(S, B.getSourceManager(), LC);
156 SL = DL.asLocation();
157 if (SR.isInvalid() || !SL.isValid())
158 continue;
159 }
160 else
161 continue;
162
163 // Check if the SourceLocation is in a system header
164 const SourceManager &SM = B.getSourceManager();
165 if (SM.isInSystemHeader(SL) || SM.isInExternCSystemHeader(SL))
166 continue;
167
168 B.EmitBasicReport(D, this, "Unreachable code", "Dead code",
169 "This statement is never executed", DL, SR);
170 }
171 }
172
173 // Recursively finds the entry point(s) for this dead CFGBlock.
FindUnreachableEntryPoints(const CFGBlock * CB,CFGBlocksSet & reachable,CFGBlocksSet & visited)174 void UnreachableCodeChecker::FindUnreachableEntryPoints(const CFGBlock *CB,
175 CFGBlocksSet &reachable,
176 CFGBlocksSet &visited) {
177 visited.insert(CB->getBlockID());
178
179 for (CFGBlock::const_pred_iterator I = CB->pred_begin(), E = CB->pred_end();
180 I != E; ++I) {
181 if (!*I)
182 continue;
183
184 if (!reachable.count((*I)->getBlockID())) {
185 // If we find an unreachable predecessor, mark this block as reachable so
186 // we don't report this block
187 reachable.insert(CB->getBlockID());
188 if (!visited.count((*I)->getBlockID()))
189 // If we haven't previously visited the unreachable predecessor, recurse
190 FindUnreachableEntryPoints(*I, reachable, visited);
191 }
192 }
193 }
194
195 // Find the Stmt* in a CFGBlock for reporting a warning
getUnreachableStmt(const CFGBlock * CB)196 const Stmt *UnreachableCodeChecker::getUnreachableStmt(const CFGBlock *CB) {
197 for (CFGBlock::const_iterator I = CB->begin(), E = CB->end(); I != E; ++I) {
198 if (Optional<CFGStmt> S = I->getAs<CFGStmt>())
199 return S->getStmt();
200 }
201 if (const Stmt *S = CB->getTerminator())
202 return S;
203 else
204 return nullptr;
205 }
206
207 // Determines if the path to this CFGBlock contained an element that infers this
208 // block is a false positive. We assume that FindUnreachableEntryPoints has
209 // already marked only the entry points to any dead code, so we need only to
210 // find the condition that led to this block (the predecessor of this block.)
211 // There will never be more than one predecessor.
isInvalidPath(const CFGBlock * CB,const ParentMap & PM)212 bool UnreachableCodeChecker::isInvalidPath(const CFGBlock *CB,
213 const ParentMap &PM) {
214 // We only expect a predecessor size of 0 or 1. If it is >1, then an external
215 // condition has broken our assumption (for example, a sink being placed by
216 // another check). In these cases, we choose not to report.
217 if (CB->pred_size() > 1)
218 return true;
219
220 // If there are no predecessors, then this block is trivially unreachable
221 if (CB->pred_size() == 0)
222 return false;
223
224 const CFGBlock *pred = *CB->pred_begin();
225 if (!pred)
226 return false;
227
228 // Get the predecessor block's terminator conditon
229 const Stmt *cond = pred->getTerminatorCondition();
230
231 //assert(cond && "CFGBlock's predecessor has a terminator condition");
232 // The previous assertion is invalid in some cases (eg do/while). Leaving
233 // reporting of these situations on at the moment to help triage these cases.
234 if (!cond)
235 return false;
236
237 // Run each of the checks on the conditions
238 if (containsMacro(cond) || containsEnum(cond)
239 || containsStaticLocal(cond) || containsBuiltinOffsetOf(cond)
240 || containsStmt<UnaryExprOrTypeTraitExpr>(cond))
241 return true;
242
243 return false;
244 }
245
246 // Returns true if the given CFGBlock is empty
isEmptyCFGBlock(const CFGBlock * CB)247 bool UnreachableCodeChecker::isEmptyCFGBlock(const CFGBlock *CB) {
248 return CB->getLabel() == nullptr // No labels
249 && CB->size() == 0 // No statements
250 && !CB->getTerminator(); // No terminator
251 }
252
registerUnreachableCodeChecker(CheckerManager & mgr)253 void ento::registerUnreachableCodeChecker(CheckerManager &mgr) {
254 mgr.registerChecker<UnreachableCodeChecker>();
255 }
256