1 //==- UninitializedValues.cpp - Find Uninitialized Values -------*- C++ --*-==//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements uninitialized values analysis for source-level CFGs.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "clang/AST/ASTContext.h"
15 #include "clang/AST/Attr.h"
16 #include "clang/AST/Decl.h"
17 #include "clang/AST/DeclCXX.h"
18 #include "clang/AST/StmtVisitor.h"
19 #include "clang/Analysis/Analyses/PostOrderCFGView.h"
20 #include "clang/Analysis/Analyses/UninitializedValues.h"
21 #include "clang/Analysis/AnalysisContext.h"
22 #include "clang/Analysis/CFG.h"
23 #include "clang/Analysis/DomainSpecific/ObjCNoReturn.h"
24 #include "llvm/ADT/DenseMap.h"
25 #include "llvm/ADT/Optional.h"
26 #include "llvm/ADT/PackedVector.h"
27 #include "llvm/ADT/SmallBitVector.h"
28 #include "llvm/ADT/SmallVector.h"
29 #include "llvm/Support/SaveAndRestore.h"
30 #include <utility>
31 
32 using namespace clang;
33 
34 #define DEBUG_LOGGING 0
35 
isTrackedVar(const VarDecl * vd,const DeclContext * dc)36 static bool isTrackedVar(const VarDecl *vd, const DeclContext *dc) {
37   if (vd->isLocalVarDecl() && !vd->hasGlobalStorage() &&
38       !vd->isExceptionVariable() && !vd->isInitCapture() &&
39       !vd->isImplicit() && vd->getDeclContext() == dc) {
40     QualType ty = vd->getType();
41     return ty->isScalarType() || ty->isVectorType() || ty->isRecordType();
42   }
43   return false;
44 }
45 
46 //------------------------------------------------------------------------====//
47 // DeclToIndex: a mapping from Decls we track to value indices.
48 //====------------------------------------------------------------------------//
49 
50 namespace {
51 class DeclToIndex {
52   llvm::DenseMap<const VarDecl *, unsigned> map;
53 public:
DeclToIndex()54   DeclToIndex() {}
55 
56   /// Compute the actual mapping from declarations to bits.
57   void computeMap(const DeclContext &dc);
58 
59   /// Return the number of declarations in the map.
size() const60   unsigned size() const { return map.size(); }
61 
62   /// Returns the bit vector index for a given declaration.
63   Optional<unsigned> getValueIndex(const VarDecl *d) const;
64 };
65 }
66 
computeMap(const DeclContext & dc)67 void DeclToIndex::computeMap(const DeclContext &dc) {
68   unsigned count = 0;
69   DeclContext::specific_decl_iterator<VarDecl> I(dc.decls_begin()),
70                                                E(dc.decls_end());
71   for ( ; I != E; ++I) {
72     const VarDecl *vd = *I;
73     if (isTrackedVar(vd, &dc))
74       map[vd] = count++;
75   }
76 }
77 
getValueIndex(const VarDecl * d) const78 Optional<unsigned> DeclToIndex::getValueIndex(const VarDecl *d) const {
79   llvm::DenseMap<const VarDecl *, unsigned>::const_iterator I = map.find(d);
80   if (I == map.end())
81     return None;
82   return I->second;
83 }
84 
85 //------------------------------------------------------------------------====//
86 // CFGBlockValues: dataflow values for CFG blocks.
87 //====------------------------------------------------------------------------//
88 
// Dataflow values for a single tracked variable. The encodings are chosen so
// that merging two values is simply the bitwise OR of their encodings.
enum Value {
  Unknown = 0x0,         // 00
  Initialized = 0x1,     // 01
  Uninitialized = 0x2,   // 10
  MayUninitialized = 0x3 // 11
};
95 
isUninitialized(const Value v)96 static bool isUninitialized(const Value v) {
97   return v >= Uninitialized;
98 }
isAlwaysUninit(const Value v)99 static bool isAlwaysUninit(const Value v) {
100   return v == Uninitialized;
101 }
102 
103 namespace {
104 
105 typedef llvm::PackedVector<Value, 2, llvm::SmallBitVector> ValueVector;
106 
107 class CFGBlockValues {
108   const CFG &cfg;
109   SmallVector<ValueVector, 8> vals;
110   ValueVector scratch;
111   DeclToIndex declToIndex;
112 public:
113   CFGBlockValues(const CFG &cfg);
114 
getNumEntries() const115   unsigned getNumEntries() const { return declToIndex.size(); }
116 
117   void computeSetOfDeclarations(const DeclContext &dc);
getValueVector(const CFGBlock * block)118   ValueVector &getValueVector(const CFGBlock *block) {
119     return vals[block->getBlockID()];
120   }
121 
122   void setAllScratchValues(Value V);
123   void mergeIntoScratch(ValueVector const &source, bool isFirst);
124   bool updateValueVectorWithScratch(const CFGBlock *block);
125 
hasNoDeclarations() const126   bool hasNoDeclarations() const {
127     return declToIndex.size() == 0;
128   }
129 
130   void resetScratch();
131 
132   ValueVector::reference operator[](const VarDecl *vd);
133 
getValue(const CFGBlock * block,const CFGBlock * dstBlock,const VarDecl * vd)134   Value getValue(const CFGBlock *block, const CFGBlock *dstBlock,
135                  const VarDecl *vd) {
136     const Optional<unsigned> &idx = declToIndex.getValueIndex(vd);
137     assert(idx.hasValue());
138     return getValueVector(block)[idx.getValue()];
139   }
140 };
141 } // end anonymous namespace
142 
CFGBlockValues(const CFG & c)143 CFGBlockValues::CFGBlockValues(const CFG &c) : cfg(c), vals(0) {}
144 
computeSetOfDeclarations(const DeclContext & dc)145 void CFGBlockValues::computeSetOfDeclarations(const DeclContext &dc) {
146   declToIndex.computeMap(dc);
147   unsigned decls = declToIndex.size();
148   scratch.resize(decls);
149   unsigned n = cfg.getNumBlockIDs();
150   if (!n)
151     return;
152   vals.resize(n);
153   for (unsigned i = 0; i < n; ++i)
154     vals[i].resize(decls);
155 }
156 
157 #if DEBUG_LOGGING
printVector(const CFGBlock * block,ValueVector & bv,unsigned num)158 static void printVector(const CFGBlock *block, ValueVector &bv,
159                         unsigned num) {
160   llvm::errs() << block->getBlockID() << " :";
161   for (unsigned i = 0; i < bv.size(); ++i) {
162     llvm::errs() << ' ' << bv[i];
163   }
164   llvm::errs() << " : " << num << '\n';
165 }
166 #endif
167 
setAllScratchValues(Value V)168 void CFGBlockValues::setAllScratchValues(Value V) {
169   for (unsigned I = 0, E = scratch.size(); I != E; ++I)
170     scratch[I] = V;
171 }
172 
mergeIntoScratch(ValueVector const & source,bool isFirst)173 void CFGBlockValues::mergeIntoScratch(ValueVector const &source,
174                                       bool isFirst) {
175   if (isFirst)
176     scratch = source;
177   else
178     scratch |= source;
179 }
180 
updateValueVectorWithScratch(const CFGBlock * block)181 bool CFGBlockValues::updateValueVectorWithScratch(const CFGBlock *block) {
182   ValueVector &dst = getValueVector(block);
183   bool changed = (dst != scratch);
184   if (changed)
185     dst = scratch;
186 #if DEBUG_LOGGING
187   printVector(block, scratch, 0);
188 #endif
189   return changed;
190 }
191 
resetScratch()192 void CFGBlockValues::resetScratch() {
193   scratch.reset();
194 }
195 
operator [](const VarDecl * vd)196 ValueVector::reference CFGBlockValues::operator[](const VarDecl *vd) {
197   const Optional<unsigned> &idx = declToIndex.getValueIndex(vd);
198   assert(idx.hasValue());
199   return scratch[idx.getValue()];
200 }
201 
202 //------------------------------------------------------------------------====//
203 // Worklist: worklist for dataflow analysis.
204 //====------------------------------------------------------------------------//
205 
206 namespace {
207 class DataflowWorklist {
208   PostOrderCFGView::iterator PO_I, PO_E;
209   SmallVector<const CFGBlock *, 20> worklist;
210   llvm::BitVector enqueuedBlocks;
211 public:
DataflowWorklist(const CFG & cfg,PostOrderCFGView & view)212   DataflowWorklist(const CFG &cfg, PostOrderCFGView &view)
213     : PO_I(view.begin()), PO_E(view.end()),
214       enqueuedBlocks(cfg.getNumBlockIDs(), true) {
215         // Treat the first block as already analyzed.
216         if (PO_I != PO_E) {
217           assert(*PO_I == &cfg.getEntry());
218           enqueuedBlocks[(*PO_I)->getBlockID()] = false;
219           ++PO_I;
220         }
221       }
222 
223   void enqueueSuccessors(const CFGBlock *block);
224   const CFGBlock *dequeue();
225 };
226 }
227 
enqueueSuccessors(const clang::CFGBlock * block)228 void DataflowWorklist::enqueueSuccessors(const clang::CFGBlock *block) {
229   for (CFGBlock::const_succ_iterator I = block->succ_begin(),
230        E = block->succ_end(); I != E; ++I) {
231     const CFGBlock *Successor = *I;
232     if (!Successor || enqueuedBlocks[Successor->getBlockID()])
233       continue;
234     worklist.push_back(Successor);
235     enqueuedBlocks[Successor->getBlockID()] = true;
236   }
237 }
238 
dequeue()239 const CFGBlock *DataflowWorklist::dequeue() {
240   const CFGBlock *B = nullptr;
241 
242   // First dequeue from the worklist.  This can represent
243   // updates along backedges that we want propagated as quickly as possible.
244   if (!worklist.empty())
245     B = worklist.pop_back_val();
246 
247   // Next dequeue from the initial reverse post order.  This is the
248   // theoretical ideal in the presence of no back edges.
249   else if (PO_I != PO_E) {
250     B = *PO_I;
251     ++PO_I;
252   }
253   else {
254     return nullptr;
255   }
256 
257   assert(enqueuedBlocks[B->getBlockID()] == true);
258   enqueuedBlocks[B->getBlockID()] = false;
259   return B;
260 }
261 
262 //------------------------------------------------------------------------====//
263 // Classification of DeclRefExprs as use or initialization.
264 //====------------------------------------------------------------------------//
265 
266 namespace {
267 class FindVarResult {
268   const VarDecl *vd;
269   const DeclRefExpr *dr;
270 public:
FindVarResult(const VarDecl * vd,const DeclRefExpr * dr)271   FindVarResult(const VarDecl *vd, const DeclRefExpr *dr) : vd(vd), dr(dr) {}
272 
getDeclRefExpr() const273   const DeclRefExpr *getDeclRefExpr() const { return dr; }
getDecl() const274   const VarDecl *getDecl() const { return vd; }
275 };
276 
stripCasts(ASTContext & C,const Expr * Ex)277 static const Expr *stripCasts(ASTContext &C, const Expr *Ex) {
278   while (Ex) {
279     Ex = Ex->IgnoreParenNoopCasts(C);
280     if (const CastExpr *CE = dyn_cast<CastExpr>(Ex)) {
281       if (CE->getCastKind() == CK_LValueBitCast) {
282         Ex = CE->getSubExpr();
283         continue;
284       }
285     }
286     break;
287   }
288   return Ex;
289 }
290 
291 /// If E is an expression comprising a reference to a single variable, find that
292 /// variable.
findVar(const Expr * E,const DeclContext * DC)293 static FindVarResult findVar(const Expr *E, const DeclContext *DC) {
294   if (const DeclRefExpr *DRE =
295         dyn_cast<DeclRefExpr>(stripCasts(DC->getParentASTContext(), E)))
296     if (const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl()))
297       if (isTrackedVar(VD, DC))
298         return FindVarResult(VD, DRE);
299   return FindVarResult(nullptr, nullptr);
300 }
301 
302 /// \brief Classify each DeclRefExpr as an initialization or a use. Any
303 /// DeclRefExpr which isn't explicitly classified will be assumed to have
304 /// escaped the analysis and will be treated as an initialization.
305 class ClassifyRefs : public StmtVisitor<ClassifyRefs> {
306 public:
307   enum Class {
308     Init,
309     Use,
310     SelfInit,
311     Ignore
312   };
313 
314 private:
315   const DeclContext *DC;
316   llvm::DenseMap<const DeclRefExpr*, Class> Classification;
317 
isTrackedVar(const VarDecl * VD) const318   bool isTrackedVar(const VarDecl *VD) const {
319     return ::isTrackedVar(VD, DC);
320   }
321 
322   void classify(const Expr *E, Class C);
323 
324 public:
ClassifyRefs(AnalysisDeclContext & AC)325   ClassifyRefs(AnalysisDeclContext &AC) : DC(cast<DeclContext>(AC.getDecl())) {}
326 
327   void VisitDeclStmt(DeclStmt *DS);
328   void VisitUnaryOperator(UnaryOperator *UO);
329   void VisitBinaryOperator(BinaryOperator *BO);
330   void VisitCallExpr(CallExpr *CE);
331   void VisitCastExpr(CastExpr *CE);
332 
operator ()(Stmt * S)333   void operator()(Stmt *S) { Visit(S); }
334 
get(const DeclRefExpr * DRE) const335   Class get(const DeclRefExpr *DRE) const {
336     llvm::DenseMap<const DeclRefExpr*, Class>::const_iterator I
337         = Classification.find(DRE);
338     if (I != Classification.end())
339       return I->second;
340 
341     const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl());
342     if (!VD || !isTrackedVar(VD))
343       return Ignore;
344 
345     return Init;
346   }
347 };
348 }
349 
getSelfInitExpr(VarDecl * VD)350 static const DeclRefExpr *getSelfInitExpr(VarDecl *VD) {
351   if (VD->getType()->isRecordType()) return nullptr;
352   if (Expr *Init = VD->getInit()) {
353     const DeclRefExpr *DRE
354       = dyn_cast<DeclRefExpr>(stripCasts(VD->getASTContext(), Init));
355     if (DRE && DRE->getDecl() == VD)
356       return DRE;
357   }
358   return nullptr;
359 }
360 
classify(const Expr * E,Class C)361 void ClassifyRefs::classify(const Expr *E, Class C) {
362   // The result of a ?: could also be an lvalue.
363   E = E->IgnoreParens();
364   if (const ConditionalOperator *CO = dyn_cast<ConditionalOperator>(E)) {
365     classify(CO->getTrueExpr(), C);
366     classify(CO->getFalseExpr(), C);
367     return;
368   }
369 
370   if (const BinaryConditionalOperator *BCO =
371           dyn_cast<BinaryConditionalOperator>(E)) {
372     classify(BCO->getFalseExpr(), C);
373     return;
374   }
375 
376   if (const OpaqueValueExpr *OVE = dyn_cast<OpaqueValueExpr>(E)) {
377     classify(OVE->getSourceExpr(), C);
378     return;
379   }
380 
381   if (const MemberExpr *ME = dyn_cast<MemberExpr>(E)) {
382     if (VarDecl *VD = dyn_cast<VarDecl>(ME->getMemberDecl())) {
383       if (!VD->isStaticDataMember())
384         classify(ME->getBase(), C);
385     }
386     return;
387   }
388 
389   if (const BinaryOperator *BO = dyn_cast<BinaryOperator>(E)) {
390     switch (BO->getOpcode()) {
391     case BO_PtrMemD:
392     case BO_PtrMemI:
393       classify(BO->getLHS(), C);
394       return;
395     case BO_Comma:
396       classify(BO->getRHS(), C);
397       return;
398     default:
399       return;
400     }
401   }
402 
403   FindVarResult Var = findVar(E, DC);
404   if (const DeclRefExpr *DRE = Var.getDeclRefExpr())
405     Classification[DRE] = std::max(Classification[DRE], C);
406 }
407 
VisitDeclStmt(DeclStmt * DS)408 void ClassifyRefs::VisitDeclStmt(DeclStmt *DS) {
409   for (auto *DI : DS->decls()) {
410     VarDecl *VD = dyn_cast<VarDecl>(DI);
411     if (VD && isTrackedVar(VD))
412       if (const DeclRefExpr *DRE = getSelfInitExpr(VD))
413         Classification[DRE] = SelfInit;
414   }
415 }
416 
VisitBinaryOperator(BinaryOperator * BO)417 void ClassifyRefs::VisitBinaryOperator(BinaryOperator *BO) {
418   // Ignore the evaluation of a DeclRefExpr on the LHS of an assignment. If this
419   // is not a compound-assignment, we will treat it as initializing the variable
420   // when TransferFunctions visits it. A compound-assignment does not affect
421   // whether a variable is uninitialized, and there's no point counting it as a
422   // use.
423   if (BO->isCompoundAssignmentOp())
424     classify(BO->getLHS(), Use);
425   else if (BO->getOpcode() == BO_Assign || BO->getOpcode() == BO_Comma)
426     classify(BO->getLHS(), Ignore);
427 }
428 
VisitUnaryOperator(UnaryOperator * UO)429 void ClassifyRefs::VisitUnaryOperator(UnaryOperator *UO) {
430   // Increment and decrement are uses despite there being no lvalue-to-rvalue
431   // conversion.
432   if (UO->isIncrementDecrementOp())
433     classify(UO->getSubExpr(), Use);
434 }
435 
isPointerToConst(const QualType & QT)436 static bool isPointerToConst(const QualType &QT) {
437   return QT->isAnyPointerType() && QT->getPointeeType().isConstQualified();
438 }
439 
VisitCallExpr(CallExpr * CE)440 void ClassifyRefs::VisitCallExpr(CallExpr *CE) {
441   // Classify arguments to std::move as used.
442   if (CE->getNumArgs() == 1) {
443     if (FunctionDecl *FD = CE->getDirectCallee()) {
444       if (FD->isInStdNamespace() && FD->getIdentifier() &&
445           FD->getIdentifier()->isStr("move")) {
446         // RecordTypes are handled in SemaDeclCXX.cpp.
447         if (!CE->getArg(0)->getType()->isRecordType())
448           classify(CE->getArg(0), Use);
449         return;
450       }
451     }
452   }
453 
454   // If a value is passed by const pointer or by const reference to a function,
455   // we should not assume that it is initialized by the call, and we
456   // conservatively do not assume that it is used.
457   for (CallExpr::arg_iterator I = CE->arg_begin(), E = CE->arg_end();
458        I != E; ++I) {
459     if ((*I)->isGLValue()) {
460       if ((*I)->getType().isConstQualified())
461         classify((*I), Ignore);
462     } else if (isPointerToConst((*I)->getType())) {
463       const Expr *Ex = stripCasts(DC->getParentASTContext(), *I);
464       const UnaryOperator *UO = dyn_cast<UnaryOperator>(Ex);
465       if (UO && UO->getOpcode() == UO_AddrOf)
466         Ex = UO->getSubExpr();
467       classify(Ex, Ignore);
468     }
469   }
470 }
471 
VisitCastExpr(CastExpr * CE)472 void ClassifyRefs::VisitCastExpr(CastExpr *CE) {
473   if (CE->getCastKind() == CK_LValueToRValue)
474     classify(CE->getSubExpr(), Use);
475   else if (CStyleCastExpr *CSE = dyn_cast<CStyleCastExpr>(CE)) {
476     if (CSE->getType()->isVoidType()) {
477       // Squelch any detected load of an uninitialized value if
478       // we cast it to void.
479       // e.g. (void) x;
480       classify(CSE->getSubExpr(), Ignore);
481     }
482   }
483 }
484 
485 //------------------------------------------------------------------------====//
486 // Transfer function for uninitialized values analysis.
487 //====------------------------------------------------------------------------//
488 
489 namespace {
490 class TransferFunctions : public StmtVisitor<TransferFunctions> {
491   CFGBlockValues &vals;
492   const CFG &cfg;
493   const CFGBlock *block;
494   AnalysisDeclContext ∾
495   const ClassifyRefs &classification;
496   ObjCNoReturn objCNoRet;
497   UninitVariablesHandler &handler;
498 
499 public:
TransferFunctions(CFGBlockValues & vals,const CFG & cfg,const CFGBlock * block,AnalysisDeclContext & ac,const ClassifyRefs & classification,UninitVariablesHandler & handler)500   TransferFunctions(CFGBlockValues &vals, const CFG &cfg,
501                     const CFGBlock *block, AnalysisDeclContext &ac,
502                     const ClassifyRefs &classification,
503                     UninitVariablesHandler &handler)
504     : vals(vals), cfg(cfg), block(block), ac(ac),
505       classification(classification), objCNoRet(ac.getASTContext()),
506       handler(handler) {}
507 
508   void reportUse(const Expr *ex, const VarDecl *vd);
509 
510   void VisitBinaryOperator(BinaryOperator *bo);
511   void VisitBlockExpr(BlockExpr *be);
512   void VisitCallExpr(CallExpr *ce);
513   void VisitDeclRefExpr(DeclRefExpr *dr);
514   void VisitDeclStmt(DeclStmt *ds);
515   void VisitObjCForCollectionStmt(ObjCForCollectionStmt *FS);
516   void VisitObjCMessageExpr(ObjCMessageExpr *ME);
517 
isTrackedVar(const VarDecl * vd)518   bool isTrackedVar(const VarDecl *vd) {
519     return ::isTrackedVar(vd, cast<DeclContext>(ac.getDecl()));
520   }
521 
findVar(const Expr * ex)522   FindVarResult findVar(const Expr *ex) {
523     return ::findVar(ex, cast<DeclContext>(ac.getDecl()));
524   }
525 
getUninitUse(const Expr * ex,const VarDecl * vd,Value v)526   UninitUse getUninitUse(const Expr *ex, const VarDecl *vd, Value v) {
527     UninitUse Use(ex, isAlwaysUninit(v));
528 
529     assert(isUninitialized(v));
530     if (Use.getKind() == UninitUse::Always)
531       return Use;
532 
533     // If an edge which leads unconditionally to this use did not initialize
534     // the variable, we can say something stronger than 'may be uninitialized':
535     // we can say 'either it's used uninitialized or you have dead code'.
536     //
537     // We track the number of successors of a node which have been visited, and
538     // visit a node once we have visited all of its successors. Only edges where
539     // the variable might still be uninitialized are followed. Since a variable
540     // can't transfer from being initialized to being uninitialized, this will
541     // trace out the subgraph which inevitably leads to the use and does not
542     // initialize the variable. We do not want to skip past loops, since their
543     // non-termination might be correlated with the initialization condition.
544     //
545     // For example:
546     //
547     //         void f(bool a, bool b) {
548     // block1:   int n;
549     //           if (a) {
550     // block2:     if (b)
551     // block3:       n = 1;
552     // block4:   } else if (b) {
553     // block5:     while (!a) {
554     // block6:       do_work(&a);
555     //               n = 2;
556     //             }
557     //           }
558     // block7:   if (a)
559     // block8:     g();
560     // block9:   return n;
561     //         }
562     //
563     // Starting from the maybe-uninitialized use in block 9:
564     //  * Block 7 is not visited because we have only visited one of its two
565     //    successors.
566     //  * Block 8 is visited because we've visited its only successor.
567     // From block 8:
568     //  * Block 7 is visited because we've now visited both of its successors.
569     // From block 7:
570     //  * Blocks 1, 2, 4, 5, and 6 are not visited because we didn't visit all
571     //    of their successors (we didn't visit 4, 3, 5, 6, and 5, respectively).
572     //  * Block 3 is not visited because it initializes 'n'.
573     // Now the algorithm terminates, having visited blocks 7 and 8, and having
574     // found the frontier is blocks 2, 4, and 5.
575     //
576     // 'n' is definitely uninitialized for two edges into block 7 (from blocks 2
577     // and 4), so we report that any time either of those edges is taken (in
578     // each case when 'b == false'), 'n' is used uninitialized.
579     SmallVector<const CFGBlock*, 32> Queue;
580     SmallVector<unsigned, 32> SuccsVisited(cfg.getNumBlockIDs(), 0);
581     Queue.push_back(block);
582     // Specify that we've already visited all successors of the starting block.
583     // This has the dual purpose of ensuring we never add it to the queue, and
584     // of marking it as not being a candidate element of the frontier.
585     SuccsVisited[block->getBlockID()] = block->succ_size();
586     while (!Queue.empty()) {
587       const CFGBlock *B = Queue.pop_back_val();
588 
589       // If the use is always reached from the entry block, make a note of that.
590       if (B == &cfg.getEntry())
591         Use.setUninitAfterCall();
592 
593       for (CFGBlock::const_pred_iterator I = B->pred_begin(), E = B->pred_end();
594            I != E; ++I) {
595         const CFGBlock *Pred = *I;
596         if (!Pred)
597           continue;
598 
599         Value AtPredExit = vals.getValue(Pred, B, vd);
600         if (AtPredExit == Initialized)
601           // This block initializes the variable.
602           continue;
603         if (AtPredExit == MayUninitialized &&
604             vals.getValue(B, nullptr, vd) == Uninitialized) {
605           // This block declares the variable (uninitialized), and is reachable
606           // from a block that initializes the variable. We can't guarantee to
607           // give an earlier location for the diagnostic (and it appears that
608           // this code is intended to be reachable) so give a diagnostic here
609           // and go no further down this path.
610           Use.setUninitAfterDecl();
611           continue;
612         }
613 
614         unsigned &SV = SuccsVisited[Pred->getBlockID()];
615         if (!SV) {
616           // When visiting the first successor of a block, mark all NULL
617           // successors as having been visited.
618           for (CFGBlock::const_succ_iterator SI = Pred->succ_begin(),
619                                              SE = Pred->succ_end();
620                SI != SE; ++SI)
621             if (!*SI)
622               ++SV;
623         }
624 
625         if (++SV == Pred->succ_size())
626           // All paths from this block lead to the use and don't initialize the
627           // variable.
628           Queue.push_back(Pred);
629       }
630     }
631 
632     // Scan the frontier, looking for blocks where the variable was
633     // uninitialized.
634     for (CFG::const_iterator BI = cfg.begin(), BE = cfg.end(); BI != BE; ++BI) {
635       const CFGBlock *Block = *BI;
636       unsigned BlockID = Block->getBlockID();
637       const Stmt *Term = Block->getTerminator();
638       if (SuccsVisited[BlockID] && SuccsVisited[BlockID] < Block->succ_size() &&
639           Term) {
640         // This block inevitably leads to the use. If we have an edge from here
641         // to a post-dominator block, and the variable is uninitialized on that
642         // edge, we have found a bug.
643         for (CFGBlock::const_succ_iterator I = Block->succ_begin(),
644              E = Block->succ_end(); I != E; ++I) {
645           const CFGBlock *Succ = *I;
646           if (Succ && SuccsVisited[Succ->getBlockID()] >= Succ->succ_size() &&
647               vals.getValue(Block, Succ, vd) == Uninitialized) {
648             // Switch cases are a special case: report the label to the caller
649             // as the 'terminator', not the switch statement itself. Suppress
650             // situations where no label matched: we can't be sure that's
651             // possible.
652             if (isa<SwitchStmt>(Term)) {
653               const Stmt *Label = Succ->getLabel();
654               if (!Label || !isa<SwitchCase>(Label))
655                 // Might not be possible.
656                 continue;
657               UninitUse::Branch Branch;
658               Branch.Terminator = Label;
659               Branch.Output = 0; // Ignored.
660               Use.addUninitBranch(Branch);
661             } else {
662               UninitUse::Branch Branch;
663               Branch.Terminator = Term;
664               Branch.Output = I - Block->succ_begin();
665               Use.addUninitBranch(Branch);
666             }
667           }
668         }
669       }
670     }
671 
672     return Use;
673   }
674 };
675 }
676 
reportUse(const Expr * ex,const VarDecl * vd)677 void TransferFunctions::reportUse(const Expr *ex, const VarDecl *vd) {
678   Value v = vals[vd];
679   if (isUninitialized(v))
680     handler.handleUseOfUninitVariable(vd, getUninitUse(ex, vd, v));
681 }
682 
VisitObjCForCollectionStmt(ObjCForCollectionStmt * FS)683 void TransferFunctions::VisitObjCForCollectionStmt(ObjCForCollectionStmt *FS) {
684   // This represents an initialization of the 'element' value.
685   if (DeclStmt *DS = dyn_cast<DeclStmt>(FS->getElement())) {
686     const VarDecl *VD = cast<VarDecl>(DS->getSingleDecl());
687     if (isTrackedVar(VD))
688       vals[VD] = Initialized;
689   }
690 }
691 
VisitBlockExpr(BlockExpr * be)692 void TransferFunctions::VisitBlockExpr(BlockExpr *be) {
693   const BlockDecl *bd = be->getBlockDecl();
694   for (const auto &I : bd->captures()) {
695     const VarDecl *vd = I.getVariable();
696     if (!isTrackedVar(vd))
697       continue;
698     if (I.isByRef()) {
699       vals[vd] = Initialized;
700       continue;
701     }
702     reportUse(be, vd);
703   }
704 }
705 
VisitCallExpr(CallExpr * ce)706 void TransferFunctions::VisitCallExpr(CallExpr *ce) {
707   if (Decl *Callee = ce->getCalleeDecl()) {
708     if (Callee->hasAttr<ReturnsTwiceAttr>()) {
709       // After a call to a function like setjmp or vfork, any variable which is
710       // initialized anywhere within this function may now be initialized. For
711       // now, just assume such a call initializes all variables.  FIXME: Only
712       // mark variables as initialized if they have an initializer which is
713       // reachable from here.
714       vals.setAllScratchValues(Initialized);
715     }
716     else if (Callee->hasAttr<AnalyzerNoReturnAttr>()) {
717       // Functions labeled like "analyzer_noreturn" are often used to denote
718       // "panic" functions that in special debug situations can still return,
719       // but for the most part should not be treated as returning.  This is a
720       // useful annotation borrowed from the static analyzer that is useful for
721       // suppressing branch-specific false positives when we call one of these
722       // functions but keep pretending the path continues (when in reality the
723       // user doesn't care).
724       vals.setAllScratchValues(Unknown);
725     }
726   }
727 }
728 
VisitDeclRefExpr(DeclRefExpr * dr)729 void TransferFunctions::VisitDeclRefExpr(DeclRefExpr *dr) {
730   switch (classification.get(dr)) {
731   case ClassifyRefs::Ignore:
732     break;
733   case ClassifyRefs::Use:
734     reportUse(dr, cast<VarDecl>(dr->getDecl()));
735     break;
736   case ClassifyRefs::Init:
737     vals[cast<VarDecl>(dr->getDecl())] = Initialized;
738     break;
739   case ClassifyRefs::SelfInit:
740       handler.handleSelfInit(cast<VarDecl>(dr->getDecl()));
741     break;
742   }
743 }
744 
VisitBinaryOperator(BinaryOperator * BO)745 void TransferFunctions::VisitBinaryOperator(BinaryOperator *BO) {
746   if (BO->getOpcode() == BO_Assign) {
747     FindVarResult Var = findVar(BO->getLHS());
748     if (const VarDecl *VD = Var.getDecl())
749       vals[VD] = Initialized;
750   }
751 }
752 
VisitDeclStmt(DeclStmt * DS)753 void TransferFunctions::VisitDeclStmt(DeclStmt *DS) {
754   for (auto *DI : DS->decls()) {
755     VarDecl *VD = dyn_cast<VarDecl>(DI);
756     if (VD && isTrackedVar(VD)) {
757       if (getSelfInitExpr(VD)) {
758         // If the initializer consists solely of a reference to itself, we
759         // explicitly mark the variable as uninitialized. This allows code
760         // like the following:
761         //
762         //   int x = x;
763         //
764         // to deliberately leave a variable uninitialized. Different analysis
765         // clients can detect this pattern and adjust their reporting
766         // appropriately, but we need to continue to analyze subsequent uses
767         // of the variable.
768         vals[VD] = Uninitialized;
769       } else if (VD->getInit()) {
770         // Treat the new variable as initialized.
771         vals[VD] = Initialized;
772       } else {
773         // No initializer: the variable is now uninitialized. This matters
774         // for cases like:
775         //   while (...) {
776         //     int n;
777         //     use(n);
778         //     n = 0;
779         //   }
780         // FIXME: Mark the variable as uninitialized whenever its scope is
781         // left, since its scope could be re-entered by a jump over the
782         // declaration.
783         vals[VD] = Uninitialized;
784       }
785     }
786   }
787 }
788 
VisitObjCMessageExpr(ObjCMessageExpr * ME)789 void TransferFunctions::VisitObjCMessageExpr(ObjCMessageExpr *ME) {
790   // If the Objective-C message expression is an implicit no-return that
791   // is not modeled in the CFG, set the tracked dataflow values to Unknown.
792   if (objCNoRet.isImplicitNoReturn(ME)) {
793     vals.setAllScratchValues(Unknown);
794   }
795 }
796 
797 //------------------------------------------------------------------------====//
798 // High-level "driver" logic for uninitialized values analysis.
799 //====------------------------------------------------------------------------//
800 
runOnBlock(const CFGBlock * block,const CFG & cfg,AnalysisDeclContext & ac,CFGBlockValues & vals,const ClassifyRefs & classification,llvm::BitVector & wasAnalyzed,UninitVariablesHandler & handler)801 static bool runOnBlock(const CFGBlock *block, const CFG &cfg,
802                        AnalysisDeclContext &ac, CFGBlockValues &vals,
803                        const ClassifyRefs &classification,
804                        llvm::BitVector &wasAnalyzed,
805                        UninitVariablesHandler &handler) {
806   wasAnalyzed[block->getBlockID()] = true;
807   vals.resetScratch();
808   // Merge in values of predecessor blocks.
809   bool isFirst = true;
810   for (CFGBlock::const_pred_iterator I = block->pred_begin(),
811        E = block->pred_end(); I != E; ++I) {
812     const CFGBlock *pred = *I;
813     if (!pred)
814       continue;
815     if (wasAnalyzed[pred->getBlockID()]) {
816       vals.mergeIntoScratch(vals.getValueVector(pred), isFirst);
817       isFirst = false;
818     }
819   }
820   // Apply the transfer function.
821   TransferFunctions tf(vals, cfg, block, ac, classification, handler);
822   for (CFGBlock::const_iterator I = block->begin(), E = block->end();
823        I != E; ++I) {
824     if (Optional<CFGStmt> cs = I->getAs<CFGStmt>())
825       tf.Visit(const_cast<Stmt*>(cs->getStmt()));
826   }
827   return vals.updateValueVectorWithScratch(block);
828 }
829 
830 /// PruneBlocksHandler is a special UninitVariablesHandler that is used
831 /// to detect when a CFGBlock has any *potential* use of an uninitialized
832 /// variable.  It is mainly used to prune out work during the final
833 /// reporting pass.
834 namespace {
835 struct PruneBlocksHandler : public UninitVariablesHandler {
PruneBlocksHandler__anon8c45b64e0611::PruneBlocksHandler836   PruneBlocksHandler(unsigned numBlocks)
837     : hadUse(numBlocks, false), hadAnyUse(false),
838       currentBlock(0) {}
839 
~PruneBlocksHandler__anon8c45b64e0611::PruneBlocksHandler840   ~PruneBlocksHandler() override {}
841 
842   /// Records if a CFGBlock had a potential use of an uninitialized variable.
843   llvm::BitVector hadUse;
844 
845   /// Records if any CFGBlock had a potential use of an uninitialized variable.
846   bool hadAnyUse;
847 
848   /// The current block to scribble use information.
849   unsigned currentBlock;
850 
handleUseOfUninitVariable__anon8c45b64e0611::PruneBlocksHandler851   void handleUseOfUninitVariable(const VarDecl *vd,
852                                  const UninitUse &use) override {
853     hadUse[currentBlock] = true;
854     hadAnyUse = true;
855   }
856 
857   /// Called when the uninitialized variable analysis detects the
858   /// idiom 'int x = x'.  All other uses of 'x' within the initializer
859   /// are handled by handleUseOfUninitVariable.
handleSelfInit__anon8c45b64e0611::PruneBlocksHandler860   void handleSelfInit(const VarDecl *vd) override {
861     hadUse[currentBlock] = true;
862     hadAnyUse = true;
863   }
864 };
865 }
866 
runUninitializedVariablesAnalysis(const DeclContext & dc,const CFG & cfg,AnalysisDeclContext & ac,UninitVariablesHandler & handler,UninitVariablesAnalysisStats & stats)867 void clang::runUninitializedVariablesAnalysis(
868     const DeclContext &dc,
869     const CFG &cfg,
870     AnalysisDeclContext &ac,
871     UninitVariablesHandler &handler,
872     UninitVariablesAnalysisStats &stats) {
873   CFGBlockValues vals(cfg);
874   vals.computeSetOfDeclarations(dc);
875   if (vals.hasNoDeclarations())
876     return;
877 
878   stats.NumVariablesAnalyzed = vals.getNumEntries();
879 
880   // Precompute which expressions are uses and which are initializations.
881   ClassifyRefs classification(ac);
882   cfg.VisitBlockStmts(classification);
883 
884   // Mark all variables uninitialized at the entry.
885   const CFGBlock &entry = cfg.getEntry();
886   ValueVector &vec = vals.getValueVector(&entry);
887   const unsigned n = vals.getNumEntries();
888   for (unsigned j = 0; j < n ; ++j) {
889     vec[j] = Uninitialized;
890   }
891 
892   // Proceed with the workist.
893   DataflowWorklist worklist(cfg, *ac.getAnalysis<PostOrderCFGView>());
894   llvm::BitVector previouslyVisited(cfg.getNumBlockIDs());
895   worklist.enqueueSuccessors(&cfg.getEntry());
896   llvm::BitVector wasAnalyzed(cfg.getNumBlockIDs(), false);
897   wasAnalyzed[cfg.getEntry().getBlockID()] = true;
898   PruneBlocksHandler PBH(cfg.getNumBlockIDs());
899 
900   while (const CFGBlock *block = worklist.dequeue()) {
901     PBH.currentBlock = block->getBlockID();
902 
903     // Did the block change?
904     bool changed = runOnBlock(block, cfg, ac, vals,
905                               classification, wasAnalyzed, PBH);
906     ++stats.NumBlockVisits;
907     if (changed || !previouslyVisited[block->getBlockID()])
908       worklist.enqueueSuccessors(block);
909     previouslyVisited[block->getBlockID()] = true;
910   }
911 
912   if (!PBH.hadAnyUse)
913     return;
914 
915   // Run through the blocks one more time, and report uninitialized variables.
916   for (CFG::const_iterator BI = cfg.begin(), BE = cfg.end(); BI != BE; ++BI) {
917     const CFGBlock *block = *BI;
918     if (PBH.hadUse[block->getBlockID()]) {
919       runOnBlock(block, cfg, ac, vals, classification, wasAnalyzed, handler);
920       ++stats.NumBlockVisits;
921     }
922   }
923 }
924 
~UninitVariablesHandler()925 UninitVariablesHandler::~UninitVariablesHandler() {}
926