blob: 730aa6ba212c79d9bbf892a072b04b5510ee9dbd [file] [log] [blame]
Ted Kremenek6f342132011-03-15 03:17:07 +00001//==- UninitializedValues.cpp - Find Uninitialized Values -------*- C++ --*-==//
Ted Kremenek610068c2011-01-15 02:58:47 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements uninitialized values analysis for source-level CFGs.
11//
12//===----------------------------------------------------------------------===//
13
Richard Smith558e8872012-07-13 23:33:44 +000014#include "clang/AST/ASTContext.h"
Benjamin Kramer2fa67ef2012-12-01 15:09:41 +000015#include "clang/AST/Attr.h"
Ted Kremenek610068c2011-01-15 02:58:47 +000016#include "clang/AST/Decl.h"
Ted Kremenekc1602582012-11-17 02:00:00 +000017#include "clang/Analysis/Analyses/PostOrderCFGView.h"
Ted Kremenek6f342132011-03-15 03:17:07 +000018#include "clang/Analysis/Analyses/UninitializedValues.h"
Benjamin Kramer2fa67ef2012-12-01 15:09:41 +000019#include "clang/Analysis/AnalysisContext.h"
20#include "clang/Analysis/CFG.h"
Ted Kremenek25c1d572012-09-13 00:21:35 +000021#include "clang/Analysis/DomainSpecific/ObjCNoReturn.h"
Benjamin Kramer2fa67ef2012-12-01 15:09:41 +000022#include "clang/Analysis/Visitors/CFGRecStmtDeclVisitor.h"
23#include "llvm/ADT/DenseMap.h"
24#include "llvm/ADT/Optional.h"
25#include "llvm/ADT/PackedVector.h"
26#include "llvm/ADT/SmallBitVector.h"
27#include "llvm/ADT/SmallVector.h"
Argyrios Kyrtzidisb2c60b02012-03-01 19:45:56 +000028#include "llvm/Support/SaveAndRestore.h"
Benjamin Kramer2fa67ef2012-12-01 15:09:41 +000029#include <utility>
Ted Kremenek610068c2011-01-15 02:58:47 +000030
31using namespace clang;
32
Richard Smith558e8872012-07-13 23:33:44 +000033#define DEBUG_LOGGING 0
34
Ted Kremenek40900ee2011-01-27 02:29:34 +000035static bool isTrackedVar(const VarDecl *vd, const DeclContext *dc) {
Ted Kremenek1cbc3152011-03-17 03:06:11 +000036 if (vd->isLocalVarDecl() && !vd->hasGlobalStorage() &&
Ted Kremeneka21612f2011-04-07 20:02:56 +000037 !vd->isExceptionVariable() &&
Ted Kremenek1cbc3152011-03-17 03:06:11 +000038 vd->getDeclContext() == dc) {
39 QualType ty = vd->getType();
40 return ty->isScalarType() || ty->isVectorType();
41 }
42 return false;
Ted Kremenekc104e532011-01-18 04:53:25 +000043}
44
Ted Kremenek610068c2011-01-15 02:58:47 +000045//------------------------------------------------------------------------====//
Ted Kremenek136f8f22011-03-15 04:57:27 +000046// DeclToIndex: a mapping from Decls we track to value indices.
Ted Kremenek610068c2011-01-15 02:58:47 +000047//====------------------------------------------------------------------------//
48
49namespace {
Ted Kremenek136f8f22011-03-15 04:57:27 +000050class DeclToIndex {
Ted Kremenek610068c2011-01-15 02:58:47 +000051 llvm::DenseMap<const VarDecl *, unsigned> map;
52public:
Ted Kremenek136f8f22011-03-15 04:57:27 +000053 DeclToIndex() {}
Ted Kremenek610068c2011-01-15 02:58:47 +000054
55 /// Compute the actual mapping from declarations to bits.
56 void computeMap(const DeclContext &dc);
57
58 /// Return the number of declarations in the map.
59 unsigned size() const { return map.size(); }
60
61 /// Returns the bit vector index for a given declaration.
David Blaikiedc84cd52013-02-20 22:23:23 +000062 Optional<unsigned> getValueIndex(const VarDecl *d) const;
Ted Kremenek610068c2011-01-15 02:58:47 +000063};
64}
65
Ted Kremenek136f8f22011-03-15 04:57:27 +000066void DeclToIndex::computeMap(const DeclContext &dc) {
Ted Kremenek610068c2011-01-15 02:58:47 +000067 unsigned count = 0;
68 DeclContext::specific_decl_iterator<VarDecl> I(dc.decls_begin()),
69 E(dc.decls_end());
70 for ( ; I != E; ++I) {
David Blaikie581deb32012-06-06 20:45:41 +000071 const VarDecl *vd = *I;
Ted Kremenek40900ee2011-01-27 02:29:34 +000072 if (isTrackedVar(vd, &dc))
Ted Kremenek610068c2011-01-15 02:58:47 +000073 map[vd] = count++;
74 }
75}
76
David Blaikiedc84cd52013-02-20 22:23:23 +000077Optional<unsigned> DeclToIndex::getValueIndex(const VarDecl *d) const {
Ted Kremenekb831c672011-03-29 01:40:00 +000078 llvm::DenseMap<const VarDecl *, unsigned>::const_iterator I = map.find(d);
Ted Kremenek610068c2011-01-15 02:58:47 +000079 if (I == map.end())
David Blaikie66874fb2013-02-21 01:47:18 +000080 return None;
Ted Kremenek610068c2011-01-15 02:58:47 +000081 return I->second;
82}
83
84//------------------------------------------------------------------------====//
85// CFGBlockValues: dataflow values for CFG blocks.
86//====------------------------------------------------------------------------//
87
// Dataflow lattice values, two bits per variable. The encoding is chosen so
// that merging two values is a bitwise OR:
//   Unknown | X                 == X
//   Initialized | Uninitialized == MayUninitialized
enum Value {
  Unknown = 0x0,          /* 00 */
  Initialized = 0x1,      /* 01 */
  Uninitialized = 0x2,    /* 10 */
  MayUninitialized = 0x3  /* 11 */
};

/// True for Uninitialized and MayUninitialized, i.e. whenever the
/// "uninitialized" bit (the high bit of the encoding) is set.
static bool isUninitialized(const Value v) {
  return (v & Uninitialized) != 0;
}

/// True only for the definite Uninitialized value.
static bool isAlwaysUninit(const Value v) {
  return v == Uninitialized;
}
Ted Kremenekafb10c42011-03-15 04:57:29 +0000101
Benjamin Kramerda57f3e2011-03-26 12:38:21 +0000102namespace {
Ted Kremenek496398d2011-03-15 04:57:32 +0000103
Benjamin Kramerda3d76b2012-09-28 16:44:29 +0000104typedef llvm::PackedVector<Value, 2, llvm::SmallBitVector> ValueVector;
Ted Kremenek13bd4232011-01-20 17:37:17 +0000105
Ted Kremenek610068c2011-01-15 02:58:47 +0000106class CFGBlockValues {
107 const CFG &cfg;
Benjamin Kramerda3d76b2012-09-28 16:44:29 +0000108 SmallVector<ValueVector, 8> vals;
Ted Kremenek136f8f22011-03-15 04:57:27 +0000109 ValueVector scratch;
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000110 DeclToIndex declToIndex;
Ted Kremenek610068c2011-01-15 02:58:47 +0000111public:
112 CFGBlockValues(const CFG &cfg);
Ted Kremenekeee18c32012-07-19 04:59:05 +0000113
Ted Kremenekd40066b2011-04-04 23:29:12 +0000114 unsigned getNumEntries() const { return declToIndex.size(); }
115
Ted Kremenek610068c2011-01-15 02:58:47 +0000116 void computeSetOfDeclarations(const DeclContext &dc);
Ted Kremenekeee18c32012-07-19 04:59:05 +0000117 ValueVector &getValueVector(const CFGBlock *block) {
Benjamin Kramerda3d76b2012-09-28 16:44:29 +0000118 return vals[block->getBlockID()];
Ted Kremenekeee18c32012-07-19 04:59:05 +0000119 }
Ted Kremenek13bd4232011-01-20 17:37:17 +0000120
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000121 void setAllScratchValues(Value V);
Ted Kremenek136f8f22011-03-15 04:57:27 +0000122 void mergeIntoScratch(ValueVector const &source, bool isFirst);
123 bool updateValueVectorWithScratch(const CFGBlock *block);
Ted Kremenek610068c2011-01-15 02:58:47 +0000124
125 bool hasNoDeclarations() const {
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000126 return declToIndex.size() == 0;
Ted Kremenek610068c2011-01-15 02:58:47 +0000127 }
Ted Kremeneke0e29332011-08-20 01:15:28 +0000128
Ted Kremenek610068c2011-01-15 02:58:47 +0000129 void resetScratch();
Ted Kremenek13bd4232011-01-20 17:37:17 +0000130
Ted Kremenek136f8f22011-03-15 04:57:27 +0000131 ValueVector::reference operator[](const VarDecl *vd);
Richard Smith2815e1a2012-05-25 02:17:09 +0000132
133 Value getValue(const CFGBlock *block, const CFGBlock *dstBlock,
134 const VarDecl *vd) {
David Blaikiedc84cd52013-02-20 22:23:23 +0000135 const Optional<unsigned> &idx = declToIndex.getValueIndex(vd);
Richard Smith2815e1a2012-05-25 02:17:09 +0000136 assert(idx.hasValue());
Ted Kremenekeee18c32012-07-19 04:59:05 +0000137 return getValueVector(block)[idx.getValue()];
Richard Smith2815e1a2012-05-25 02:17:09 +0000138 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000139};
Benjamin Kramerda57f3e2011-03-26 12:38:21 +0000140} // end anonymous namespace
Ted Kremenek610068c2011-01-15 02:58:47 +0000141
Ted Kremenekeee18c32012-07-19 04:59:05 +0000142CFGBlockValues::CFGBlockValues(const CFG &c) : cfg(c), vals(0) {}
Ted Kremenek610068c2011-01-15 02:58:47 +0000143
Ted Kremenek610068c2011-01-15 02:58:47 +0000144void CFGBlockValues::computeSetOfDeclarations(const DeclContext &dc) {
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000145 declToIndex.computeMap(dc);
Ted Kremenekeee18c32012-07-19 04:59:05 +0000146 unsigned decls = declToIndex.size();
147 scratch.resize(decls);
148 unsigned n = cfg.getNumBlockIDs();
149 if (!n)
150 return;
151 vals.resize(n);
152 for (unsigned i = 0; i < n; ++i)
Benjamin Kramerda3d76b2012-09-28 16:44:29 +0000153 vals[i].resize(decls);
Ted Kremenek13bd4232011-01-20 17:37:17 +0000154}
155
#if DEBUG_LOGGING
/// Debug helper: prints "<block id> : <v0> <v1> ... : <num>" to llvm::errs().
static void printVector(const CFGBlock *block, ValueVector &bv,
                        unsigned num) {
  llvm::errs() << block->getBlockID() << " :";
  unsigned idx = 0;
  while (idx < bv.size()) {
    llvm::errs() << ' ' << bv[idx];
    ++idx;
  }
  llvm::errs() << " : " << num << '\n';
}
#endif
Ted Kremenek610068c2011-01-15 02:58:47 +0000166
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000167void CFGBlockValues::setAllScratchValues(Value V) {
168 for (unsigned I = 0, E = scratch.size(); I != E; ++I)
169 scratch[I] = V;
170}
171
Ted Kremenekc5f740e2011-10-07 00:42:48 +0000172void CFGBlockValues::mergeIntoScratch(ValueVector const &source,
173 bool isFirst) {
174 if (isFirst)
175 scratch = source;
176 else
177 scratch |= source;
178}
179
Ted Kremenek136f8f22011-03-15 04:57:27 +0000180bool CFGBlockValues::updateValueVectorWithScratch(const CFGBlock *block) {
Ted Kremenekeee18c32012-07-19 04:59:05 +0000181 ValueVector &dst = getValueVector(block);
Ted Kremenek610068c2011-01-15 02:58:47 +0000182 bool changed = (dst != scratch);
183 if (changed)
184 dst = scratch;
Richard Smith558e8872012-07-13 23:33:44 +0000185#if DEBUG_LOGGING
Ted Kremenek9fcbcee2011-02-01 17:43:18 +0000186 printVector(block, scratch, 0);
187#endif
Ted Kremenek13bd4232011-01-20 17:37:17 +0000188 return changed;
189}
190
Ted Kremenek610068c2011-01-15 02:58:47 +0000191void CFGBlockValues::resetScratch() {
192 scratch.reset();
193}
194
Ted Kremenek136f8f22011-03-15 04:57:27 +0000195ValueVector::reference CFGBlockValues::operator[](const VarDecl *vd) {
David Blaikiedc84cd52013-02-20 22:23:23 +0000196 const Optional<unsigned> &idx = declToIndex.getValueIndex(vd);
Ted Kremenek610068c2011-01-15 02:58:47 +0000197 assert(idx.hasValue());
198 return scratch[idx.getValue()];
199}
200
201//------------------------------------------------------------------------====//
202// Worklist: worklist for dataflow analysis.
203//====------------------------------------------------------------------------//
204
205namespace {
206class DataflowWorklist {
Ted Kremenekc1602582012-11-17 02:00:00 +0000207 PostOrderCFGView::iterator PO_I, PO_E;
Chris Lattner5f9e2722011-07-23 10:55:15 +0000208 SmallVector<const CFGBlock *, 20> worklist;
Ted Kremenek496398d2011-03-15 04:57:32 +0000209 llvm::BitVector enqueuedBlocks;
Ted Kremenek610068c2011-01-15 02:58:47 +0000210public:
Ted Kremenekc1602582012-11-17 02:00:00 +0000211 DataflowWorklist(const CFG &cfg, PostOrderCFGView &view)
212 : PO_I(view.begin()), PO_E(view.end()),
213 enqueuedBlocks(cfg.getNumBlockIDs(), true) {
214 // Treat the first block as already analyzed.
215 if (PO_I != PO_E) {
216 assert(*PO_I == &cfg.getEntry());
217 enqueuedBlocks[(*PO_I)->getBlockID()] = false;
218 ++PO_I;
219 }
220 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000221
Ted Kremenek610068c2011-01-15 02:58:47 +0000222 void enqueueSuccessors(const CFGBlock *block);
223 const CFGBlock *dequeue();
Ted Kremenek610068c2011-01-15 02:58:47 +0000224};
225}
226
Ted Kremenek610068c2011-01-15 02:58:47 +0000227void DataflowWorklist::enqueueSuccessors(const clang::CFGBlock *block) {
228 for (CFGBlock::const_succ_iterator I = block->succ_begin(),
229 E = block->succ_end(); I != E; ++I) {
Chandler Carruth80520502011-07-08 11:19:06 +0000230 const CFGBlock *Successor = *I;
231 if (!Successor || enqueuedBlocks[Successor->getBlockID()])
232 continue;
233 worklist.push_back(Successor);
234 enqueuedBlocks[Successor->getBlockID()] = true;
Ted Kremenek610068c2011-01-15 02:58:47 +0000235 }
236}
237
238const CFGBlock *DataflowWorklist::dequeue() {
Ted Kremenekc1602582012-11-17 02:00:00 +0000239 const CFGBlock *B = 0;
240
241 // First dequeue from the worklist. This can represent
242 // updates along backedges that we want propagated as quickly as possible.
243 if (!worklist.empty()) {
244 B = worklist.back();
245 worklist.pop_back();
246 }
247 // Next dequeue from the initial reverse post order. This is the
248 // theoretical ideal in the presence of no back edges.
249 else if (PO_I != PO_E) {
250 B = *PO_I;
251 ++PO_I;
252 }
253 else {
Ted Kremenek610068c2011-01-15 02:58:47 +0000254 return 0;
Ted Kremenekc1602582012-11-17 02:00:00 +0000255 }
256
257 assert(enqueuedBlocks[B->getBlockID()] == true);
258 enqueuedBlocks[B->getBlockID()] = false;
259 return B;
Ted Kremenek610068c2011-01-15 02:58:47 +0000260}
261
262//------------------------------------------------------------------------====//
Richard Smith9532e0d2012-07-17 00:06:14 +0000263// Classification of DeclRefExprs as use or initialization.
Ted Kremenek610068c2011-01-15 02:58:47 +0000264//====------------------------------------------------------------------------//
265
Ted Kremenek610068c2011-01-15 02:58:47 +0000266namespace {
267class FindVarResult {
268 const VarDecl *vd;
269 const DeclRefExpr *dr;
270public:
Richard Smith9532e0d2012-07-17 00:06:14 +0000271 FindVarResult(const VarDecl *vd, const DeclRefExpr *dr) : vd(vd), dr(dr) {}
272
Ted Kremenek610068c2011-01-15 02:58:47 +0000273 const DeclRefExpr *getDeclRefExpr() const { return dr; }
274 const VarDecl *getDecl() const { return vd; }
275};
Richard Smith9532e0d2012-07-17 00:06:14 +0000276
277static const Expr *stripCasts(ASTContext &C, const Expr *Ex) {
278 while (Ex) {
279 Ex = Ex->IgnoreParenNoopCasts(C);
280 if (const CastExpr *CE = dyn_cast<CastExpr>(Ex)) {
281 if (CE->getCastKind() == CK_LValueBitCast) {
282 Ex = CE->getSubExpr();
283 continue;
284 }
285 }
286 break;
287 }
288 return Ex;
289}
290
291/// If E is an expression comprising a reference to a single variable, find that
292/// variable.
293static FindVarResult findVar(const Expr *E, const DeclContext *DC) {
294 if (const DeclRefExpr *DRE =
295 dyn_cast<DeclRefExpr>(stripCasts(DC->getParentASTContext(), E)))
296 if (const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl()))
297 if (isTrackedVar(VD, DC))
298 return FindVarResult(VD, DRE);
299 return FindVarResult(0, 0);
300}
301
302/// \brief Classify each DeclRefExpr as an initialization or a use. Any
303/// DeclRefExpr which isn't explicitly classified will be assumed to have
304/// escaped the analysis and will be treated as an initialization.
305class ClassifyRefs : public StmtVisitor<ClassifyRefs> {
306public:
307 enum Class {
308 Init,
309 Use,
310 SelfInit,
311 Ignore
312 };
313
314private:
315 const DeclContext *DC;
316 llvm::DenseMap<const DeclRefExpr*, Class> Classification;
317
318 bool isTrackedVar(const VarDecl *VD) const {
319 return ::isTrackedVar(VD, DC);
320 }
321
322 void classify(const Expr *E, Class C);
323
324public:
325 ClassifyRefs(AnalysisDeclContext &AC) : DC(cast<DeclContext>(AC.getDecl())) {}
326
327 void VisitDeclStmt(DeclStmt *DS);
328 void VisitUnaryOperator(UnaryOperator *UO);
329 void VisitBinaryOperator(BinaryOperator *BO);
330 void VisitCallExpr(CallExpr *CE);
331 void VisitCastExpr(CastExpr *CE);
332
333 void operator()(Stmt *S) { Visit(S); }
334
335 Class get(const DeclRefExpr *DRE) const {
336 llvm::DenseMap<const DeclRefExpr*, Class>::const_iterator I
337 = Classification.find(DRE);
338 if (I != Classification.end())
339 return I->second;
340
341 const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl());
342 if (!VD || !isTrackedVar(VD))
343 return Ignore;
344
345 return Init;
346 }
347};
348}
349
350static const DeclRefExpr *getSelfInitExpr(VarDecl *VD) {
351 if (Expr *Init = VD->getInit()) {
352 const DeclRefExpr *DRE
353 = dyn_cast<DeclRefExpr>(stripCasts(VD->getASTContext(), Init));
354 if (DRE && DRE->getDecl() == VD)
355 return DRE;
356 }
357 return 0;
358}
359
360void ClassifyRefs::classify(const Expr *E, Class C) {
Ted Kremenek77fd3c02013-01-19 00:25:06 +0000361 // The result of a ?: could also be an lvalue.
362 E = E->IgnoreParens();
363 if (const ConditionalOperator *CO = dyn_cast<ConditionalOperator>(E)) {
364 const Expr *TrueExpr = CO->getTrueExpr();
365 if (!isa<OpaqueValueExpr>(TrueExpr))
366 classify(TrueExpr, C);
367 classify(CO->getFalseExpr(), C);
368 return;
369 }
370
Richard Smith9532e0d2012-07-17 00:06:14 +0000371 FindVarResult Var = findVar(E, DC);
372 if (const DeclRefExpr *DRE = Var.getDeclRefExpr())
373 Classification[DRE] = std::max(Classification[DRE], C);
374}
375
376void ClassifyRefs::VisitDeclStmt(DeclStmt *DS) {
377 for (DeclStmt::decl_iterator DI = DS->decl_begin(), DE = DS->decl_end();
378 DI != DE; ++DI) {
379 VarDecl *VD = dyn_cast<VarDecl>(*DI);
380 if (VD && isTrackedVar(VD))
381 if (const DeclRefExpr *DRE = getSelfInitExpr(VD))
382 Classification[DRE] = SelfInit;
383 }
384}
385
386void ClassifyRefs::VisitBinaryOperator(BinaryOperator *BO) {
387 // Ignore the evaluation of a DeclRefExpr on the LHS of an assignment. If this
388 // is not a compound-assignment, we will treat it as initializing the variable
389 // when TransferFunctions visits it. A compound-assignment does not affect
390 // whether a variable is uninitialized, and there's no point counting it as a
391 // use.
Richard Smith6cfa78f2012-07-17 01:27:33 +0000392 if (BO->isCompoundAssignmentOp())
393 classify(BO->getLHS(), Use);
394 else if (BO->getOpcode() == BO_Assign)
Richard Smith9532e0d2012-07-17 00:06:14 +0000395 classify(BO->getLHS(), Ignore);
396}
397
398void ClassifyRefs::VisitUnaryOperator(UnaryOperator *UO) {
399 // Increment and decrement are uses despite there being no lvalue-to-rvalue
400 // conversion.
401 if (UO->isIncrementDecrementOp())
402 classify(UO->getSubExpr(), Use);
403}
404
405void ClassifyRefs::VisitCallExpr(CallExpr *CE) {
406 // If a value is passed by const reference to a function, we should not assume
407 // that it is initialized by the call, and we conservatively do not assume
408 // that it is used.
409 for (CallExpr::arg_iterator I = CE->arg_begin(), E = CE->arg_end();
410 I != E; ++I)
411 if ((*I)->getType().isConstQualified() && (*I)->isGLValue())
412 classify(*I, Ignore);
413}
414
415void ClassifyRefs::VisitCastExpr(CastExpr *CE) {
416 if (CE->getCastKind() == CK_LValueToRValue)
417 classify(CE->getSubExpr(), Use);
418 else if (CStyleCastExpr *CSE = dyn_cast<CStyleCastExpr>(CE)) {
419 if (CSE->getType()->isVoidType()) {
420 // Squelch any detected load of an uninitialized value if
421 // we cast it to void.
422 // e.g. (void) x;
423 classify(CSE->getSubExpr(), Ignore);
424 }
425 }
426}
427
428//------------------------------------------------------------------------====//
429// Transfer function for uninitialized values analysis.
430//====------------------------------------------------------------------------//
431
432namespace {
Ted Kremenek0c8e5a02011-07-19 14:18:48 +0000433class TransferFunctions : public StmtVisitor<TransferFunctions> {
Ted Kremenek610068c2011-01-15 02:58:47 +0000434 CFGBlockValues &vals;
435 const CFG &cfg;
Richard Smith2815e1a2012-05-25 02:17:09 +0000436 const CFGBlock *block;
Ted Kremenek1d26f482011-10-24 01:32:45 +0000437 AnalysisDeclContext &ac;
Richard Smith9532e0d2012-07-17 00:06:14 +0000438 const ClassifyRefs &classification;
Ted Kremenek25c1d572012-09-13 00:21:35 +0000439 ObjCNoReturn objCNoRet;
Ted Kremenekeba76a42012-11-17 07:18:30 +0000440 UninitVariablesHandler &handler;
Richard Smith9532e0d2012-07-17 00:06:14 +0000441
Ted Kremenek610068c2011-01-15 02:58:47 +0000442public:
443 TransferFunctions(CFGBlockValues &vals, const CFG &cfg,
Richard Smith2815e1a2012-05-25 02:17:09 +0000444 const CFGBlock *block, AnalysisDeclContext &ac,
Richard Smith9532e0d2012-07-17 00:06:14 +0000445 const ClassifyRefs &classification,
Ted Kremenekeba76a42012-11-17 07:18:30 +0000446 UninitVariablesHandler &handler)
Richard Smith9532e0d2012-07-17 00:06:14 +0000447 : vals(vals), cfg(cfg), block(block), ac(ac),
Ted Kremenek25c1d572012-09-13 00:21:35 +0000448 classification(classification), objCNoRet(ac.getASTContext()),
449 handler(handler) {}
Richard Smith9532e0d2012-07-17 00:06:14 +0000450
Richard Smith81891882012-05-24 23:45:35 +0000451 void reportUse(const Expr *ex, const VarDecl *vd);
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000452
Ted Kremenek25c1d572012-09-13 00:21:35 +0000453 void VisitBinaryOperator(BinaryOperator *bo);
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000454 void VisitBlockExpr(BlockExpr *be);
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000455 void VisitCallExpr(CallExpr *ce);
Ted Kremenekc21fed32011-01-18 21:18:58 +0000456 void VisitDeclRefExpr(DeclRefExpr *dr);
Ted Kremenek25c1d572012-09-13 00:21:35 +0000457 void VisitDeclStmt(DeclStmt *ds);
458 void VisitObjCForCollectionStmt(ObjCForCollectionStmt *FS);
459 void VisitObjCMessageExpr(ObjCMessageExpr *ME);
Richard Smith2815e1a2012-05-25 02:17:09 +0000460
Ted Kremenek40900ee2011-01-27 02:29:34 +0000461 bool isTrackedVar(const VarDecl *vd) {
462 return ::isTrackedVar(vd, cast<DeclContext>(ac.getDecl()));
463 }
Richard Smith2815e1a2012-05-25 02:17:09 +0000464
Richard Smith9532e0d2012-07-17 00:06:14 +0000465 FindVarResult findVar(const Expr *ex) {
466 return ::findVar(ex, cast<DeclContext>(ac.getDecl()));
467 }
468
Richard Smith2815e1a2012-05-25 02:17:09 +0000469 UninitUse getUninitUse(const Expr *ex, const VarDecl *vd, Value v) {
470 UninitUse Use(ex, isAlwaysUninit(v));
471
472 assert(isUninitialized(v));
473 if (Use.getKind() == UninitUse::Always)
474 return Use;
475
476 // If an edge which leads unconditionally to this use did not initialize
477 // the variable, we can say something stronger than 'may be uninitialized':
478 // we can say 'either it's used uninitialized or you have dead code'.
479 //
480 // We track the number of successors of a node which have been visited, and
481 // visit a node once we have visited all of its successors. Only edges where
482 // the variable might still be uninitialized are followed. Since a variable
483 // can't transfer from being initialized to being uninitialized, this will
484 // trace out the subgraph which inevitably leads to the use and does not
485 // initialize the variable. We do not want to skip past loops, since their
486 // non-termination might be correlated with the initialization condition.
487 //
488 // For example:
489 //
490 // void f(bool a, bool b) {
491 // block1: int n;
492 // if (a) {
493 // block2: if (b)
494 // block3: n = 1;
495 // block4: } else if (b) {
496 // block5: while (!a) {
497 // block6: do_work(&a);
498 // n = 2;
499 // }
500 // }
501 // block7: if (a)
502 // block8: g();
503 // block9: return n;
504 // }
505 //
506 // Starting from the maybe-uninitialized use in block 9:
507 // * Block 7 is not visited because we have only visited one of its two
508 // successors.
509 // * Block 8 is visited because we've visited its only successor.
510 // From block 8:
511 // * Block 7 is visited because we've now visited both of its successors.
512 // From block 7:
513 // * Blocks 1, 2, 4, 5, and 6 are not visited because we didn't visit all
514 // of their successors (we didn't visit 4, 3, 5, 6, and 5, respectively).
515 // * Block 3 is not visited because it initializes 'n'.
516 // Now the algorithm terminates, having visited blocks 7 and 8, and having
517 // found the frontier is blocks 2, 4, and 5.
518 //
519 // 'n' is definitely uninitialized for two edges into block 7 (from blocks 2
520 // and 4), so we report that any time either of those edges is taken (in
521 // each case when 'b == false'), 'n' is used uninitialized.
Dmitri Gribenkocfa88f82013-01-12 19:30:44 +0000522 SmallVector<const CFGBlock*, 32> Queue;
523 SmallVector<unsigned, 32> SuccsVisited(cfg.getNumBlockIDs(), 0);
Richard Smith2815e1a2012-05-25 02:17:09 +0000524 Queue.push_back(block);
525 // Specify that we've already visited all successors of the starting block.
526 // This has the dual purpose of ensuring we never add it to the queue, and
527 // of marking it as not being a candidate element of the frontier.
528 SuccsVisited[block->getBlockID()] = block->succ_size();
529 while (!Queue.empty()) {
530 const CFGBlock *B = Queue.back();
531 Queue.pop_back();
532 for (CFGBlock::const_pred_iterator I = B->pred_begin(), E = B->pred_end();
533 I != E; ++I) {
534 const CFGBlock *Pred = *I;
535 if (vals.getValue(Pred, B, vd) == Initialized)
536 // This block initializes the variable.
537 continue;
538
Richard Smith558e8872012-07-13 23:33:44 +0000539 unsigned &SV = SuccsVisited[Pred->getBlockID()];
540 if (!SV) {
541 // When visiting the first successor of a block, mark all NULL
542 // successors as having been visited.
543 for (CFGBlock::const_succ_iterator SI = Pred->succ_begin(),
544 SE = Pred->succ_end();
545 SI != SE; ++SI)
546 if (!*SI)
547 ++SV;
548 }
549
550 if (++SV == Pred->succ_size())
Richard Smith2815e1a2012-05-25 02:17:09 +0000551 // All paths from this block lead to the use and don't initialize the
552 // variable.
553 Queue.push_back(Pred);
554 }
555 }
556
557 // Scan the frontier, looking for blocks where the variable was
558 // uninitialized.
559 for (CFG::const_iterator BI = cfg.begin(), BE = cfg.end(); BI != BE; ++BI) {
560 const CFGBlock *Block = *BI;
561 unsigned BlockID = Block->getBlockID();
562 const Stmt *Term = Block->getTerminator();
563 if (SuccsVisited[BlockID] && SuccsVisited[BlockID] < Block->succ_size() &&
564 Term) {
565 // This block inevitably leads to the use. If we have an edge from here
566 // to a post-dominator block, and the variable is uninitialized on that
567 // edge, we have found a bug.
568 for (CFGBlock::const_succ_iterator I = Block->succ_begin(),
569 E = Block->succ_end(); I != E; ++I) {
570 const CFGBlock *Succ = *I;
571 if (Succ && SuccsVisited[Succ->getBlockID()] >= Succ->succ_size() &&
572 vals.getValue(Block, Succ, vd) == Uninitialized) {
573 // Switch cases are a special case: report the label to the caller
574 // as the 'terminator', not the switch statement itself. Suppress
575 // situations where no label matched: we can't be sure that's
576 // possible.
577 if (isa<SwitchStmt>(Term)) {
578 const Stmt *Label = Succ->getLabel();
579 if (!Label || !isa<SwitchCase>(Label))
580 // Might not be possible.
581 continue;
582 UninitUse::Branch Branch;
583 Branch.Terminator = Label;
584 Branch.Output = 0; // Ignored.
585 Use.addUninitBranch(Branch);
586 } else {
587 UninitUse::Branch Branch;
588 Branch.Terminator = Term;
589 Branch.Output = I - Block->succ_begin();
590 Use.addUninitBranch(Branch);
591 }
592 }
593 }
594 }
595 }
596
597 return Use;
598 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000599};
600}
601
Richard Smith81891882012-05-24 23:45:35 +0000602void TransferFunctions::reportUse(const Expr *ex, const VarDecl *vd) {
Richard Smith81891882012-05-24 23:45:35 +0000603 Value v = vals[vd];
604 if (isUninitialized(v))
Ted Kremenekeba76a42012-11-17 07:18:30 +0000605 handler.handleUseOfUninitVariable(vd, getUninitUse(ex, vd, v));
Ted Kremenek610068c2011-01-15 02:58:47 +0000606}
607
Richard Smith9532e0d2012-07-17 00:06:14 +0000608void TransferFunctions::VisitObjCForCollectionStmt(ObjCForCollectionStmt *FS) {
Ted Kremenek1ea800c2011-01-27 02:01:31 +0000609 // This represents an initialization of the 'element' value.
Richard Smith9532e0d2012-07-17 00:06:14 +0000610 if (DeclStmt *DS = dyn_cast<DeclStmt>(FS->getElement())) {
611 const VarDecl *VD = cast<VarDecl>(DS->getSingleDecl());
612 if (isTrackedVar(VD))
613 vals[VD] = Initialized;
Ted Kremenek1ea800c2011-01-27 02:01:31 +0000614 }
Ted Kremenek1ea800c2011-01-27 02:01:31 +0000615}
616
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000617void TransferFunctions::VisitBlockExpr(BlockExpr *be) {
Ted Kremenekbc8b44c2011-03-31 22:32:41 +0000618 const BlockDecl *bd = be->getBlockDecl();
619 for (BlockDecl::capture_const_iterator i = bd->capture_begin(),
620 e = bd->capture_end() ; i != e; ++i) {
621 const VarDecl *vd = i->getVariable();
Ted Kremenekbc8b44c2011-03-31 22:32:41 +0000622 if (!isTrackedVar(vd))
623 continue;
624 if (i->isByRef()) {
625 vals[vd] = Initialized;
626 continue;
627 }
Richard Smith81891882012-05-24 23:45:35 +0000628 reportUse(be, vd);
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000629 }
630}
631
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000632void TransferFunctions::VisitCallExpr(CallExpr *ce) {
Ted Kremenek44ca53f2012-09-12 05:53:43 +0000633 if (Decl *Callee = ce->getCalleeDecl()) {
634 if (Callee->hasAttr<ReturnsTwiceAttr>()) {
635 // After a call to a function like setjmp or vfork, any variable which is
636 // initialized anywhere within this function may now be initialized. For
637 // now, just assume such a call initializes all variables. FIXME: Only
638 // mark variables as initialized if they have an initializer which is
639 // reachable from here.
640 vals.setAllScratchValues(Initialized);
641 }
642 else if (Callee->hasAttr<AnalyzerNoReturnAttr>()) {
643 // Functions labeled like "analyzer_noreturn" are often used to denote
644 // "panic" functions that in special debug situations can still return,
645 // but for the most part should not be treated as returning. This is a
646 // useful annotation borrowed from the static analyzer that is useful for
647 // suppressing branch-specific false positives when we call one of these
648 // functions but keep pretending the path continues (when in reality the
649 // user doesn't care).
650 vals.setAllScratchValues(Unknown);
651 }
652 }
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000653}
654
Ted Kremenek0c8e5a02011-07-19 14:18:48 +0000655void TransferFunctions::VisitDeclRefExpr(DeclRefExpr *dr) {
Richard Smith9532e0d2012-07-17 00:06:14 +0000656 switch (classification.get(dr)) {
657 case ClassifyRefs::Ignore:
658 break;
659 case ClassifyRefs::Use:
660 reportUse(dr, cast<VarDecl>(dr->getDecl()));
661 break;
662 case ClassifyRefs::Init:
663 vals[cast<VarDecl>(dr->getDecl())] = Initialized;
664 break;
665 case ClassifyRefs::SelfInit:
Ted Kremenekeba76a42012-11-17 07:18:30 +0000666 handler.handleSelfInit(cast<VarDecl>(dr->getDecl()));
Richard Smith9532e0d2012-07-17 00:06:14 +0000667 break;
668 }
Ted Kremenek0c8e5a02011-07-19 14:18:48 +0000669}
670
Richard Smith9532e0d2012-07-17 00:06:14 +0000671void TransferFunctions::VisitBinaryOperator(BinaryOperator *BO) {
672 if (BO->getOpcode() == BO_Assign) {
673 FindVarResult Var = findVar(BO->getLHS());
674 if (const VarDecl *VD = Var.getDecl())
675 vals[VD] = Initialized;
676 }
677}
678
679void TransferFunctions::VisitDeclStmt(DeclStmt *DS) {
680 for (DeclStmt::decl_iterator DI = DS->decl_begin(), DE = DS->decl_end();
Ted Kremenek610068c2011-01-15 02:58:47 +0000681 DI != DE; ++DI) {
Richard Smith9532e0d2012-07-17 00:06:14 +0000682 VarDecl *VD = dyn_cast<VarDecl>(*DI);
683 if (VD && isTrackedVar(VD)) {
684 if (getSelfInitExpr(VD)) {
685 // If the initializer consists solely of a reference to itself, we
686 // explicitly mark the variable as uninitialized. This allows code
687 // like the following:
688 //
689 // int x = x;
690 //
691 // to deliberately leave a variable uninitialized. Different analysis
692 // clients can detect this pattern and adjust their reporting
693 // appropriately, but we need to continue to analyze subsequent uses
694 // of the variable.
695 vals[VD] = Uninitialized;
696 } else if (VD->getInit()) {
697 // Treat the new variable as initialized.
698 vals[VD] = Initialized;
699 } else {
700 // No initializer: the variable is now uninitialized. This matters
701 // for cases like:
702 // while (...) {
703 // int n;
704 // use(n);
705 // n = 0;
706 // }
707 // FIXME: Mark the variable as uninitialized whenever its scope is
708 // left, since its scope could be re-entered by a jump over the
709 // declaration.
710 vals[VD] = Uninitialized;
Ted Kremenekc21fed32011-01-18 21:18:58 +0000711 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000712 }
713 }
714}
715
Ted Kremenek25c1d572012-09-13 00:21:35 +0000716void TransferFunctions::VisitObjCMessageExpr(ObjCMessageExpr *ME) {
717 // If the Objective-C message expression is an implicit no-return that
718 // is not modeled in the CFG, set the tracked dataflow values to Unknown.
719 if (objCNoRet.isImplicitNoReturn(ME)) {
720 vals.setAllScratchValues(Unknown);
721 }
722}
723
Ted Kremenek610068c2011-01-15 02:58:47 +0000724//------------------------------------------------------------------------====//
725// High-level "driver" logic for uninitialized values analysis.
726//====------------------------------------------------------------------------//
727
Ted Kremenek13bd4232011-01-20 17:37:17 +0000728static bool runOnBlock(const CFGBlock *block, const CFG &cfg,
Ted Kremenek1d26f482011-10-24 01:32:45 +0000729 AnalysisDeclContext &ac, CFGBlockValues &vals,
Richard Smith9532e0d2012-07-17 00:06:14 +0000730 const ClassifyRefs &classification,
Ted Kremenekf8adeef2011-04-04 20:30:58 +0000731 llvm::BitVector &wasAnalyzed,
Ted Kremenekeba76a42012-11-17 07:18:30 +0000732 UninitVariablesHandler &handler) {
Ted Kremenekf8adeef2011-04-04 20:30:58 +0000733 wasAnalyzed[block->getBlockID()] = true;
Ted Kremenek610068c2011-01-15 02:58:47 +0000734 vals.resetScratch();
Ted Kremenekeee18c32012-07-19 04:59:05 +0000735 // Merge in values of predecessor blocks.
Ted Kremenek610068c2011-01-15 02:58:47 +0000736 bool isFirst = true;
737 for (CFGBlock::const_pred_iterator I = block->pred_begin(),
738 E = block->pred_end(); I != E; ++I) {
Ted Kremenek6f275422011-09-02 19:39:26 +0000739 const CFGBlock *pred = *I;
740 if (wasAnalyzed[pred->getBlockID()]) {
Ted Kremenekeee18c32012-07-19 04:59:05 +0000741 vals.mergeIntoScratch(vals.getValueVector(pred), isFirst);
Ted Kremenek6f275422011-09-02 19:39:26 +0000742 isFirst = false;
743 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000744 }
745 // Apply the transfer function.
Richard Smith9532e0d2012-07-17 00:06:14 +0000746 TransferFunctions tf(vals, cfg, block, ac, classification, handler);
Ted Kremenek610068c2011-01-15 02:58:47 +0000747 for (CFGBlock::const_iterator I = block->begin(), E = block->end();
748 I != E; ++I) {
David Blaikieb0780542013-02-23 00:29:34 +0000749 if (Optional<CFGStmt> cs = I->getAs<CFGStmt>())
750 tf.Visit(const_cast<Stmt*>(cs->getStmt()));
Ted Kremenek610068c2011-01-15 02:58:47 +0000751 }
Ted Kremenek136f8f22011-03-15 04:57:27 +0000752 return vals.updateValueVectorWithScratch(block);
Ted Kremenek610068c2011-01-15 02:58:47 +0000753}
754
Ted Kremenekeba76a42012-11-17 07:18:30 +0000755/// PruneBlocksHandler is a special UninitVariablesHandler that is used
756/// to detect when a CFGBlock has any *potential* use of an uninitialized
757/// variable. It is mainly used to prune out work during the final
758/// reporting pass.
759namespace {
760struct PruneBlocksHandler : public UninitVariablesHandler {
761 PruneBlocksHandler(unsigned numBlocks)
762 : hadUse(numBlocks, false), hadAnyUse(false),
763 currentBlock(0) {}
764
765 virtual ~PruneBlocksHandler() {}
766
767 /// Records if a CFGBlock had a potential use of an uninitialized variable.
768 llvm::BitVector hadUse;
769
770 /// Records if any CFGBlock had a potential use of an uninitialized variable.
771 bool hadAnyUse;
772
773 /// The current block to scribble use information.
774 unsigned currentBlock;
775
776 virtual void handleUseOfUninitVariable(const VarDecl *vd,
777 const UninitUse &use) {
778 hadUse[currentBlock] = true;
779 hadAnyUse = true;
780 }
781
782 /// Called when the uninitialized variable analysis detects the
783 /// idiom 'int x = x'. All other uses of 'x' within the initializer
784 /// are handled by handleUseOfUninitVariable.
785 virtual void handleSelfInit(const VarDecl *vd) {
786 hadUse[currentBlock] = true;
787 hadAnyUse = true;
788 }
789};
790}
791
Chandler Carruth5d989942011-07-06 16:21:37 +0000792void clang::runUninitializedVariablesAnalysis(
793 const DeclContext &dc,
794 const CFG &cfg,
Ted Kremenek1d26f482011-10-24 01:32:45 +0000795 AnalysisDeclContext &ac,
Chandler Carruth5d989942011-07-06 16:21:37 +0000796 UninitVariablesHandler &handler,
797 UninitVariablesAnalysisStats &stats) {
Ted Kremenek610068c2011-01-15 02:58:47 +0000798 CFGBlockValues vals(cfg);
799 vals.computeSetOfDeclarations(dc);
800 if (vals.hasNoDeclarations())
801 return;
Ted Kremenekd40066b2011-04-04 23:29:12 +0000802
Chandler Carruth5d989942011-07-06 16:21:37 +0000803 stats.NumVariablesAnalyzed = vals.getNumEntries();
804
Richard Smith9532e0d2012-07-17 00:06:14 +0000805 // Precompute which expressions are uses and which are initializations.
806 ClassifyRefs classification(ac);
807 cfg.VisitBlockStmts(classification);
808
Ted Kremenekd40066b2011-04-04 23:29:12 +0000809 // Mark all variables uninitialized at the entry.
810 const CFGBlock &entry = cfg.getEntry();
Ted Kremenekeee18c32012-07-19 04:59:05 +0000811 ValueVector &vec = vals.getValueVector(&entry);
812 const unsigned n = vals.getNumEntries();
813 for (unsigned j = 0; j < n ; ++j) {
814 vec[j] = Uninitialized;
Ted Kremenekd40066b2011-04-04 23:29:12 +0000815 }
816
817 // Proceed with the workist.
Ted Kremenekc1602582012-11-17 02:00:00 +0000818 DataflowWorklist worklist(cfg, *ac.getAnalysis<PostOrderCFGView>());
Ted Kremenek496398d2011-03-15 04:57:32 +0000819 llvm::BitVector previouslyVisited(cfg.getNumBlockIDs());
Ted Kremenek610068c2011-01-15 02:58:47 +0000820 worklist.enqueueSuccessors(&cfg.getEntry());
Ted Kremenekf8adeef2011-04-04 20:30:58 +0000821 llvm::BitVector wasAnalyzed(cfg.getNumBlockIDs(), false);
Ted Kremenek6f275422011-09-02 19:39:26 +0000822 wasAnalyzed[cfg.getEntry().getBlockID()] = true;
Ted Kremenekeba76a42012-11-17 07:18:30 +0000823 PruneBlocksHandler PBH(cfg.getNumBlockIDs());
Ted Kremenek610068c2011-01-15 02:58:47 +0000824
825 while (const CFGBlock *block = worklist.dequeue()) {
Ted Kremenekeba76a42012-11-17 07:18:30 +0000826 PBH.currentBlock = block->getBlockID();
827
Ted Kremenek610068c2011-01-15 02:58:47 +0000828 // Did the block change?
Richard Smith9532e0d2012-07-17 00:06:14 +0000829 bool changed = runOnBlock(block, cfg, ac, vals,
Ted Kremenekeba76a42012-11-17 07:18:30 +0000830 classification, wasAnalyzed, PBH);
Chandler Carruth5d989942011-07-06 16:21:37 +0000831 ++stats.NumBlockVisits;
Ted Kremenek610068c2011-01-15 02:58:47 +0000832 if (changed || !previouslyVisited[block->getBlockID()])
833 worklist.enqueueSuccessors(block);
834 previouslyVisited[block->getBlockID()] = true;
835 }
Ted Kremenekeba76a42012-11-17 07:18:30 +0000836
837 if (!PBH.hadAnyUse)
838 return;
839
Enea Zaffanella67d472c2013-01-11 11:37:08 +0000840 // Run through the blocks one more time, and report uninitialized variables.
Ted Kremenek610068c2011-01-15 02:58:47 +0000841 for (CFG::const_iterator BI = cfg.begin(), BE = cfg.end(); BI != BE; ++BI) {
Ted Kremenek6f275422011-09-02 19:39:26 +0000842 const CFGBlock *block = *BI;
Ted Kremenekeba76a42012-11-17 07:18:30 +0000843 if (PBH.hadUse[block->getBlockID()]) {
844 runOnBlock(block, cfg, ac, vals, classification, wasAnalyzed, handler);
Chandler Carruth5d989942011-07-06 16:21:37 +0000845 ++stats.NumBlockVisits;
846 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000847 }
848}
849
850UninitVariablesHandler::~UninitVariablesHandler() {}