blob: 47f2cf67c8e6d3b7c767e70858363b71ca115bcb [file] [log] [blame]
Ted Kremenek6f342132011-03-15 03:17:07 +00001//==- UninitializedValues.cpp - Find Uninitialized Values -------*- C++ --*-==//
Ted Kremenek610068c2011-01-15 02:58:47 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements uninitialized values analysis for source-level CFGs.
11//
12//===----------------------------------------------------------------------===//
13
Ted Kremenek13bd4232011-01-20 17:37:17 +000014#include <utility>
Ted Kremenek610068c2011-01-15 02:58:47 +000015#include "llvm/ADT/Optional.h"
16#include "llvm/ADT/SmallVector.h"
Argyrios Kyrtzidis049f6d02011-05-31 03:56:09 +000017#include "llvm/ADT/PackedVector.h"
Ted Kremenek610068c2011-01-15 02:58:47 +000018#include "llvm/ADT/DenseMap.h"
Richard Smith558e8872012-07-13 23:33:44 +000019#include "clang/AST/ASTContext.h"
Ted Kremenek610068c2011-01-15 02:58:47 +000020#include "clang/AST/Decl.h"
21#include "clang/Analysis/CFG.h"
Ted Kremeneka8c17a52011-01-25 19:13:48 +000022#include "clang/Analysis/AnalysisContext.h"
Ted Kremenek610068c2011-01-15 02:58:47 +000023#include "clang/Analysis/Visitors/CFGRecStmtDeclVisitor.h"
Ted Kremenek6f342132011-03-15 03:17:07 +000024#include "clang/Analysis/Analyses/UninitializedValues.h"
Argyrios Kyrtzidisb2c60b02012-03-01 19:45:56 +000025#include "llvm/Support/SaveAndRestore.h"
Ted Kremenek610068c2011-01-15 02:58:47 +000026
27using namespace clang;
28
Richard Smith558e8872012-07-13 23:33:44 +000029#define DEBUG_LOGGING 0
30
Ted Kremenek40900ee2011-01-27 02:29:34 +000031static bool isTrackedVar(const VarDecl *vd, const DeclContext *dc) {
Ted Kremenek1cbc3152011-03-17 03:06:11 +000032 if (vd->isLocalVarDecl() && !vd->hasGlobalStorage() &&
Ted Kremeneka21612f2011-04-07 20:02:56 +000033 !vd->isExceptionVariable() &&
Ted Kremenek1cbc3152011-03-17 03:06:11 +000034 vd->getDeclContext() == dc) {
35 QualType ty = vd->getType();
36 return ty->isScalarType() || ty->isVectorType();
37 }
38 return false;
Ted Kremenekc104e532011-01-18 04:53:25 +000039}
40
Ted Kremenek610068c2011-01-15 02:58:47 +000041//------------------------------------------------------------------------====//
Ted Kremenek136f8f22011-03-15 04:57:27 +000042// DeclToIndex: a mapping from Decls we track to value indices.
Ted Kremenek610068c2011-01-15 02:58:47 +000043//====------------------------------------------------------------------------//
44
45namespace {
Ted Kremenek136f8f22011-03-15 04:57:27 +000046class DeclToIndex {
Ted Kremenek610068c2011-01-15 02:58:47 +000047 llvm::DenseMap<const VarDecl *, unsigned> map;
48public:
Ted Kremenek136f8f22011-03-15 04:57:27 +000049 DeclToIndex() {}
Ted Kremenek610068c2011-01-15 02:58:47 +000050
51 /// Compute the actual mapping from declarations to bits.
52 void computeMap(const DeclContext &dc);
53
54 /// Return the number of declarations in the map.
55 unsigned size() const { return map.size(); }
56
57 /// Returns the bit vector index for a given declaration.
Ted Kremenekb831c672011-03-29 01:40:00 +000058 llvm::Optional<unsigned> getValueIndex(const VarDecl *d) const;
Ted Kremenek610068c2011-01-15 02:58:47 +000059};
60}
61
Ted Kremenek136f8f22011-03-15 04:57:27 +000062void DeclToIndex::computeMap(const DeclContext &dc) {
Ted Kremenek610068c2011-01-15 02:58:47 +000063 unsigned count = 0;
64 DeclContext::specific_decl_iterator<VarDecl> I(dc.decls_begin()),
65 E(dc.decls_end());
66 for ( ; I != E; ++I) {
David Blaikie581deb32012-06-06 20:45:41 +000067 const VarDecl *vd = *I;
Ted Kremenek40900ee2011-01-27 02:29:34 +000068 if (isTrackedVar(vd, &dc))
Ted Kremenek610068c2011-01-15 02:58:47 +000069 map[vd] = count++;
70 }
71}
72
Ted Kremenekb831c672011-03-29 01:40:00 +000073llvm::Optional<unsigned> DeclToIndex::getValueIndex(const VarDecl *d) const {
74 llvm::DenseMap<const VarDecl *, unsigned>::const_iterator I = map.find(d);
Ted Kremenek610068c2011-01-15 02:58:47 +000075 if (I == map.end())
76 return llvm::Optional<unsigned>();
77 return I->second;
78}
79
80//------------------------------------------------------------------------====//
81// CFGBlockValues: dataflow values for CFG blocks.
82//====------------------------------------------------------------------------//
83
Ted Kremenekf7bafc72011-03-15 04:57:38 +000084// These values are defined in such a way that a merge can be done using
85// a bitwise OR.
86enum Value { Unknown = 0x0, /* 00 */
87 Initialized = 0x1, /* 01 */
88 Uninitialized = 0x2, /* 10 */
89 MayUninitialized = 0x3 /* 11 */ };
90
91static bool isUninitialized(const Value v) {
92 return v >= Uninitialized;
93}
94static bool isAlwaysUninit(const Value v) {
95 return v == Uninitialized;
96}
Ted Kremenekafb10c42011-03-15 04:57:29 +000097
Benjamin Kramerda57f3e2011-03-26 12:38:21 +000098namespace {
Ted Kremenek496398d2011-03-15 04:57:32 +000099
Argyrios Kyrtzidis049f6d02011-05-31 03:56:09 +0000100typedef llvm::PackedVector<Value, 2> ValueVector;
Ted Kremenek13bd4232011-01-20 17:37:17 +0000101
Ted Kremenek610068c2011-01-15 02:58:47 +0000102class CFGBlockValues {
103 const CFG &cfg;
Ted Kremenekeee18c32012-07-19 04:59:05 +0000104 std::vector<ValueVector*> vals;
Ted Kremenek136f8f22011-03-15 04:57:27 +0000105 ValueVector scratch;
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000106 DeclToIndex declToIndex;
Ted Kremenek610068c2011-01-15 02:58:47 +0000107public:
108 CFGBlockValues(const CFG &cfg);
109 ~CFGBlockValues();
Ted Kremenekeee18c32012-07-19 04:59:05 +0000110
Ted Kremenekd40066b2011-04-04 23:29:12 +0000111 unsigned getNumEntries() const { return declToIndex.size(); }
112
Ted Kremenek610068c2011-01-15 02:58:47 +0000113 void computeSetOfDeclarations(const DeclContext &dc);
Ted Kremenekeee18c32012-07-19 04:59:05 +0000114 ValueVector &getValueVector(const CFGBlock *block) {
115 return *vals[block->getBlockID()];
116 }
Ted Kremenek13bd4232011-01-20 17:37:17 +0000117
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000118 void setAllScratchValues(Value V);
Ted Kremenek136f8f22011-03-15 04:57:27 +0000119 void mergeIntoScratch(ValueVector const &source, bool isFirst);
120 bool updateValueVectorWithScratch(const CFGBlock *block);
Ted Kremenek610068c2011-01-15 02:58:47 +0000121
122 bool hasNoDeclarations() const {
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000123 return declToIndex.size() == 0;
Ted Kremenek610068c2011-01-15 02:58:47 +0000124 }
Ted Kremeneke0e29332011-08-20 01:15:28 +0000125
Ted Kremenek610068c2011-01-15 02:58:47 +0000126 void resetScratch();
Ted Kremenek13bd4232011-01-20 17:37:17 +0000127
Ted Kremenek136f8f22011-03-15 04:57:27 +0000128 ValueVector::reference operator[](const VarDecl *vd);
Richard Smith2815e1a2012-05-25 02:17:09 +0000129
130 Value getValue(const CFGBlock *block, const CFGBlock *dstBlock,
131 const VarDecl *vd) {
132 const llvm::Optional<unsigned> &idx = declToIndex.getValueIndex(vd);
133 assert(idx.hasValue());
Ted Kremenekeee18c32012-07-19 04:59:05 +0000134 return getValueVector(block)[idx.getValue()];
Richard Smith2815e1a2012-05-25 02:17:09 +0000135 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000136};
Benjamin Kramerda57f3e2011-03-26 12:38:21 +0000137} // end anonymous namespace
Ted Kremenek610068c2011-01-15 02:58:47 +0000138
Ted Kremenekeee18c32012-07-19 04:59:05 +0000139CFGBlockValues::CFGBlockValues(const CFG &c) : cfg(c), vals(0) {}
Ted Kremenek610068c2011-01-15 02:58:47 +0000140
141CFGBlockValues::~CFGBlockValues() {
Ted Kremenekeee18c32012-07-19 04:59:05 +0000142 for (std::vector<ValueVector*>::iterator I = vals.begin(), E = vals.end();
143 I != E; ++I)
144 delete *I;
Ted Kremenek610068c2011-01-15 02:58:47 +0000145}
146
147void CFGBlockValues::computeSetOfDeclarations(const DeclContext &dc) {
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000148 declToIndex.computeMap(dc);
Ted Kremenekeee18c32012-07-19 04:59:05 +0000149 unsigned decls = declToIndex.size();
150 scratch.resize(decls);
151 unsigned n = cfg.getNumBlockIDs();
152 if (!n)
153 return;
154 vals.resize(n);
155 for (unsigned i = 0; i < n; ++i)
156 vals[i] = new ValueVector(decls);
Ted Kremenek13bd4232011-01-20 17:37:17 +0000157}
158
Richard Smith558e8872012-07-13 23:33:44 +0000159#if DEBUG_LOGGING
Ted Kremenek136f8f22011-03-15 04:57:27 +0000160static void printVector(const CFGBlock *block, ValueVector &bv,
Ted Kremenek9fcbcee2011-02-01 17:43:18 +0000161 unsigned num) {
Ted Kremenek9fcbcee2011-02-01 17:43:18 +0000162 llvm::errs() << block->getBlockID() << " :";
163 for (unsigned i = 0; i < bv.size(); ++i) {
164 llvm::errs() << ' ' << bv[i];
165 }
166 llvm::errs() << " : " << num << '\n';
167}
168#endif
Ted Kremenek610068c2011-01-15 02:58:47 +0000169
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000170void CFGBlockValues::setAllScratchValues(Value V) {
171 for (unsigned I = 0, E = scratch.size(); I != E; ++I)
172 scratch[I] = V;
173}
174
Ted Kremenekc5f740e2011-10-07 00:42:48 +0000175void CFGBlockValues::mergeIntoScratch(ValueVector const &source,
176 bool isFirst) {
177 if (isFirst)
178 scratch = source;
179 else
180 scratch |= source;
181}
182
Ted Kremenek136f8f22011-03-15 04:57:27 +0000183bool CFGBlockValues::updateValueVectorWithScratch(const CFGBlock *block) {
Ted Kremenekeee18c32012-07-19 04:59:05 +0000184 ValueVector &dst = getValueVector(block);
Ted Kremenek610068c2011-01-15 02:58:47 +0000185 bool changed = (dst != scratch);
186 if (changed)
187 dst = scratch;
Richard Smith558e8872012-07-13 23:33:44 +0000188#if DEBUG_LOGGING
Ted Kremenek9fcbcee2011-02-01 17:43:18 +0000189 printVector(block, scratch, 0);
190#endif
Ted Kremenek13bd4232011-01-20 17:37:17 +0000191 return changed;
192}
193
Ted Kremenek610068c2011-01-15 02:58:47 +0000194void CFGBlockValues::resetScratch() {
195 scratch.reset();
196}
197
Ted Kremenek136f8f22011-03-15 04:57:27 +0000198ValueVector::reference CFGBlockValues::operator[](const VarDecl *vd) {
Ted Kremenek4ddb3872011-03-15 05:30:12 +0000199 const llvm::Optional<unsigned> &idx = declToIndex.getValueIndex(vd);
Ted Kremenek610068c2011-01-15 02:58:47 +0000200 assert(idx.hasValue());
201 return scratch[idx.getValue()];
202}
203
204//------------------------------------------------------------------------====//
205// Worklist: worklist for dataflow analysis.
206//====------------------------------------------------------------------------//
207
208namespace {
209class DataflowWorklist {
Chris Lattner5f9e2722011-07-23 10:55:15 +0000210 SmallVector<const CFGBlock *, 20> worklist;
Ted Kremenek496398d2011-03-15 04:57:32 +0000211 llvm::BitVector enqueuedBlocks;
Ted Kremenek610068c2011-01-15 02:58:47 +0000212public:
213 DataflowWorklist(const CFG &cfg) : enqueuedBlocks(cfg.getNumBlockIDs()) {}
214
Ted Kremenek610068c2011-01-15 02:58:47 +0000215 void enqueueSuccessors(const CFGBlock *block);
216 const CFGBlock *dequeue();
Ted Kremenek610068c2011-01-15 02:58:47 +0000217};
218}
219
Ted Kremenek610068c2011-01-15 02:58:47 +0000220void DataflowWorklist::enqueueSuccessors(const clang::CFGBlock *block) {
Chandler Carruth80520502011-07-08 11:19:06 +0000221 unsigned OldWorklistSize = worklist.size();
Ted Kremenek610068c2011-01-15 02:58:47 +0000222 for (CFGBlock::const_succ_iterator I = block->succ_begin(),
223 E = block->succ_end(); I != E; ++I) {
Chandler Carruth80520502011-07-08 11:19:06 +0000224 const CFGBlock *Successor = *I;
225 if (!Successor || enqueuedBlocks[Successor->getBlockID()])
226 continue;
227 worklist.push_back(Successor);
228 enqueuedBlocks[Successor->getBlockID()] = true;
Ted Kremenek610068c2011-01-15 02:58:47 +0000229 }
Chandler Carruth80520502011-07-08 11:19:06 +0000230 if (OldWorklistSize == 0 || OldWorklistSize == worklist.size())
231 return;
232
233 // Rotate the newly added blocks to the start of the worklist so that it forms
234 // a proper queue when we pop off the end of the worklist.
235 std::rotate(worklist.begin(), worklist.begin() + OldWorklistSize,
236 worklist.end());
Ted Kremenek610068c2011-01-15 02:58:47 +0000237}
238
239const CFGBlock *DataflowWorklist::dequeue() {
240 if (worklist.empty())
241 return 0;
242 const CFGBlock *b = worklist.back();
243 worklist.pop_back();
244 enqueuedBlocks[b->getBlockID()] = false;
245 return b;
246}
247
248//------------------------------------------------------------------------====//
Richard Smith9532e0d2012-07-17 00:06:14 +0000249// Classification of DeclRefExprs as use or initialization.
Ted Kremenek610068c2011-01-15 02:58:47 +0000250//====------------------------------------------------------------------------//
251
Ted Kremenek610068c2011-01-15 02:58:47 +0000252namespace {
253class FindVarResult {
254 const VarDecl *vd;
255 const DeclRefExpr *dr;
256public:
Richard Smith9532e0d2012-07-17 00:06:14 +0000257 FindVarResult(const VarDecl *vd, const DeclRefExpr *dr) : vd(vd), dr(dr) {}
258
Ted Kremenek610068c2011-01-15 02:58:47 +0000259 const DeclRefExpr *getDeclRefExpr() const { return dr; }
260 const VarDecl *getDecl() const { return vd; }
261};
Richard Smith9532e0d2012-07-17 00:06:14 +0000262
263static const Expr *stripCasts(ASTContext &C, const Expr *Ex) {
264 while (Ex) {
265 Ex = Ex->IgnoreParenNoopCasts(C);
266 if (const CastExpr *CE = dyn_cast<CastExpr>(Ex)) {
267 if (CE->getCastKind() == CK_LValueBitCast) {
268 Ex = CE->getSubExpr();
269 continue;
270 }
271 }
272 break;
273 }
274 return Ex;
275}
276
277/// If E is an expression comprising a reference to a single variable, find that
278/// variable.
279static FindVarResult findVar(const Expr *E, const DeclContext *DC) {
280 if (const DeclRefExpr *DRE =
281 dyn_cast<DeclRefExpr>(stripCasts(DC->getParentASTContext(), E)))
282 if (const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl()))
283 if (isTrackedVar(VD, DC))
284 return FindVarResult(VD, DRE);
285 return FindVarResult(0, 0);
286}
287
288/// \brief Classify each DeclRefExpr as an initialization or a use. Any
289/// DeclRefExpr which isn't explicitly classified will be assumed to have
290/// escaped the analysis and will be treated as an initialization.
291class ClassifyRefs : public StmtVisitor<ClassifyRefs> {
292public:
293 enum Class {
294 Init,
295 Use,
296 SelfInit,
297 Ignore
298 };
299
300private:
301 const DeclContext *DC;
302 llvm::DenseMap<const DeclRefExpr*, Class> Classification;
303
304 bool isTrackedVar(const VarDecl *VD) const {
305 return ::isTrackedVar(VD, DC);
306 }
307
308 void classify(const Expr *E, Class C);
309
310public:
311 ClassifyRefs(AnalysisDeclContext &AC) : DC(cast<DeclContext>(AC.getDecl())) {}
312
313 void VisitDeclStmt(DeclStmt *DS);
314 void VisitUnaryOperator(UnaryOperator *UO);
315 void VisitBinaryOperator(BinaryOperator *BO);
316 void VisitCallExpr(CallExpr *CE);
317 void VisitCastExpr(CastExpr *CE);
318
319 void operator()(Stmt *S) { Visit(S); }
320
321 Class get(const DeclRefExpr *DRE) const {
322 llvm::DenseMap<const DeclRefExpr*, Class>::const_iterator I
323 = Classification.find(DRE);
324 if (I != Classification.end())
325 return I->second;
326
327 const VarDecl *VD = dyn_cast<VarDecl>(DRE->getDecl());
328 if (!VD || !isTrackedVar(VD))
329 return Ignore;
330
331 return Init;
332 }
333};
334}
335
336static const DeclRefExpr *getSelfInitExpr(VarDecl *VD) {
337 if (Expr *Init = VD->getInit()) {
338 const DeclRefExpr *DRE
339 = dyn_cast<DeclRefExpr>(stripCasts(VD->getASTContext(), Init));
340 if (DRE && DRE->getDecl() == VD)
341 return DRE;
342 }
343 return 0;
344}
345
346void ClassifyRefs::classify(const Expr *E, Class C) {
347 FindVarResult Var = findVar(E, DC);
348 if (const DeclRefExpr *DRE = Var.getDeclRefExpr())
349 Classification[DRE] = std::max(Classification[DRE], C);
350}
351
352void ClassifyRefs::VisitDeclStmt(DeclStmt *DS) {
353 for (DeclStmt::decl_iterator DI = DS->decl_begin(), DE = DS->decl_end();
354 DI != DE; ++DI) {
355 VarDecl *VD = dyn_cast<VarDecl>(*DI);
356 if (VD && isTrackedVar(VD))
357 if (const DeclRefExpr *DRE = getSelfInitExpr(VD))
358 Classification[DRE] = SelfInit;
359 }
360}
361
362void ClassifyRefs::VisitBinaryOperator(BinaryOperator *BO) {
363 // Ignore the evaluation of a DeclRefExpr on the LHS of an assignment. If this
364 // is not a compound-assignment, we will treat it as initializing the variable
365 // when TransferFunctions visits it. A compound-assignment does not affect
366 // whether a variable is uninitialized, and there's no point counting it as a
367 // use.
Richard Smith6cfa78f2012-07-17 01:27:33 +0000368 if (BO->isCompoundAssignmentOp())
369 classify(BO->getLHS(), Use);
370 else if (BO->getOpcode() == BO_Assign)
Richard Smith9532e0d2012-07-17 00:06:14 +0000371 classify(BO->getLHS(), Ignore);
372}
373
374void ClassifyRefs::VisitUnaryOperator(UnaryOperator *UO) {
375 // Increment and decrement are uses despite there being no lvalue-to-rvalue
376 // conversion.
377 if (UO->isIncrementDecrementOp())
378 classify(UO->getSubExpr(), Use);
379}
380
381void ClassifyRefs::VisitCallExpr(CallExpr *CE) {
382 // If a value is passed by const reference to a function, we should not assume
383 // that it is initialized by the call, and we conservatively do not assume
384 // that it is used.
385 for (CallExpr::arg_iterator I = CE->arg_begin(), E = CE->arg_end();
386 I != E; ++I)
387 if ((*I)->getType().isConstQualified() && (*I)->isGLValue())
388 classify(*I, Ignore);
389}
390
391void ClassifyRefs::VisitCastExpr(CastExpr *CE) {
392 if (CE->getCastKind() == CK_LValueToRValue)
393 classify(CE->getSubExpr(), Use);
394 else if (CStyleCastExpr *CSE = dyn_cast<CStyleCastExpr>(CE)) {
395 if (CSE->getType()->isVoidType()) {
396 // Squelch any detected load of an uninitialized value if
397 // we cast it to void.
398 // e.g. (void) x;
399 classify(CSE->getSubExpr(), Ignore);
400 }
401 }
402}
403
404//------------------------------------------------------------------------====//
405// Transfer function for uninitialized values analysis.
406//====------------------------------------------------------------------------//
407
408namespace {
Ted Kremenek0c8e5a02011-07-19 14:18:48 +0000409class TransferFunctions : public StmtVisitor<TransferFunctions> {
Ted Kremenek610068c2011-01-15 02:58:47 +0000410 CFGBlockValues &vals;
411 const CFG &cfg;
Richard Smith2815e1a2012-05-25 02:17:09 +0000412 const CFGBlock *block;
Ted Kremenek1d26f482011-10-24 01:32:45 +0000413 AnalysisDeclContext &ac;
Richard Smith9532e0d2012-07-17 00:06:14 +0000414 const ClassifyRefs &classification;
Ted Kremenek610068c2011-01-15 02:58:47 +0000415 UninitVariablesHandler *handler;
Richard Smith9532e0d2012-07-17 00:06:14 +0000416
Ted Kremenek610068c2011-01-15 02:58:47 +0000417public:
418 TransferFunctions(CFGBlockValues &vals, const CFG &cfg,
Richard Smith2815e1a2012-05-25 02:17:09 +0000419 const CFGBlock *block, AnalysisDeclContext &ac,
Richard Smith9532e0d2012-07-17 00:06:14 +0000420 const ClassifyRefs &classification,
Ted Kremenek6f275422011-09-02 19:39:26 +0000421 UninitVariablesHandler *handler)
Richard Smith9532e0d2012-07-17 00:06:14 +0000422 : vals(vals), cfg(cfg), block(block), ac(ac),
423 classification(classification), handler(handler) {}
424
Richard Smith81891882012-05-24 23:45:35 +0000425 void reportUse(const Expr *ex, const VarDecl *vd);
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000426
Richard Smith9532e0d2012-07-17 00:06:14 +0000427 void VisitObjCForCollectionStmt(ObjCForCollectionStmt *FS);
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000428 void VisitBlockExpr(BlockExpr *be);
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000429 void VisitCallExpr(CallExpr *ce);
Ted Kremenek610068c2011-01-15 02:58:47 +0000430 void VisitDeclStmt(DeclStmt *ds);
Ted Kremenekc21fed32011-01-18 21:18:58 +0000431 void VisitDeclRefExpr(DeclRefExpr *dr);
Ted Kremenek610068c2011-01-15 02:58:47 +0000432 void VisitBinaryOperator(BinaryOperator *bo);
Richard Smith2815e1a2012-05-25 02:17:09 +0000433
Ted Kremenek40900ee2011-01-27 02:29:34 +0000434 bool isTrackedVar(const VarDecl *vd) {
435 return ::isTrackedVar(vd, cast<DeclContext>(ac.getDecl()));
436 }
Richard Smith2815e1a2012-05-25 02:17:09 +0000437
Richard Smith9532e0d2012-07-17 00:06:14 +0000438 FindVarResult findVar(const Expr *ex) {
439 return ::findVar(ex, cast<DeclContext>(ac.getDecl()));
440 }
441
Richard Smith2815e1a2012-05-25 02:17:09 +0000442 UninitUse getUninitUse(const Expr *ex, const VarDecl *vd, Value v) {
443 UninitUse Use(ex, isAlwaysUninit(v));
444
445 assert(isUninitialized(v));
446 if (Use.getKind() == UninitUse::Always)
447 return Use;
448
449 // If an edge which leads unconditionally to this use did not initialize
450 // the variable, we can say something stronger than 'may be uninitialized':
451 // we can say 'either it's used uninitialized or you have dead code'.
452 //
453 // We track the number of successors of a node which have been visited, and
454 // visit a node once we have visited all of its successors. Only edges where
455 // the variable might still be uninitialized are followed. Since a variable
456 // can't transfer from being initialized to being uninitialized, this will
457 // trace out the subgraph which inevitably leads to the use and does not
458 // initialize the variable. We do not want to skip past loops, since their
459 // non-termination might be correlated with the initialization condition.
460 //
461 // For example:
462 //
463 // void f(bool a, bool b) {
464 // block1: int n;
465 // if (a) {
466 // block2: if (b)
467 // block3: n = 1;
468 // block4: } else if (b) {
469 // block5: while (!a) {
470 // block6: do_work(&a);
471 // n = 2;
472 // }
473 // }
474 // block7: if (a)
475 // block8: g();
476 // block9: return n;
477 // }
478 //
479 // Starting from the maybe-uninitialized use in block 9:
480 // * Block 7 is not visited because we have only visited one of its two
481 // successors.
482 // * Block 8 is visited because we've visited its only successor.
483 // From block 8:
484 // * Block 7 is visited because we've now visited both of its successors.
485 // From block 7:
486 // * Blocks 1, 2, 4, 5, and 6 are not visited because we didn't visit all
487 // of their successors (we didn't visit 4, 3, 5, 6, and 5, respectively).
488 // * Block 3 is not visited because it initializes 'n'.
489 // Now the algorithm terminates, having visited blocks 7 and 8, and having
490 // found the frontier is blocks 2, 4, and 5.
491 //
492 // 'n' is definitely uninitialized for two edges into block 7 (from blocks 2
493 // and 4), so we report that any time either of those edges is taken (in
494 // each case when 'b == false'), 'n' is used uninitialized.
495 llvm::SmallVector<const CFGBlock*, 32> Queue;
496 llvm::SmallVector<unsigned, 32> SuccsVisited(cfg.getNumBlockIDs(), 0);
497 Queue.push_back(block);
498 // Specify that we've already visited all successors of the starting block.
499 // This has the dual purpose of ensuring we never add it to the queue, and
500 // of marking it as not being a candidate element of the frontier.
501 SuccsVisited[block->getBlockID()] = block->succ_size();
502 while (!Queue.empty()) {
503 const CFGBlock *B = Queue.back();
504 Queue.pop_back();
505 for (CFGBlock::const_pred_iterator I = B->pred_begin(), E = B->pred_end();
506 I != E; ++I) {
507 const CFGBlock *Pred = *I;
508 if (vals.getValue(Pred, B, vd) == Initialized)
509 // This block initializes the variable.
510 continue;
511
Richard Smith558e8872012-07-13 23:33:44 +0000512 unsigned &SV = SuccsVisited[Pred->getBlockID()];
513 if (!SV) {
514 // When visiting the first successor of a block, mark all NULL
515 // successors as having been visited.
516 for (CFGBlock::const_succ_iterator SI = Pred->succ_begin(),
517 SE = Pred->succ_end();
518 SI != SE; ++SI)
519 if (!*SI)
520 ++SV;
521 }
522
523 if (++SV == Pred->succ_size())
Richard Smith2815e1a2012-05-25 02:17:09 +0000524 // All paths from this block lead to the use and don't initialize the
525 // variable.
526 Queue.push_back(Pred);
527 }
528 }
529
530 // Scan the frontier, looking for blocks where the variable was
531 // uninitialized.
532 for (CFG::const_iterator BI = cfg.begin(), BE = cfg.end(); BI != BE; ++BI) {
533 const CFGBlock *Block = *BI;
534 unsigned BlockID = Block->getBlockID();
535 const Stmt *Term = Block->getTerminator();
536 if (SuccsVisited[BlockID] && SuccsVisited[BlockID] < Block->succ_size() &&
537 Term) {
538 // This block inevitably leads to the use. If we have an edge from here
539 // to a post-dominator block, and the variable is uninitialized on that
540 // edge, we have found a bug.
541 for (CFGBlock::const_succ_iterator I = Block->succ_begin(),
542 E = Block->succ_end(); I != E; ++I) {
543 const CFGBlock *Succ = *I;
544 if (Succ && SuccsVisited[Succ->getBlockID()] >= Succ->succ_size() &&
545 vals.getValue(Block, Succ, vd) == Uninitialized) {
546 // Switch cases are a special case: report the label to the caller
547 // as the 'terminator', not the switch statement itself. Suppress
548 // situations where no label matched: we can't be sure that's
549 // possible.
550 if (isa<SwitchStmt>(Term)) {
551 const Stmt *Label = Succ->getLabel();
552 if (!Label || !isa<SwitchCase>(Label))
553 // Might not be possible.
554 continue;
555 UninitUse::Branch Branch;
556 Branch.Terminator = Label;
557 Branch.Output = 0; // Ignored.
558 Use.addUninitBranch(Branch);
559 } else {
560 UninitUse::Branch Branch;
561 Branch.Terminator = Term;
562 Branch.Output = I - Block->succ_begin();
563 Use.addUninitBranch(Branch);
564 }
565 }
566 }
567 }
568 }
569
570 return Use;
571 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000572};
573}
574
Richard Smith81891882012-05-24 23:45:35 +0000575void TransferFunctions::reportUse(const Expr *ex, const VarDecl *vd) {
576 if (!handler)
577 return;
578 Value v = vals[vd];
579 if (isUninitialized(v))
Richard Smith2815e1a2012-05-25 02:17:09 +0000580 handler->handleUseOfUninitVariable(vd, getUninitUse(ex, vd, v));
Ted Kremenek610068c2011-01-15 02:58:47 +0000581}
582
Richard Smith9532e0d2012-07-17 00:06:14 +0000583void TransferFunctions::VisitObjCForCollectionStmt(ObjCForCollectionStmt *FS) {
Ted Kremenek1ea800c2011-01-27 02:01:31 +0000584 // This represents an initialization of the 'element' value.
Richard Smith9532e0d2012-07-17 00:06:14 +0000585 if (DeclStmt *DS = dyn_cast<DeclStmt>(FS->getElement())) {
586 const VarDecl *VD = cast<VarDecl>(DS->getSingleDecl());
587 if (isTrackedVar(VD))
588 vals[VD] = Initialized;
Ted Kremenek1ea800c2011-01-27 02:01:31 +0000589 }
Ted Kremenek1ea800c2011-01-27 02:01:31 +0000590}
591
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000592void TransferFunctions::VisitBlockExpr(BlockExpr *be) {
Ted Kremenekbc8b44c2011-03-31 22:32:41 +0000593 const BlockDecl *bd = be->getBlockDecl();
594 for (BlockDecl::capture_const_iterator i = bd->capture_begin(),
595 e = bd->capture_end() ; i != e; ++i) {
596 const VarDecl *vd = i->getVariable();
Ted Kremenekbc8b44c2011-03-31 22:32:41 +0000597 if (!isTrackedVar(vd))
598 continue;
599 if (i->isByRef()) {
600 vals[vd] = Initialized;
601 continue;
602 }
Richard Smith81891882012-05-24 23:45:35 +0000603 reportUse(be, vd);
Ted Kremeneka8c17a52011-01-25 19:13:48 +0000604 }
605}
606
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000607void TransferFunctions::VisitCallExpr(CallExpr *ce) {
Ted Kremenek44ca53f2012-09-12 05:53:43 +0000608 if (Decl *Callee = ce->getCalleeDecl()) {
609 if (Callee->hasAttr<ReturnsTwiceAttr>()) {
610 // After a call to a function like setjmp or vfork, any variable which is
611 // initialized anywhere within this function may now be initialized. For
612 // now, just assume such a call initializes all variables. FIXME: Only
613 // mark variables as initialized if they have an initializer which is
614 // reachable from here.
615 vals.setAllScratchValues(Initialized);
616 }
617 else if (Callee->hasAttr<AnalyzerNoReturnAttr>()) {
618 // Functions labeled like "analyzer_noreturn" are often used to denote
619 // "panic" functions that in special debug situations can still return,
620 // but for the most part should not be treated as returning. This is a
621 // useful annotation borrowed from the static analyzer that is useful for
622 // suppressing branch-specific false positives when we call one of these
623 // functions but keep pretending the path continues (when in reality the
624 // user doesn't care).
625 vals.setAllScratchValues(Unknown);
626 }
627 }
Richard Smitha9e8b9e2012-07-02 23:23:04 +0000628}
629
Ted Kremenek0c8e5a02011-07-19 14:18:48 +0000630void TransferFunctions::VisitDeclRefExpr(DeclRefExpr *dr) {
Richard Smith9532e0d2012-07-17 00:06:14 +0000631 switch (classification.get(dr)) {
632 case ClassifyRefs::Ignore:
633 break;
634 case ClassifyRefs::Use:
635 reportUse(dr, cast<VarDecl>(dr->getDecl()));
636 break;
637 case ClassifyRefs::Init:
638 vals[cast<VarDecl>(dr->getDecl())] = Initialized;
639 break;
640 case ClassifyRefs::SelfInit:
641 if (handler)
642 handler->handleSelfInit(cast<VarDecl>(dr->getDecl()));
643 break;
644 }
Ted Kremenek0c8e5a02011-07-19 14:18:48 +0000645}
646
Richard Smith9532e0d2012-07-17 00:06:14 +0000647void TransferFunctions::VisitBinaryOperator(BinaryOperator *BO) {
648 if (BO->getOpcode() == BO_Assign) {
649 FindVarResult Var = findVar(BO->getLHS());
650 if (const VarDecl *VD = Var.getDecl())
651 vals[VD] = Initialized;
652 }
653}
654
655void TransferFunctions::VisitDeclStmt(DeclStmt *DS) {
656 for (DeclStmt::decl_iterator DI = DS->decl_begin(), DE = DS->decl_end();
Ted Kremenek610068c2011-01-15 02:58:47 +0000657 DI != DE; ++DI) {
Richard Smith9532e0d2012-07-17 00:06:14 +0000658 VarDecl *VD = dyn_cast<VarDecl>(*DI);
659 if (VD && isTrackedVar(VD)) {
660 if (getSelfInitExpr(VD)) {
661 // If the initializer consists solely of a reference to itself, we
662 // explicitly mark the variable as uninitialized. This allows code
663 // like the following:
664 //
665 // int x = x;
666 //
667 // to deliberately leave a variable uninitialized. Different analysis
668 // clients can detect this pattern and adjust their reporting
669 // appropriately, but we need to continue to analyze subsequent uses
670 // of the variable.
671 vals[VD] = Uninitialized;
672 } else if (VD->getInit()) {
673 // Treat the new variable as initialized.
674 vals[VD] = Initialized;
675 } else {
676 // No initializer: the variable is now uninitialized. This matters
677 // for cases like:
678 // while (...) {
679 // int n;
680 // use(n);
681 // n = 0;
682 // }
683 // FIXME: Mark the variable as uninitialized whenever its scope is
684 // left, since its scope could be re-entered by a jump over the
685 // declaration.
686 vals[VD] = Uninitialized;
Ted Kremenekc21fed32011-01-18 21:18:58 +0000687 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000688 }
689 }
690}
691
Ted Kremenek610068c2011-01-15 02:58:47 +0000692//------------------------------------------------------------------------====//
693// High-level "driver" logic for uninitialized values analysis.
694//====------------------------------------------------------------------------//
695
Ted Kremenek13bd4232011-01-20 17:37:17 +0000696static bool runOnBlock(const CFGBlock *block, const CFG &cfg,
Ted Kremenek1d26f482011-10-24 01:32:45 +0000697 AnalysisDeclContext &ac, CFGBlockValues &vals,
Richard Smith9532e0d2012-07-17 00:06:14 +0000698 const ClassifyRefs &classification,
Ted Kremenekf8adeef2011-04-04 20:30:58 +0000699 llvm::BitVector &wasAnalyzed,
Ted Kremenek6f275422011-09-02 19:39:26 +0000700 UninitVariablesHandler *handler = 0) {
Ted Kremenekf8adeef2011-04-04 20:30:58 +0000701 wasAnalyzed[block->getBlockID()] = true;
Ted Kremenek610068c2011-01-15 02:58:47 +0000702 vals.resetScratch();
Ted Kremenekeee18c32012-07-19 04:59:05 +0000703 // Merge in values of predecessor blocks.
Ted Kremenek610068c2011-01-15 02:58:47 +0000704 bool isFirst = true;
705 for (CFGBlock::const_pred_iterator I = block->pred_begin(),
706 E = block->pred_end(); I != E; ++I) {
Ted Kremenek6f275422011-09-02 19:39:26 +0000707 const CFGBlock *pred = *I;
708 if (wasAnalyzed[pred->getBlockID()]) {
Ted Kremenekeee18c32012-07-19 04:59:05 +0000709 vals.mergeIntoScratch(vals.getValueVector(pred), isFirst);
Ted Kremenek6f275422011-09-02 19:39:26 +0000710 isFirst = false;
711 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000712 }
713 // Apply the transfer function.
Richard Smith9532e0d2012-07-17 00:06:14 +0000714 TransferFunctions tf(vals, cfg, block, ac, classification, handler);
Ted Kremenek610068c2011-01-15 02:58:47 +0000715 for (CFGBlock::const_iterator I = block->begin(), E = block->end();
716 I != E; ++I) {
717 if (const CFGStmt *cs = dyn_cast<CFGStmt>(&*I)) {
Ted Kremenekf1d10d92011-08-23 23:05:04 +0000718 tf.Visit(const_cast<Stmt*>(cs->getStmt()));
Ted Kremenek610068c2011-01-15 02:58:47 +0000719 }
720 }
Ted Kremenek136f8f22011-03-15 04:57:27 +0000721 return vals.updateValueVectorWithScratch(block);
Ted Kremenek610068c2011-01-15 02:58:47 +0000722}
723
Chandler Carruth5d989942011-07-06 16:21:37 +0000724void clang::runUninitializedVariablesAnalysis(
725 const DeclContext &dc,
726 const CFG &cfg,
Ted Kremenek1d26f482011-10-24 01:32:45 +0000727 AnalysisDeclContext &ac,
Chandler Carruth5d989942011-07-06 16:21:37 +0000728 UninitVariablesHandler &handler,
729 UninitVariablesAnalysisStats &stats) {
Ted Kremenek610068c2011-01-15 02:58:47 +0000730 CFGBlockValues vals(cfg);
731 vals.computeSetOfDeclarations(dc);
732 if (vals.hasNoDeclarations())
733 return;
Ted Kremenekd40066b2011-04-04 23:29:12 +0000734
Chandler Carruth5d989942011-07-06 16:21:37 +0000735 stats.NumVariablesAnalyzed = vals.getNumEntries();
736
Richard Smith9532e0d2012-07-17 00:06:14 +0000737 // Precompute which expressions are uses and which are initializations.
738 ClassifyRefs classification(ac);
739 cfg.VisitBlockStmts(classification);
740
Ted Kremenekd40066b2011-04-04 23:29:12 +0000741 // Mark all variables uninitialized at the entry.
742 const CFGBlock &entry = cfg.getEntry();
Ted Kremenekeee18c32012-07-19 04:59:05 +0000743 ValueVector &vec = vals.getValueVector(&entry);
744 const unsigned n = vals.getNumEntries();
745 for (unsigned j = 0; j < n ; ++j) {
746 vec[j] = Uninitialized;
Ted Kremenekd40066b2011-04-04 23:29:12 +0000747 }
748
749 // Proceed with the workist.
Ted Kremenek610068c2011-01-15 02:58:47 +0000750 DataflowWorklist worklist(cfg);
Ted Kremenek496398d2011-03-15 04:57:32 +0000751 llvm::BitVector previouslyVisited(cfg.getNumBlockIDs());
Ted Kremenek610068c2011-01-15 02:58:47 +0000752 worklist.enqueueSuccessors(&cfg.getEntry());
Ted Kremenekf8adeef2011-04-04 20:30:58 +0000753 llvm::BitVector wasAnalyzed(cfg.getNumBlockIDs(), false);
Ted Kremenek6f275422011-09-02 19:39:26 +0000754 wasAnalyzed[cfg.getEntry().getBlockID()] = true;
Ted Kremenek610068c2011-01-15 02:58:47 +0000755
756 while (const CFGBlock *block = worklist.dequeue()) {
Ted Kremenek610068c2011-01-15 02:58:47 +0000757 // Did the block change?
Richard Smith9532e0d2012-07-17 00:06:14 +0000758 bool changed = runOnBlock(block, cfg, ac, vals,
759 classification, wasAnalyzed);
Chandler Carruth5d989942011-07-06 16:21:37 +0000760 ++stats.NumBlockVisits;
Ted Kremenek610068c2011-01-15 02:58:47 +0000761 if (changed || !previouslyVisited[block->getBlockID()])
762 worklist.enqueueSuccessors(block);
763 previouslyVisited[block->getBlockID()] = true;
764 }
765
766 // Run through the blocks one more time, and report uninitialized variabes.
767 for (CFG::const_iterator BI = cfg.begin(), BE = cfg.end(); BI != BE; ++BI) {
Ted Kremenek6f275422011-09-02 19:39:26 +0000768 const CFGBlock *block = *BI;
769 if (wasAnalyzed[block->getBlockID()]) {
Richard Smith9532e0d2012-07-17 00:06:14 +0000770 runOnBlock(block, cfg, ac, vals, classification, wasAnalyzed, &handler);
Chandler Carruth5d989942011-07-06 16:21:37 +0000771 ++stats.NumBlockVisits;
772 }
Ted Kremenek610068c2011-01-15 02:58:47 +0000773 }
774}
775
776UninitVariablesHandler::~UninitVariablesHandler() {}