blob: 8b3e0f76423d341a2240bf4ffcb20eac0c473d74 [file] [log] [blame]
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +00001//== ObjCSelfInitChecker.cpp - Checker for 'self' initialization -*- C++ -*--=//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This defines ObjCSelfInitChecker, a builtin check that checks for uses of
11// 'self' before proper initialization.
12//
13//===----------------------------------------------------------------------===//
14
15// This checks initialization methods to verify that they assign 'self' to the
16// result of an initialization call (e.g. [super init], or [self initWith..])
17// before using 'self' or any instance variable.
18//
Chris Lattnerfc8f0e12011-04-15 05:22:18 +000019// To perform the required checking, values are tagged with flags that indicate
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000020// 1) if the object is the one pointed to by 'self', and 2) if the object
21// is the result of an initializer (e.g. [super init]).
22//
23// Uses of an object that is true for 1) but not 2) trigger a diagnostic.
24// The uses that are currently checked are:
25// - Using instance variables.
26// - Returning the object.
27//
28// Note that we don't check for an invalid 'self' that is the receiver of an
29// obj-c message expression to cut down false positives where logging functions
30// get information from self (like its class) or doing "invalidation" on self
31// when the initialization fails.
32//
33// Because the object that 'self' points to gets invalidated when a call
34// receives a reference to 'self', the checker keeps track and passes the flags
35// for 1) and 2) to the new object that 'self' points to after the call.
36//
37// FIXME (rdar://7937506): In the case of:
38// [super init];
39// return self;
40// Have an extra PathDiagnosticPiece in the path that says "called [super init],
41// but didn't assign the result to self."
42
43//===----------------------------------------------------------------------===//
44
45// FIXME: Somehow stick the link to Apple's documentation about initializing
46// objects in the diagnostics.
47// http://developer.apple.com/library/mac/#documentation/Cocoa/Conceptual/ObjectiveC/Articles/ocAllocInit.html
48
Argyrios Kyrtzidis027a6ab2011-02-15 07:42:33 +000049#include "ClangSACheckers.h"
Argyrios Kyrtzidisec8605f2011-03-01 01:16:21 +000050#include "clang/StaticAnalyzer/Core/Checker.h"
Argyrios Kyrtzidis695fb502011-02-17 21:39:17 +000051#include "clang/StaticAnalyzer/Core/CheckerManager.h"
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +000052#include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
Ted Kremenek18c66fd2011-08-15 22:09:50 +000053#include "clang/StaticAnalyzer/Core/PathSensitive/ProgramStateTrait.h"
Jordy Rosed1e5a892011-09-02 08:02:59 +000054#include "clang/StaticAnalyzer/Core/PathSensitive/ObjCMessage.h"
Ted Kremenek9b663712011-02-10 01:03:03 +000055#include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000056#include "clang/AST/ParentMap.h"
57
58using namespace clang;
59using namespace ento;
60
61static bool shouldRunOnFunctionOrMethod(const NamedDecl *ND);
62static bool isInitializationMethod(const ObjCMethodDecl *MD);
Argyrios Kyrtzidis432424d2011-01-25 00:03:53 +000063static bool isInitMessage(const ObjCMessage &msg);
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000064static bool isSelfVar(SVal location, CheckerContext &C);
65
66namespace {
Argyrios Kyrtzidisec8605f2011-03-01 01:16:21 +000067class ObjCSelfInitChecker : public Checker<
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +000068 check::PostObjCMessage,
69 check::PostStmt<ObjCIvarRefExpr>,
70 check::PreStmt<ReturnStmt>,
71 check::PreStmt<CallExpr>,
72 check::PostStmt<CallExpr>,
73 check::Location > {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000074public:
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +000075 void checkPostObjCMessage(ObjCMessage msg, CheckerContext &C) const;
76 void checkPostStmt(const ObjCIvarRefExpr *E, CheckerContext &C) const;
77 void checkPreStmt(const ReturnStmt *S, CheckerContext &C) const;
78 void checkPreStmt(const CallExpr *CE, CheckerContext &C) const;
79 void checkPostStmt(const CallExpr *CE, CheckerContext &C) const;
80 void checkLocation(SVal location, bool isLoad, CheckerContext &C) const;
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000081};
82} // end anonymous namespace
83
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000084namespace {
85
86class InitSelfBug : public BugType {
87 const std::string desc;
88public:
Argyrios Kyrtzidis4717f162011-01-26 01:26:41 +000089 InitSelfBug() : BugType("missing \"self = [(super or self) init...]\"",
90 "missing \"self = [(super or self) init...]\"") {}
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +000091};
92
93} // end anonymous namespace
94
namespace {

/// \brief Bit flags attached to a symbol to describe how it relates to 'self'.
/// The flags are combined with bitwise OR.
enum SelfFlagEnum {
  /// \brief No flag set.
  SelfFlag_None    = 0,
  /// \brief Value came from 'self'.
  SelfFlag_Self    = 1 << 0,
  /// \brief Value came from the result of an initializer (e.g. [super init]).
  SelfFlag_InitRes = 1 << 1
};

} // end anonymous namespace
105
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000106typedef llvm::ImmutableMap<SymbolRef, unsigned> SelfFlag;
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000107namespace { struct CalledInit {}; }
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000108namespace { struct PreCallSelfFlags {}; }
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000109
110namespace clang {
111namespace ento {
112 template<>
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000113 struct ProgramStateTrait<SelfFlag> : public ProgramStatePartialTrait<SelfFlag> {
Ted Kremenek9c378f72011-08-12 23:37:29 +0000114 static void *GDMIndex() { static int index = 0; return &index; }
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000115 };
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000116 template <>
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000117 struct ProgramStateTrait<CalledInit> : public ProgramStatePartialTrait<bool> {
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000118 static void *GDMIndex() { static int index = 0; return &index; }
119 };
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000120
121 /// \brief A call receiving a reference to 'self' invalidates the object that
122 /// 'self' contains. This keeps the "self flags" assigned to the 'self'
123 /// object before the call so we can assign them to the new object that 'self'
124 /// points to after the call.
125 template <>
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000126 struct ProgramStateTrait<PreCallSelfFlags> : public ProgramStatePartialTrait<unsigned> {
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000127 static void *GDMIndex() { static int index = 0; return &index; }
128 };
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000129}
130}
131
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000132static SelfFlagEnum getSelfFlags(SVal val, const ProgramState *state) {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000133 if (SymbolRef sym = val.getAsSymbol())
134 if (const unsigned *attachedFlags = state->get<SelfFlag>(sym))
135 return (SelfFlagEnum)*attachedFlags;
136 return SelfFlag_None;
137}
138
139static SelfFlagEnum getSelfFlags(SVal val, CheckerContext &C) {
140 return getSelfFlags(val, C.getState());
141}
142
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000143static void addSelfFlag(const ProgramState *state, SVal val,
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000144 SelfFlagEnum flag, CheckerContext &C) {
Argyrios Kyrtzidis0ca10402011-02-05 05:54:53 +0000145 // We tag the symbol that the SVal wraps.
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000146 if (SymbolRef sym = val.getAsSymbol())
147 C.addTransition(state->set<SelfFlag>(sym, getSelfFlags(val, C) | flag));
148}
149
150static bool hasSelfFlag(SVal val, SelfFlagEnum flag, CheckerContext &C) {
151 return getSelfFlags(val, C) & flag;
152}
153
154/// \brief Returns true of the value of the expression is the object that 'self'
155/// points to and is an object that did not come from the result of calling
156/// an initializer.
157static bool isInvalidSelf(const Expr *E, CheckerContext &C) {
158 SVal exprVal = C.getState()->getSVal(E);
159 if (!hasSelfFlag(exprVal, SelfFlag_Self, C))
160 return false; // value did not come from 'self'.
161 if (hasSelfFlag(exprVal, SelfFlag_InitRes, C))
162 return false; // 'self' is properly initialized.
163
164 return true;
165}
166
167static void checkForInvalidSelf(const Expr *E, CheckerContext &C,
168 const char *errorStr) {
169 if (!E)
170 return;
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000171
172 if (!C.getState()->get<CalledInit>())
173 return;
174
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000175 if (!isInvalidSelf(E, C))
176 return;
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000177
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000178 // Generate an error node.
179 ExplodedNode *N = C.generateSink();
180 if (!N)
181 return;
182
Anna Zakse172e8b2011-08-17 23:00:25 +0000183 BugReport *report =
184 new BugReport(*new InitSelfBug(), errorStr, N);
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000185 C.EmitReport(report);
186}
187
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000188void ObjCSelfInitChecker::checkPostObjCMessage(ObjCMessage msg,
189 CheckerContext &C) const {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000190 // When encountering a message that does initialization (init rule),
191 // tag the return value so that we know later on that if self has this value
192 // then it is properly initialized.
193
194 // FIXME: A callback should disable checkers at the start of functions.
195 if (!shouldRunOnFunctionOrMethod(dyn_cast<NamedDecl>(
196 C.getCurrentAnalysisContext()->getDecl())))
197 return;
198
Argyrios Kyrtzidis432424d2011-01-25 00:03:53 +0000199 if (isInitMessage(msg)) {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000200 // Tag the return value as the result of an initializer.
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000201 const ProgramState *state = C.getState();
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000202
203 // FIXME this really should be context sensitive, where we record
204 // the current stack frame (for IPA). Also, we need to clean this
205 // value out when we return from this method.
206 state = state->set<CalledInit>(true);
207
Argyrios Kyrtzidis432424d2011-01-25 00:03:53 +0000208 SVal V = state->getSVal(msg.getOriginExpr());
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000209 addSelfFlag(state, V, SelfFlag_InitRes, C);
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000210 return;
211 }
212
213 // We don't check for an invalid 'self' in an obj-c message expression to cut
214 // down false positives where logging functions get information from self
215 // (like its class) or doing "invalidation" on self when the initialization
216 // fails.
217}
218
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000219void ObjCSelfInitChecker::checkPostStmt(const ObjCIvarRefExpr *E,
220 CheckerContext &C) const {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000221 // FIXME: A callback should disable checkers at the start of functions.
222 if (!shouldRunOnFunctionOrMethod(dyn_cast<NamedDecl>(
223 C.getCurrentAnalysisContext()->getDecl())))
224 return;
225
226 checkForInvalidSelf(E->getBase(), C,
Argyrios Kyrtzidisbe29d8d2011-02-01 19:32:55 +0000227 "Instance variable used while 'self' is not set to the result of "
Argyrios Kyrtzidis4717f162011-01-26 01:26:41 +0000228 "'[(super or self) init...]'");
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000229}
230
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000231void ObjCSelfInitChecker::checkPreStmt(const ReturnStmt *S,
232 CheckerContext &C) const {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000233 // FIXME: A callback should disable checkers at the start of functions.
234 if (!shouldRunOnFunctionOrMethod(dyn_cast<NamedDecl>(
235 C.getCurrentAnalysisContext()->getDecl())))
236 return;
237
238 checkForInvalidSelf(S->getRetValue(), C,
Argyrios Kyrtzidis63eeade2011-02-01 20:33:05 +0000239 "Returning 'self' while it is not set to the result of "
Argyrios Kyrtzidis4717f162011-01-26 01:26:41 +0000240 "'[(super or self) init...]'");
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000241}
242
// When a call receives a reference to 'self', the CallExpr callbacks
// (checkPreStmt/checkPostStmt) pass the SelfFlags from the object that 'self'
// points to before the call to the new object after the call. This is to
// avoid invalidation of 'self' by logging functions.
// Another common pattern in classes with multiple initializers is to put the
// subclass's common initialization bits into a static function that receives
// the value of 'self', e.g:
// @code
//   if (!(self = [super init]))
//     return nil;
//   if (!(self = _commonInit(self)))
//     return nil;
// @endcode
// Until we can use inter-procedural analysis, in such a call, transfer the
// SelfFlags to the result of the call.
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000258
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000259void ObjCSelfInitChecker::checkPreStmt(const CallExpr *CE,
260 CheckerContext &C) const {
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000261 const ProgramState *state = C.getState();
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000262 for (CallExpr::const_arg_iterator
263 I = CE->arg_begin(), E = CE->arg_end(); I != E; ++I) {
264 SVal argV = state->getSVal(*I);
265 if (isSelfVar(argV, C)) {
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000266 unsigned selfFlags = getSelfFlags(state->getSVal(cast<Loc>(argV)), C);
267 C.addTransition(state->set<PreCallSelfFlags>(selfFlags));
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000268 return;
Argyrios Kyrtzidis0ca10402011-02-05 05:54:53 +0000269 } else if (hasSelfFlag(argV, SelfFlag_Self, C)) {
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000270 unsigned selfFlags = getSelfFlags(argV, C);
271 C.addTransition(state->set<PreCallSelfFlags>(selfFlags));
Argyrios Kyrtzidis0ca10402011-02-05 05:54:53 +0000272 return;
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000273 }
274 }
275}
276
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000277void ObjCSelfInitChecker::checkPostStmt(const CallExpr *CE,
278 CheckerContext &C) const {
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000279 const ProgramState *state = C.getState();
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000280 for (CallExpr::const_arg_iterator
281 I = CE->arg_begin(), E = CE->arg_end(); I != E; ++I) {
282 SVal argV = state->getSVal(*I);
283 if (isSelfVar(argV, C)) {
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000284 SelfFlagEnum prevFlags = (SelfFlagEnum)state->get<PreCallSelfFlags>();
285 state = state->remove<PreCallSelfFlags>();
286 addSelfFlag(state, state->getSVal(cast<Loc>(argV)), prevFlags, C);
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000287 return;
Argyrios Kyrtzidis0ca10402011-02-05 05:54:53 +0000288 } else if (hasSelfFlag(argV, SelfFlag_Self, C)) {
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000289 SelfFlagEnum prevFlags = (SelfFlagEnum)state->get<PreCallSelfFlags>();
290 state = state->remove<PreCallSelfFlags>();
291 addSelfFlag(state, state->getSVal(CE), prevFlags, C);
Argyrios Kyrtzidis0ca10402011-02-05 05:54:53 +0000292 return;
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000293 }
294 }
295}
296
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000297void ObjCSelfInitChecker::checkLocation(SVal location, bool isLoad,
298 CheckerContext &C) const {
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000299 // Tag the result of a load from 'self' so that we can easily know that the
300 // value is the object that 'self' points to.
Ted Kremenek18c66fd2011-08-15 22:09:50 +0000301 const ProgramState *state = C.getState();
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000302 if (isSelfVar(location, C))
Ted Kremenekb715a7c2011-02-12 03:03:54 +0000303 addSelfFlag(state, state->getSVal(cast<Loc>(location)), SelfFlag_Self, C);
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000304}
305
306// FIXME: A callback should disable checkers at the start of functions.
307static bool shouldRunOnFunctionOrMethod(const NamedDecl *ND) {
308 if (!ND)
309 return false;
310
311 const ObjCMethodDecl *MD = dyn_cast<ObjCMethodDecl>(ND);
312 if (!MD)
313 return false;
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000314 if (!isInitializationMethod(MD))
315 return false;
316
Argyrios Kyrtzidiseaf969b2011-01-25 23:54:44 +0000317 // self = [super init] applies only to NSObject subclasses.
318 // For instance, NSProxy doesn't implement -init.
Ted Kremenek9c378f72011-08-12 23:37:29 +0000319 ASTContext &Ctx = MD->getASTContext();
Argyrios Kyrtzidiseaf969b2011-01-25 23:54:44 +0000320 IdentifierInfo* NSObjectII = &Ctx.Idents.get("NSObject");
Ted Kremenek9c378f72011-08-12 23:37:29 +0000321 ObjCInterfaceDecl *ID = MD->getClassInterface()->getSuperClass();
Argyrios Kyrtzidiseaf969b2011-01-25 23:54:44 +0000322 for ( ; ID ; ID = ID->getSuperClass()) {
323 IdentifierInfo *II = ID->getIdentifier();
324
325 if (II == NSObjectII)
326 break;
327 }
328 if (!ID)
329 return false;
330
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000331 return true;
332}
333
334/// \brief Returns true if the location is 'self'.
335static bool isSelfVar(SVal location, CheckerContext &C) {
336 AnalysisContext *analCtx = C.getCurrentAnalysisContext();
337 if (!analCtx->getSelfDecl())
338 return false;
339 if (!isa<loc::MemRegionVal>(location))
340 return false;
341
342 loc::MemRegionVal MRV = cast<loc::MemRegionVal>(location);
343 if (const DeclRegion *DR = dyn_cast<DeclRegion>(MRV.getRegion()))
344 return (DR->getDecl() == analCtx->getSelfDecl());
345
346 return false;
347}
348
349static bool isInitializationMethod(const ObjCMethodDecl *MD) {
John McCall85f3d762011-03-02 01:50:55 +0000350 return MD->getMethodFamily() == OMF_init;
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000351}
352
Argyrios Kyrtzidis432424d2011-01-25 00:03:53 +0000353static bool isInitMessage(const ObjCMessage &msg) {
John McCall85f3d762011-03-02 01:50:55 +0000354 return msg.getMethodFamily() == OMF_init;
Argyrios Kyrtzidisd7a31ba2011-01-11 19:45:25 +0000355}
Argyrios Kyrtzidis769ce3e2011-02-22 17:30:38 +0000356
357//===----------------------------------------------------------------------===//
358// Registration.
359//===----------------------------------------------------------------------===//
360
361void ento::registerObjCSelfInitChecker(CheckerManager &mgr) {
362 mgr.registerChecker<ObjCSelfInitChecker>();
363}