| 1 | //== ObjCSelfInitChecker.cpp - Checker for 'self' initialization -*- C++ -*--=// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This defines ObjCSelfInitChecker, a builtin check that checks for uses of |
| 10 | // 'self' before proper initialization. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | // This checks initialization methods to verify that they assign 'self' to the |
| 15 | // result of an initialization call (e.g. [super init], or [self initWith..]) |
| 16 | // before using 'self' or any instance variable. |
| 17 | // |
| 18 | // To perform the required checking, values are tagged with flags that indicate |
| 19 | // 1) if the object is the one pointed to by 'self', and 2) if the object |
| 20 | // is the result of an initializer (e.g. [super init]). |
| 21 | // |
| 22 | // Uses of an object that is true for 1) but not 2) trigger a diagnostic. |
| 23 | // The uses that are currently checked are: |
| 24 | // - Using instance variables. |
| 25 | // - Returning the object. |
| 26 | // |
| 27 | // Note that we don't check for an invalid 'self' that is the receiver of an |
| 28 | // obj-c message expression to cut down false positives where logging functions |
| 29 | // get information from self (like its class) or doing "invalidation" on self |
| 30 | // when the initialization fails. |
| 31 | // |
| 32 | // Because the object that 'self' points to gets invalidated when a call |
| 33 | // receives a reference to 'self', the checker keeps track and passes the flags |
| 34 | // for 1) and 2) to the new object that 'self' points to after the call. |
| 35 | // |
| 36 | //===----------------------------------------------------------------------===// |
| 37 | |
| 38 | #include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h" |
| 39 | #include "clang/AST/ParentMap.h" |
| 40 | #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h" |
| 41 | #include "clang/StaticAnalyzer/Core/Checker.h" |
| 42 | #include "clang/StaticAnalyzer/Core/CheckerManager.h" |
| 43 | #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h" |
| 44 | #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h" |
| 45 | #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramStateTrait.h" |
| 46 | #include "llvm/Support/raw_ostream.h" |
| 47 | |
| 48 | using namespace clang; |
| 49 | using namespace ento; |
| 50 | |
| 51 | static bool shouldRunOnFunctionOrMethod(const NamedDecl *ND); |
| 52 | static bool isInitializationMethod(const ObjCMethodDecl *MD); |
| 53 | static bool isInitMessage(const ObjCMethodCall &Msg); |
| 54 | static bool isSelfVar(SVal location, CheckerContext &C); |
| 55 | |
| 56 | namespace { |
| 57 | class ObjCSelfInitChecker : public Checker< check::PostObjCMessage, |
| 58 | check::PostStmt<ObjCIvarRefExpr>, |
| 59 | check::PreStmt<ReturnStmt>, |
| 60 | check::PreCall, |
| 61 | check::PostCall, |
| 62 | check::Location, |
| 63 | check::Bind > { |
| 64 | const BugType BT{this, "Missing \"self = [(super or self) init...]\"" , |
| 65 | categories::CoreFoundationObjectiveC}; |
| 66 | |
| 67 | void checkForInvalidSelf(const Expr *E, CheckerContext &C, |
| 68 | const char *errorStr) const; |
| 69 | |
| 70 | public: |
| 71 | void checkPostObjCMessage(const ObjCMethodCall &Msg, CheckerContext &C) const; |
| 72 | void checkPostStmt(const ObjCIvarRefExpr *E, CheckerContext &C) const; |
| 73 | void checkPreStmt(const ReturnStmt *S, CheckerContext &C) const; |
| 74 | void checkLocation(SVal location, bool isLoad, const Stmt *S, |
| 75 | CheckerContext &C) const; |
| 76 | void checkBind(SVal loc, SVal val, const Stmt *S, CheckerContext &C) const; |
| 77 | |
| 78 | void checkPreCall(const CallEvent &CE, CheckerContext &C) const; |
| 79 | void checkPostCall(const CallEvent &CE, CheckerContext &C) const; |
| 80 | |
| 81 | void printState(raw_ostream &Out, ProgramStateRef State, |
| 82 | const char *NL, const char *Sep) const override; |
| 83 | }; |
| 84 | } // end anonymous namespace |
| 85 | |
namespace {
/// Bit flags recorded per symbol; the two non-zero flags may be OR-ed together.
enum SelfFlagEnum {
  /// No bit is set.
  SelfFlag_None = 0,
  /// The value was obtained from 'self'.
  SelfFlag_Self = 1 << 0,
  /// The value is what an initializer (e.g. [super init]) returned.
  SelfFlag_InitRes = 1 << 1
};
} // end anonymous namespace
| 96 | |
| 97 | REGISTER_MAP_WITH_PROGRAMSTATE(SelfFlag, SymbolRef, SelfFlagEnum) |
| 98 | REGISTER_TRAIT_WITH_PROGRAMSTATE(CalledInit, bool) |
| 99 | |
| 100 | /// A call receiving a reference to 'self' invalidates the object that |
| 101 | /// 'self' contains. This keeps the "self flags" assigned to the 'self' |
| 102 | /// object before the call so we can assign them to the new object that 'self' |
| 103 | /// points to after the call. |
| 104 | REGISTER_TRAIT_WITH_PROGRAMSTATE(PreCallSelfFlags, SelfFlagEnum) |
| 105 | |
| 106 | static SelfFlagEnum getSelfFlags(SVal val, ProgramStateRef state) { |
| 107 | if (SymbolRef sym = val.getAsSymbol()) |
| 108 | if (const SelfFlagEnum *attachedFlags = state->get<SelfFlag>(key: sym)) |
| 109 | return *attachedFlags; |
| 110 | return SelfFlag_None; |
| 111 | } |
| 112 | |
| 113 | static SelfFlagEnum getSelfFlags(SVal val, CheckerContext &C) { |
| 114 | return getSelfFlags(val, state: C.getState()); |
| 115 | } |
| 116 | |
| 117 | static void addSelfFlag(ProgramStateRef state, SVal val, |
| 118 | SelfFlagEnum flag, CheckerContext &C) { |
| 119 | // We tag the symbol that the SVal wraps. |
| 120 | if (SymbolRef sym = val.getAsSymbol()) { |
| 121 | state = state->set<SelfFlag>(K: sym, |
| 122 | E: SelfFlagEnum(getSelfFlags(val, state) | flag)); |
| 123 | C.addTransition(State: state); |
| 124 | } |
| 125 | } |
| 126 | |
| 127 | static bool hasSelfFlag(SVal val, SelfFlagEnum flag, CheckerContext &C) { |
| 128 | return getSelfFlags(val, C) & flag; |
| 129 | } |
| 130 | |
| 131 | /// Returns true of the value of the expression is the object that 'self' |
| 132 | /// points to and is an object that did not come from the result of calling |
| 133 | /// an initializer. |
| 134 | static bool isInvalidSelf(const Expr *E, CheckerContext &C) { |
| 135 | SVal exprVal = C.getSVal(S: E); |
| 136 | if (!hasSelfFlag(val: exprVal, flag: SelfFlag_Self, C)) |
| 137 | return false; // value did not come from 'self'. |
| 138 | if (hasSelfFlag(val: exprVal, flag: SelfFlag_InitRes, C)) |
| 139 | return false; // 'self' is properly initialized. |
| 140 | |
| 141 | return true; |
| 142 | } |
| 143 | |
| 144 | void ObjCSelfInitChecker::checkForInvalidSelf(const Expr *E, CheckerContext &C, |
| 145 | const char *errorStr) const { |
| 146 | if (!E) |
| 147 | return; |
| 148 | |
| 149 | if (!C.getState()->get<CalledInit>()) |
| 150 | return; |
| 151 | |
| 152 | if (!isInvalidSelf(E, C)) |
| 153 | return; |
| 154 | |
| 155 | // Generate an error node. |
| 156 | ExplodedNode *N = C.generateErrorNode(); |
| 157 | if (!N) |
| 158 | return; |
| 159 | |
| 160 | C.emitReport(R: std::make_unique<PathSensitiveBugReport>(args: BT, args&: errorStr, args&: N)); |
| 161 | } |
| 162 | |
| 163 | void ObjCSelfInitChecker::checkPostObjCMessage(const ObjCMethodCall &Msg, |
| 164 | CheckerContext &C) const { |
| 165 | // When encountering a message that does initialization (init rule), |
| 166 | // tag the return value so that we know later on that if self has this value |
| 167 | // then it is properly initialized. |
| 168 | |
| 169 | // FIXME: A callback should disable checkers at the start of functions. |
| 170 | if (!shouldRunOnFunctionOrMethod(ND: dyn_cast<NamedDecl>( |
| 171 | Val: C.getCurrentAnalysisDeclContext()->getDecl()))) |
| 172 | return; |
| 173 | |
| 174 | if (isInitMessage(Msg)) { |
| 175 | // Tag the return value as the result of an initializer. |
| 176 | ProgramStateRef state = C.getState(); |
| 177 | |
| 178 | // FIXME this really should be context sensitive, where we record |
| 179 | // the current stack frame (for IPA). Also, we need to clean this |
| 180 | // value out when we return from this method. |
| 181 | state = state->set<CalledInit>(true); |
| 182 | |
| 183 | SVal V = C.getSVal(S: Msg.getOriginExpr()); |
| 184 | addSelfFlag(state, val: V, flag: SelfFlag_InitRes, C); |
| 185 | return; |
| 186 | } |
| 187 | |
| 188 | // We don't check for an invalid 'self' in an obj-c message expression to cut |
| 189 | // down false positives where logging functions get information from self |
| 190 | // (like its class) or doing "invalidation" on self when the initialization |
| 191 | // fails. |
| 192 | } |
| 193 | |
| 194 | void ObjCSelfInitChecker::checkPostStmt(const ObjCIvarRefExpr *E, |
| 195 | CheckerContext &C) const { |
| 196 | // FIXME: A callback should disable checkers at the start of functions. |
| 197 | if (!shouldRunOnFunctionOrMethod(ND: dyn_cast<NamedDecl>( |
| 198 | Val: C.getCurrentAnalysisDeclContext()->getDecl()))) |
| 199 | return; |
| 200 | |
| 201 | checkForInvalidSelf( |
| 202 | E: E->getBase(), C, |
| 203 | errorStr: "Instance variable used while 'self' is not set to the result of " |
| 204 | "'[(super or self) init...]'" ); |
| 205 | } |
| 206 | |
| 207 | void ObjCSelfInitChecker::checkPreStmt(const ReturnStmt *S, |
| 208 | CheckerContext &C) const { |
| 209 | // FIXME: A callback should disable checkers at the start of functions. |
| 210 | if (!shouldRunOnFunctionOrMethod(ND: dyn_cast<NamedDecl>( |
| 211 | Val: C.getCurrentAnalysisDeclContext()->getDecl()))) |
| 212 | return; |
| 213 | |
| 214 | checkForInvalidSelf(E: S->getRetValue(), C, |
| 215 | errorStr: "Returning 'self' while it is not set to the result of " |
| 216 | "'[(super or self) init...]'" ); |
| 217 | } |
| 218 | |
| 219 | // When a call receives a reference to 'self', [Pre/Post]Call pass |
| 220 | // the SelfFlags from the object 'self' points to before the call to the new |
| 221 | // object after the call. This is to avoid invalidation of 'self' by logging |
| 222 | // functions. |
| 223 | // Another common pattern in classes with multiple initializers is to put the |
| 224 | // subclass's common initialization bits into a static function that receives |
| 225 | // the value of 'self', e.g: |
| 226 | // @code |
| 227 | // if (!(self = [super init])) |
| 228 | // return nil; |
| 229 | // if (!(self = _commonInit(self))) |
| 230 | // return nil; |
| 231 | // @endcode |
| 232 | // Until we can use inter-procedural analysis, in such a call, transfer the |
| 233 | // SelfFlags to the result of the call. |
| 234 | |
| 235 | void ObjCSelfInitChecker::checkPreCall(const CallEvent &CE, |
| 236 | CheckerContext &C) const { |
| 237 | // FIXME: A callback should disable checkers at the start of functions. |
| 238 | if (!shouldRunOnFunctionOrMethod(ND: dyn_cast<NamedDecl>( |
| 239 | Val: C.getCurrentAnalysisDeclContext()->getDecl()))) |
| 240 | return; |
| 241 | |
| 242 | ProgramStateRef state = C.getState(); |
| 243 | unsigned NumArgs = CE.getNumArgs(); |
| 244 | // If we passed 'self' as and argument to the call, record it in the state |
| 245 | // to be propagated after the call. |
| 246 | // Note, we could have just given up, but try to be more optimistic here and |
| 247 | // assume that the functions are going to continue initialization or will not |
| 248 | // modify self. |
| 249 | for (unsigned i = 0; i < NumArgs; ++i) { |
| 250 | SVal argV = CE.getArgSVal(Index: i); |
| 251 | if (isSelfVar(location: argV, C)) { |
| 252 | SelfFlagEnum selfFlags = |
| 253 | getSelfFlags(val: state->getSVal(LV: argV.castAs<Loc>()), C); |
| 254 | C.addTransition(State: state->set<PreCallSelfFlags>(selfFlags)); |
| 255 | return; |
| 256 | } else if (hasSelfFlag(val: argV, flag: SelfFlag_Self, C)) { |
| 257 | SelfFlagEnum selfFlags = getSelfFlags(val: argV, C); |
| 258 | C.addTransition(State: state->set<PreCallSelfFlags>(selfFlags)); |
| 259 | return; |
| 260 | } |
| 261 | } |
| 262 | } |
| 263 | |
| 264 | void ObjCSelfInitChecker::checkPostCall(const CallEvent &CE, |
| 265 | CheckerContext &C) const { |
| 266 | // FIXME: A callback should disable checkers at the start of functions. |
| 267 | if (!shouldRunOnFunctionOrMethod(ND: dyn_cast<NamedDecl>( |
| 268 | Val: C.getCurrentAnalysisDeclContext()->getDecl()))) |
| 269 | return; |
| 270 | |
| 271 | ProgramStateRef state = C.getState(); |
| 272 | SelfFlagEnum prevFlags = state->get<PreCallSelfFlags>(); |
| 273 | if (!prevFlags) |
| 274 | return; |
| 275 | state = state->remove<PreCallSelfFlags>(); |
| 276 | |
| 277 | unsigned NumArgs = CE.getNumArgs(); |
| 278 | for (unsigned i = 0; i < NumArgs; ++i) { |
| 279 | SVal argV = CE.getArgSVal(Index: i); |
| 280 | if (isSelfVar(location: argV, C)) { |
| 281 | // If the address of 'self' is being passed to the call, assume that the |
| 282 | // 'self' after the call will have the same flags. |
| 283 | // EX: log(&self) |
| 284 | addSelfFlag(state, val: state->getSVal(LV: argV.castAs<Loc>()), flag: prevFlags, C); |
| 285 | return; |
| 286 | } else if (hasSelfFlag(val: argV, flag: SelfFlag_Self, C)) { |
| 287 | // If 'self' is passed to the call by value, assume that the function |
| 288 | // returns 'self'. So assign the flags, which were set on 'self' to the |
| 289 | // return value. |
| 290 | // EX: self = performMoreInitialization(self) |
| 291 | addSelfFlag(state, val: CE.getReturnValue(), flag: prevFlags, C); |
| 292 | return; |
| 293 | } |
| 294 | } |
| 295 | |
| 296 | C.addTransition(State: state); |
| 297 | } |
| 298 | |
| 299 | void ObjCSelfInitChecker::checkLocation(SVal location, bool isLoad, |
| 300 | const Stmt *S, |
| 301 | CheckerContext &C) const { |
| 302 | if (!shouldRunOnFunctionOrMethod(ND: dyn_cast<NamedDecl>( |
| 303 | Val: C.getCurrentAnalysisDeclContext()->getDecl()))) |
| 304 | return; |
| 305 | |
| 306 | // Tag the result of a load from 'self' so that we can easily know that the |
| 307 | // value is the object that 'self' points to. |
| 308 | ProgramStateRef state = C.getState(); |
| 309 | if (isSelfVar(location, C)) |
| 310 | addSelfFlag(state, val: state->getSVal(LV: location.castAs<Loc>()), flag: SelfFlag_Self, |
| 311 | C); |
| 312 | } |
| 313 | |
| 314 | |
| 315 | void ObjCSelfInitChecker::checkBind(SVal loc, SVal val, const Stmt *S, |
| 316 | CheckerContext &C) const { |
| 317 | // Allow assignment of anything to self. Self is a local variable in the |
| 318 | // initializer, so it is legal to assign anything to it, like results of |
| 319 | // static functions/method calls. After self is assigned something we cannot |
| 320 | // reason about, stop enforcing the rules. |
| 321 | // (Only continue checking if the assigned value should be treated as self.) |
| 322 | if ((isSelfVar(location: loc, C)) && |
| 323 | !hasSelfFlag(val, flag: SelfFlag_InitRes, C) && |
| 324 | !hasSelfFlag(val, flag: SelfFlag_Self, C) && |
| 325 | !isSelfVar(location: val, C)) { |
| 326 | |
| 327 | // Stop tracking the checker-specific state in the state. |
| 328 | ProgramStateRef State = C.getState(); |
| 329 | State = State->remove<CalledInit>(); |
| 330 | if (SymbolRef sym = loc.getAsSymbol()) |
| 331 | State = State->remove<SelfFlag>(K: sym); |
| 332 | C.addTransition(State); |
| 333 | } |
| 334 | } |
| 335 | |
| 336 | void ObjCSelfInitChecker::printState(raw_ostream &Out, ProgramStateRef State, |
| 337 | const char *NL, const char *Sep) const { |
| 338 | SelfFlagTy FlagMap = State->get<SelfFlag>(); |
| 339 | bool DidCallInit = State->get<CalledInit>(); |
| 340 | SelfFlagEnum PreCallFlags = State->get<PreCallSelfFlags>(); |
| 341 | |
| 342 | if (FlagMap.isEmpty() && !DidCallInit && !PreCallFlags) |
| 343 | return; |
| 344 | |
| 345 | Out << Sep << NL << "ObjCSelfInitChecker:" << NL; |
| 346 | |
| 347 | if (DidCallInit) |
| 348 | Out << " An init method has been called." << NL; |
| 349 | |
| 350 | if (PreCallFlags != SelfFlag_None) { |
| 351 | if (PreCallFlags & SelfFlag_Self) { |
| 352 | Out << " An argument of the current call came from the 'self' variable." |
| 353 | << NL; |
| 354 | } |
| 355 | if (PreCallFlags & SelfFlag_InitRes) { |
| 356 | Out << " An argument of the current call came from an init method." |
| 357 | << NL; |
| 358 | } |
| 359 | } |
| 360 | |
| 361 | Out << NL; |
| 362 | for (auto [Sym, Flag] : FlagMap) { |
| 363 | Out << Sym << " : " ; |
| 364 | |
| 365 | if (Flag == SelfFlag_None) |
| 366 | Out << "none" ; |
| 367 | |
| 368 | if (Flag & SelfFlag_Self) |
| 369 | Out << "self variable" ; |
| 370 | |
| 371 | if (Flag & SelfFlag_InitRes) { |
| 372 | if (Flag != SelfFlag_InitRes) |
| 373 | Out << " | " ; |
| 374 | Out << "result of init method" ; |
| 375 | } |
| 376 | |
| 377 | Out << NL; |
| 378 | } |
| 379 | } |
| 380 | |
| 381 | |
| 382 | // FIXME: A callback should disable checkers at the start of functions. |
| 383 | static bool shouldRunOnFunctionOrMethod(const NamedDecl *ND) { |
| 384 | if (!ND) |
| 385 | return false; |
| 386 | |
| 387 | const ObjCMethodDecl *MD = dyn_cast<ObjCMethodDecl>(Val: ND); |
| 388 | if (!MD) |
| 389 | return false; |
| 390 | if (!isInitializationMethod(MD)) |
| 391 | return false; |
| 392 | |
| 393 | // self = [super init] applies only to NSObject subclasses. |
| 394 | // For instance, NSProxy doesn't implement -init. |
| 395 | ASTContext &Ctx = MD->getASTContext(); |
| 396 | IdentifierInfo* NSObjectII = &Ctx.Idents.get(Name: "NSObject" ); |
| 397 | ObjCInterfaceDecl *ID = MD->getClassInterface()->getSuperClass(); |
| 398 | for ( ; ID ; ID = ID->getSuperClass()) { |
| 399 | IdentifierInfo *II = ID->getIdentifier(); |
| 400 | |
| 401 | if (II == NSObjectII) |
| 402 | break; |
| 403 | } |
| 404 | return ID != nullptr; |
| 405 | } |
| 406 | |
| 407 | /// Returns true if the location is 'self'. |
| 408 | static bool isSelfVar(SVal location, CheckerContext &C) { |
| 409 | AnalysisDeclContext *analCtx = C.getCurrentAnalysisDeclContext(); |
| 410 | if (!analCtx->getSelfDecl()) |
| 411 | return false; |
| 412 | if (!isa<loc::MemRegionVal>(Val: location)) |
| 413 | return false; |
| 414 | |
| 415 | loc::MemRegionVal MRV = location.castAs<loc::MemRegionVal>(); |
| 416 | if (const DeclRegion *DR = dyn_cast<DeclRegion>(Val: MRV.stripCasts())) |
| 417 | return (DR->getDecl() == analCtx->getSelfDecl()); |
| 418 | |
| 419 | return false; |
| 420 | } |
| 421 | |
| 422 | static bool isInitializationMethod(const ObjCMethodDecl *MD) { |
| 423 | return MD->getMethodFamily() == OMF_init; |
| 424 | } |
| 425 | |
| 426 | static bool isInitMessage(const ObjCMethodCall &Call) { |
| 427 | return Call.getMethodFamily() == OMF_init; |
| 428 | } |
| 429 | |
| 430 | //===----------------------------------------------------------------------===// |
| 431 | // Registration. |
| 432 | //===----------------------------------------------------------------------===// |
| 433 | |
| 434 | void ento::registerObjCSelfInitChecker(CheckerManager &mgr) { |
| 435 | mgr.registerChecker<ObjCSelfInitChecker>(); |
| 436 | } |
| 437 | |
| 438 | bool ento::shouldRegisterObjCSelfInitChecker(const CheckerManager &mgr) { |
| 439 | return true; |
| 440 | } |
| 441 | |