1 //=== StackAddrEscapeChecker.cpp ----------------------------------*- C++ -*--// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file defines stack address leak checker, which checks if an invalid 10 // stack address is stored into a global or heap location. See CERT DCL30-C. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "clang/AST/ExprCXX.h" 15 #include "clang/Basic/SourceManager.h" 16 #include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h" 17 #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h" 18 #include "clang/StaticAnalyzer/Core/Checker.h" 19 #include "clang/StaticAnalyzer/Core/CheckerManager.h" 20 #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h" 21 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h" 22 #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState.h" 23 #include "llvm/ADT/SmallString.h" 24 #include "llvm/Support/raw_ostream.h" 25 using namespace clang; 26 using namespace ento; 27 28 namespace { 29 class StackAddrEscapeChecker 30 : public Checker<check::PreCall, check::PreStmt<ReturnStmt>, 31 check::EndFunction> { 32 mutable IdentifierInfo *dispatch_semaphore_tII = nullptr; 33 mutable std::unique_ptr<BugType> BT_stackleak; 34 mutable std::unique_ptr<BugType> BT_returnstack; 35 mutable std::unique_ptr<BugType> BT_capturedstackasync; 36 mutable std::unique_ptr<BugType> BT_capturedstackret; 37 38 public: 39 enum CheckKind { 40 CK_StackAddrEscapeChecker, 41 CK_StackAddrAsyncEscapeChecker, 42 CK_NumCheckKinds 43 }; 44 45 bool ChecksEnabled[CK_NumCheckKinds] = {false}; 46 CheckerNameRef CheckNames[CK_NumCheckKinds]; 47 48 void checkPreCall(const CallEvent &Call, CheckerContext &C) const; 49 void checkPreStmt(const ReturnStmt *RS, CheckerContext &C) const; 50 void checkEndFunction(const ReturnStmt *RS, CheckerContext &Ctx) const; 51 52 private: 53 void checkReturnedBlockCaptures(const BlockDataRegion &B, 54 CheckerContext &C) const; 55 void checkAsyncExecutedBlockCaptures(const BlockDataRegion &B, 56 CheckerContext &C) const; 57 void EmitStackError(CheckerContext &C, const MemRegion *R, 58 const Expr *RetE) const; 59 bool isSemaphoreCaptured(const BlockDecl &B) const; 60 static SourceRange genName(raw_ostream &os, const MemRegion *R, 61 ASTContext &Ctx); 62 static SmallVector<const MemRegion *, 4> 63 getCapturedStackRegions(const BlockDataRegion &B, CheckerContext &C); 64 static bool isNotInCurrentFrame(const MemRegion *R, CheckerContext &C); 65 }; 66 } // namespace 67 68 SourceRange StackAddrEscapeChecker::genName(raw_ostream &os, const MemRegion *R, 69 ASTContext &Ctx) { 70 // Get the base region, stripping away fields and elements. 71 R = R->getBaseRegion(); 72 SourceManager &SM = Ctx.getSourceManager(); 73 SourceRange range; 74 os << "Address of "; 75 76 // Check if the region is a compound literal. 77 if (const auto *CR = dyn_cast<CompoundLiteralRegion>(R)) { 78 const CompoundLiteralExpr *CL = CR->getLiteralExpr(); 79 os << "stack memory associated with a compound literal " 80 "declared on line " 81 << SM.getExpansionLineNumber(CL->getBeginLoc()) << " returned to caller"; 82 range = CL->getSourceRange(); 83 } else if (const auto *AR = dyn_cast<AllocaRegion>(R)) { 84 const Expr *ARE = AR->getExpr(); 85 SourceLocation L = ARE->getBeginLoc(); 86 range = ARE->getSourceRange(); 87 os << "stack memory allocated by call to alloca() on line " 88 << SM.getExpansionLineNumber(L); 89 } else if (const auto *BR = dyn_cast<BlockDataRegion>(R)) { 90 const BlockDecl *BD = BR->getCodeRegion()->getDecl(); 91 SourceLocation L = BD->getBeginLoc(); 92 range = BD->getSourceRange(); 93 os << "stack-allocated block declared on line " 94 << SM.getExpansionLineNumber(L); 95 } else if (const auto *VR = dyn_cast<VarRegion>(R)) { 96 os << "stack memory associated with local variable '" << VR->getString() 97 << '\''; 98 range = VR->getDecl()->getSourceRange(); 99 } else if (const auto *LER = dyn_cast<CXXLifetimeExtendedObjectRegion>(R)) { 100 QualType Ty = LER->getValueType().getLocalUnqualifiedType(); 101 os << "stack memory associated with temporary object of type '"; 102 Ty.print(os, Ctx.getPrintingPolicy()); 103 os << "' lifetime extended by local variable"; 104 if (const IdentifierInfo *ID = LER->getExtendingDecl()->getIdentifier()) 105 os << " '" << ID->getName() << '\''; 106 range = LER->getExpr()->getSourceRange(); 107 } else if (const auto *TOR = dyn_cast<CXXTempObjectRegion>(R)) { 108 QualType Ty = TOR->getValueType().getLocalUnqualifiedType(); 109 os << "stack memory associated with temporary object of type '"; 110 Ty.print(os, Ctx.getPrintingPolicy()); 111 os << "'"; 112 range = TOR->getExpr()->getSourceRange(); 113 } else { 114 llvm_unreachable("Invalid region in ReturnStackAddressChecker."); 115 } 116 117 return range; 118 } 119 120 bool StackAddrEscapeChecker::isNotInCurrentFrame(const MemRegion *R, 121 CheckerContext &C) { 122 const StackSpaceRegion *S = cast<StackSpaceRegion>(R->getMemorySpace()); 123 return S->getStackFrame() != C.getStackFrame(); 124 } 125 126 bool StackAddrEscapeChecker::isSemaphoreCaptured(const BlockDecl &B) const { 127 if (!dispatch_semaphore_tII) 128 dispatch_semaphore_tII = &B.getASTContext().Idents.get("dispatch_semaphore_t"); 129 for (const auto &C : B.captures()) { 130 const auto *T = C.getVariable()->getType()->getAs<TypedefType>(); 131 if (T && T->getDecl()->getIdentifier() == dispatch_semaphore_tII) 132 return true; 133 } 134 return false; 135 } 136 137 SmallVector<const MemRegion *, 4> 138 StackAddrEscapeChecker::getCapturedStackRegions(const BlockDataRegion &B, 139 CheckerContext &C) { 140 SmallVector<const MemRegion *, 4> Regions; 141 for (auto Var : B.referenced_vars()) { 142 SVal Val = C.getState()->getSVal(Var.getCapturedRegion()); 143 const MemRegion *Region = Val.getAsRegion(); 144 if (Region && isa<StackSpaceRegion>(Region->getMemorySpace())) 145 Regions.push_back(Region); 146 } 147 return Regions; 148 } 149 150 void StackAddrEscapeChecker::EmitStackError(CheckerContext &C, 151 const MemRegion *R, 152 const Expr *RetE) const { 153 ExplodedNode *N = C.generateNonFatalErrorNode(); 154 if (!N) 155 return; 156 if (!BT_returnstack) 157 BT_returnstack = std::make_unique<BugType>( 158 CheckNames[CK_StackAddrEscapeChecker], 159 "Return of address to stack-allocated memory"); 160 // Generate a report for this bug. 161 SmallString<128> buf; 162 llvm::raw_svector_ostream os(buf); 163 SourceRange range = genName(os, R, C.getASTContext()); 164 os << " returned to caller"; 165 auto report = 166 std::make_unique<PathSensitiveBugReport>(*BT_returnstack, os.str(), N); 167 report->addRange(RetE->getSourceRange()); 168 if (range.isValid()) 169 report->addRange(range); 170 C.emitReport(std::move(report)); 171 } 172 173 void StackAddrEscapeChecker::checkAsyncExecutedBlockCaptures( 174 const BlockDataRegion &B, CheckerContext &C) const { 175 // There is a not-too-uncommon idiom 176 // where a block passed to dispatch_async captures a semaphore 177 // and then the thread (which called dispatch_async) is blocked on waiting 178 // for the completion of the execution of the block 179 // via dispatch_semaphore_wait. To avoid false-positives (for now) 180 // we ignore all the blocks which have captured 181 // a variable of the type "dispatch_semaphore_t". 182 if (isSemaphoreCaptured(*B.getDecl())) 183 return; 184 for (const MemRegion *Region : getCapturedStackRegions(B, C)) { 185 // The block passed to dispatch_async may capture another block 186 // created on the stack. However, there is no leak in this situaton, 187 // no matter if ARC or no ARC is enabled: 188 // dispatch_async copies the passed "outer" block (via Block_copy) 189 // and if the block has captured another "inner" block, 190 // the "inner" block will be copied as well. 191 if (isa<BlockDataRegion>(Region)) 192 continue; 193 ExplodedNode *N = C.generateNonFatalErrorNode(); 194 if (!N) 195 continue; 196 if (!BT_capturedstackasync) 197 BT_capturedstackasync = std::make_unique<BugType>( 198 CheckNames[CK_StackAddrAsyncEscapeChecker], 199 "Address of stack-allocated memory is captured"); 200 SmallString<128> Buf; 201 llvm::raw_svector_ostream Out(Buf); 202 SourceRange Range = genName(Out, Region, C.getASTContext()); 203 Out << " is captured by an asynchronously-executed block"; 204 auto Report = std::make_unique<PathSensitiveBugReport>( 205 *BT_capturedstackasync, Out.str(), N); 206 if (Range.isValid()) 207 Report->addRange(Range); 208 C.emitReport(std::move(Report)); 209 } 210 } 211 212 void StackAddrEscapeChecker::checkReturnedBlockCaptures( 213 const BlockDataRegion &B, CheckerContext &C) const { 214 for (const MemRegion *Region : getCapturedStackRegions(B, C)) { 215 if (isNotInCurrentFrame(Region, C)) 216 continue; 217 ExplodedNode *N = C.generateNonFatalErrorNode(); 218 if (!N) 219 continue; 220 if (!BT_capturedstackret) 221 BT_capturedstackret = std::make_unique<BugType>( 222 CheckNames[CK_StackAddrEscapeChecker], 223 "Address of stack-allocated memory is captured"); 224 SmallString<128> Buf; 225 llvm::raw_svector_ostream Out(Buf); 226 SourceRange Range = genName(Out, Region, C.getASTContext()); 227 Out << " is captured by a returned block"; 228 auto Report = std::make_unique<PathSensitiveBugReport>(*BT_capturedstackret, 229 Out.str(), N); 230 if (Range.isValid()) 231 Report->addRange(Range); 232 C.emitReport(std::move(Report)); 233 } 234 } 235 236 void StackAddrEscapeChecker::checkPreCall(const CallEvent &Call, 237 CheckerContext &C) const { 238 if (!ChecksEnabled[CK_StackAddrAsyncEscapeChecker]) 239 return; 240 if (!Call.isGlobalCFunction("dispatch_after") && 241 !Call.isGlobalCFunction("dispatch_async")) 242 return; 243 for (unsigned Idx = 0, NumArgs = Call.getNumArgs(); Idx < NumArgs; ++Idx) { 244 if (const BlockDataRegion *B = dyn_cast_or_null<BlockDataRegion>( 245 Call.getArgSVal(Idx).getAsRegion())) 246 checkAsyncExecutedBlockCaptures(*B, C); 247 } 248 } 249 250 void StackAddrEscapeChecker::checkPreStmt(const ReturnStmt *RS, 251 CheckerContext &C) const { 252 if (!ChecksEnabled[CK_StackAddrEscapeChecker]) 253 return; 254 255 const Expr *RetE = RS->getRetValue(); 256 if (!RetE) 257 return; 258 RetE = RetE->IgnoreParens(); 259 260 SVal V = C.getSVal(RetE); 261 const MemRegion *R = V.getAsRegion(); 262 if (!R) 263 return; 264 265 if (const BlockDataRegion *B = dyn_cast<BlockDataRegion>(R)) 266 checkReturnedBlockCaptures(*B, C); 267 268 if (!isa<StackSpaceRegion>(R->getMemorySpace()) || isNotInCurrentFrame(R, C)) 269 return; 270 271 // Returning a record by value is fine. (In this case, the returned 272 // expression will be a copy-constructor, possibly wrapped in an 273 // ExprWithCleanups node.) 274 if (const ExprWithCleanups *Cleanup = dyn_cast<ExprWithCleanups>(RetE)) 275 RetE = Cleanup->getSubExpr(); 276 if (isa<CXXConstructExpr>(RetE) && RetE->getType()->isRecordType()) 277 return; 278 279 // The CK_CopyAndAutoreleaseBlockObject cast causes the block to be copied 280 // so the stack address is not escaping here. 281 if (const auto *ICE = dyn_cast<ImplicitCastExpr>(RetE)) { 282 if (isa<BlockDataRegion>(R) && 283 ICE->getCastKind() == CK_CopyAndAutoreleaseBlockObject) { 284 return; 285 } 286 } 287 288 EmitStackError(C, R, RetE); 289 } 290 291 static const MemSpaceRegion *getStackOrGlobalSpaceRegion(const MemRegion *R) { 292 assert(R); 293 if (const auto *MemSpace = R->getMemorySpace()) { 294 if (const auto *SSR = MemSpace->getAs<StackSpaceRegion>()) 295 return SSR; 296 if (const auto *GSR = MemSpace->getAs<GlobalsSpaceRegion>()) 297 return GSR; 298 } 299 // If R describes a lambda capture, it will be a symbolic region 300 // referring to a field region of another symbolic region. 301 if (const auto *SymReg = R->getBaseRegion()->getAs<SymbolicRegion>()) { 302 if (const auto *OriginReg = SymReg->getSymbol()->getOriginRegion()) 303 return getStackOrGlobalSpaceRegion(OriginReg); 304 } 305 return nullptr; 306 } 307 308 const MemRegion *getOriginBaseRegion(const MemRegion *Reg) { 309 Reg = Reg->getBaseRegion(); 310 while (const auto *SymReg = dyn_cast<SymbolicRegion>(Reg)) { 311 const auto *OriginReg = SymReg->getSymbol()->getOriginRegion(); 312 if (!OriginReg) 313 break; 314 Reg = OriginReg->getBaseRegion(); 315 } 316 return Reg; 317 } 318 319 std::optional<std::string> printReferrer(const MemRegion *Referrer) { 320 assert(Referrer); 321 const StringRef ReferrerMemorySpace = [](const MemSpaceRegion *Space) { 322 if (isa<StaticGlobalSpaceRegion>(Space)) 323 return "static"; 324 if (isa<GlobalsSpaceRegion>(Space)) 325 return "global"; 326 assert(isa<StackSpaceRegion>(Space)); 327 // This case covers top-level and inlined analyses. 328 return "caller"; 329 }(getStackOrGlobalSpaceRegion(Referrer)); 330 331 while (!Referrer->canPrintPretty()) { 332 if (const auto *SymReg = dyn_cast<SymbolicRegion>(Referrer); 333 SymReg && SymReg->getSymbol()->getOriginRegion()) { 334 Referrer = SymReg->getSymbol()->getOriginRegion()->getBaseRegion(); 335 } else if (isa<CXXThisRegion>(Referrer)) { 336 // Skip members of a class, it is handled in CheckExprLifetime.cpp as 337 // warn_bind_ref_member_to_parameter or 338 // warn_init_ptr_member_to_parameter_addr 339 return std::nullopt; 340 } else { 341 assert(false && "Unexpected referrer region type."); 342 return std::nullopt; 343 } 344 } 345 assert(Referrer); 346 assert(Referrer->canPrintPretty()); 347 348 std::string buf; 349 llvm::raw_string_ostream os(buf); 350 os << ReferrerMemorySpace << " variable "; 351 Referrer->printPretty(os); 352 return buf; 353 } 354 355 /// Check whether \p Region refers to a freshly minted symbol after an opaque 356 /// function call. 357 bool isInvalidatedSymbolRegion(const MemRegion *Region) { 358 const auto *SymReg = Region->getAs<SymbolicRegion>(); 359 if (!SymReg) 360 return false; 361 SymbolRef Symbol = SymReg->getSymbol(); 362 363 const auto *DerS = dyn_cast<SymbolDerived>(Symbol); 364 return DerS && isa_and_nonnull<SymbolConjured>(DerS->getParentSymbol()); 365 } 366 367 void StackAddrEscapeChecker::checkEndFunction(const ReturnStmt *RS, 368 CheckerContext &Ctx) const { 369 if (!ChecksEnabled[CK_StackAddrEscapeChecker]) 370 return; 371 372 ExplodedNode *Node = Ctx.getPredecessor(); 373 374 bool ExitingTopFrame = 375 Ctx.getPredecessor()->getLocationContext()->inTopFrame(); 376 377 if (ExitingTopFrame && 378 Node->getLocation().getTag() == ExprEngine::cleanupNodeTag() && 379 Node->getFirstPred()) { 380 // When finishing analysis of a top-level function, engine proactively 381 // removes dead symbols thus preventing this checker from looking through 382 // the output parameters. Take 1 step back, to the node where these symbols 383 // and their bindings are still present 384 Node = Node->getFirstPred(); 385 } 386 387 // Iterate over all bindings to global variables and see if it contains 388 // a memory region in the stack space. 389 class CallBack : public StoreManager::BindingsHandler { 390 private: 391 CheckerContext &Ctx; 392 const StackFrameContext *PoppedFrame; 393 const bool TopFrame; 394 395 /// Look for stack variables referring to popped stack variables. 396 /// Returns true only if it found some dangling stack variables 397 /// referred by an other stack variable from different stack frame. 398 bool checkForDanglingStackVariable(const MemRegion *Referrer, 399 const MemRegion *Referred) { 400 const auto *ReferrerMemSpace = getStackOrGlobalSpaceRegion(Referrer); 401 const auto *ReferredMemSpace = 402 Referred->getMemorySpace()->getAs<StackSpaceRegion>(); 403 404 if (!ReferrerMemSpace || !ReferredMemSpace) 405 return false; 406 407 const auto *ReferrerStackSpace = 408 ReferrerMemSpace->getAs<StackSpaceRegion>(); 409 410 if (!ReferrerStackSpace) 411 return false; 412 413 if (const auto *ReferredFrame = ReferredMemSpace->getStackFrame(); 414 ReferredFrame != PoppedFrame) { 415 return false; 416 } 417 418 if (ReferrerStackSpace->getStackFrame()->isParentOf(PoppedFrame)) { 419 V.emplace_back(Referrer, Referred); 420 return true; 421 } 422 if (isa<StackArgumentsSpaceRegion>(ReferrerMemSpace) && 423 ReferrerStackSpace->getStackFrame() == PoppedFrame && TopFrame) { 424 // Output parameter of a top-level function 425 V.emplace_back(Referrer, Referred); 426 return true; 427 } 428 return false; 429 } 430 431 // Keep track of the variables that were invalidated through an opaque 432 // function call. Even if the initial values of such variables were bound to 433 // an address of a local variable, we cannot claim anything now, at the 434 // function exit, so skip them to avoid false positives. 435 void recordInInvalidatedRegions(const MemRegion *Region) { 436 if (isInvalidatedSymbolRegion(Region)) 437 ExcludedRegions.insert(getOriginBaseRegion(Region)); 438 } 439 440 public: 441 SmallVector<std::pair<const MemRegion *, const MemRegion *>, 10> V; 442 // ExcludedRegions are skipped from reporting. 443 // I.e., if a referrer in this set, skip the related bug report. 444 // It is useful to avoid false positive for the variables that were 445 // reset to a conjured value after an opaque function call. 446 llvm::SmallPtrSet<const MemRegion *, 4> ExcludedRegions; 447 448 CallBack(CheckerContext &CC, bool TopFrame) 449 : Ctx(CC), PoppedFrame(CC.getStackFrame()), TopFrame(TopFrame) {} 450 451 bool HandleBinding(StoreManager &SMgr, Store S, const MemRegion *Region, 452 SVal Val) override { 453 recordInInvalidatedRegions(Region); 454 const MemRegion *VR = Val.getAsRegion(); 455 if (!VR) 456 return true; 457 458 if (checkForDanglingStackVariable(Region, VR)) 459 return true; 460 461 // Check the globals for the same. 462 if (!isa_and_nonnull<GlobalsSpaceRegion>( 463 getStackOrGlobalSpaceRegion(Region))) 464 return true; 465 if (VR && VR->hasStackStorage() && !isNotInCurrentFrame(VR, Ctx)) 466 V.emplace_back(Region, VR); 467 return true; 468 } 469 }; 470 471 CallBack Cb(Ctx, ExitingTopFrame); 472 ProgramStateRef State = Node->getState(); 473 State->getStateManager().getStoreManager().iterBindings(State->getStore(), 474 Cb); 475 476 if (Cb.V.empty()) 477 return; 478 479 // Generate an error node. 480 ExplodedNode *N = Ctx.generateNonFatalErrorNode(State, Node); 481 if (!N) 482 return; 483 484 if (!BT_stackleak) 485 BT_stackleak = 486 std::make_unique<BugType>(CheckNames[CK_StackAddrEscapeChecker], 487 "Stack address leaks outside of stack frame"); 488 489 for (const auto &P : Cb.V) { 490 const MemRegion *Referrer = P.first->getBaseRegion(); 491 const MemRegion *Referred = P.second; 492 if (Cb.ExcludedRegions.contains(getOriginBaseRegion(Referrer))) { 493 continue; 494 } 495 496 // Generate a report for this bug. 497 const StringRef CommonSuffix = 498 " upon returning to the caller. This will be a dangling reference"; 499 SmallString<128> Buf; 500 llvm::raw_svector_ostream Out(Buf); 501 const SourceRange Range = genName(Out, Referred, Ctx.getASTContext()); 502 503 if (isa<CXXTempObjectRegion, CXXLifetimeExtendedObjectRegion>(Referrer)) { 504 Out << " is still referred to by a temporary object on the stack" 505 << CommonSuffix; 506 auto Report = 507 std::make_unique<PathSensitiveBugReport>(*BT_stackleak, Out.str(), N); 508 if (Range.isValid()) 509 Report->addRange(Range); 510 Ctx.emitReport(std::move(Report)); 511 return; 512 } 513 514 auto ReferrerVariable = printReferrer(Referrer); 515 if (!ReferrerVariable) { 516 continue; 517 } 518 519 Out << " is still referred to by the " << *ReferrerVariable << CommonSuffix; 520 auto Report = 521 std::make_unique<PathSensitiveBugReport>(*BT_stackleak, Out.str(), N); 522 if (Range.isValid()) 523 Report->addRange(Range); 524 525 Ctx.emitReport(std::move(Report)); 526 } 527 } 528 529 void ento::registerStackAddrEscapeBase(CheckerManager &mgr) { 530 mgr.registerChecker<StackAddrEscapeChecker>(); 531 } 532 533 bool ento::shouldRegisterStackAddrEscapeBase(const CheckerManager &mgr) { 534 return true; 535 } 536 537 #define REGISTER_CHECKER(name) \ 538 void ento::register##name(CheckerManager &Mgr) { \ 539 StackAddrEscapeChecker *Chk = Mgr.getChecker<StackAddrEscapeChecker>(); \ 540 Chk->ChecksEnabled[StackAddrEscapeChecker::CK_##name] = true; \ 541 Chk->CheckNames[StackAddrEscapeChecker::CK_##name] = \ 542 Mgr.getCurrentCheckerName(); \ 543 } \ 544 \ 545 bool ento::shouldRegister##name(const CheckerManager &mgr) { return true; } 546 547 REGISTER_CHECKER(StackAddrEscapeChecker) 548 REGISTER_CHECKER(StackAddrAsyncEscapeChecker) 549