10b57cec5SDimitry Andric //===--- NonNullParamChecker.cpp - Undefined arguments checker -*- C++ -*--===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This defines NonNullParamChecker, which checks for arguments expected not to
100b57cec5SDimitry Andric // be null due to:
110b57cec5SDimitry Andric // - the corresponding parameters being declared to have nonnull attribute
120b57cec5SDimitry Andric // - the corresponding parameters being references; since the call would form
130b57cec5SDimitry Andric // a reference to a null pointer
140b57cec5SDimitry Andric //
150b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
160b57cec5SDimitry Andric
170b57cec5SDimitry Andric #include "clang/AST/Attr.h"
185ffd83dbSDimitry Andric #include "clang/Analysis/AnyCall.h"
195ffd83dbSDimitry Andric #include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h"
200b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
21*647cbc5dSDimitry Andric #include "clang/StaticAnalyzer/Core/BugReporter/CommonBugCategories.h"
220b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/Checker.h"
230b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/CheckerManager.h"
240b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h"
250b57cec5SDimitry Andric #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
265ffd83dbSDimitry Andric #include "llvm/ADT/StringExtras.h"
270b57cec5SDimitry Andric
280b57cec5SDimitry Andric using namespace clang;
290b57cec5SDimitry Andric using namespace ento;
300b57cec5SDimitry Andric
310b57cec5SDimitry Andric namespace {
320b57cec5SDimitry Andric class NonNullParamChecker
335ffd83dbSDimitry Andric : public Checker<check::PreCall, check::BeginFunction,
345ffd83dbSDimitry Andric EventDispatcher<ImplicitNullDerefEvent>> {
35*647cbc5dSDimitry Andric const BugType BTAttrNonNull{
36*647cbc5dSDimitry Andric this, "Argument with 'nonnull' attribute passed null", "API"};
37*647cbc5dSDimitry Andric const BugType BTNullRefArg{this, "Dereference of null pointer"};
380b57cec5SDimitry Andric
390b57cec5SDimitry Andric public:
400b57cec5SDimitry Andric void checkPreCall(const CallEvent &Call, CheckerContext &C) const;
415ffd83dbSDimitry Andric void checkBeginFunction(CheckerContext &C) const;
420b57cec5SDimitry Andric
43a7dea167SDimitry Andric std::unique_ptr<PathSensitiveBugReport>
445ffd83dbSDimitry Andric genReportNullAttrNonNull(const ExplodedNode *ErrorN, const Expr *ArgE,
45a7dea167SDimitry Andric unsigned IdxOfArg) const;
46a7dea167SDimitry Andric std::unique_ptr<PathSensitiveBugReport>
470b57cec5SDimitry Andric genReportReferenceToNullPointer(const ExplodedNode *ErrorN,
480b57cec5SDimitry Andric const Expr *ArgE) const;
490b57cec5SDimitry Andric };
500b57cec5SDimitry Andric
515ffd83dbSDimitry Andric template <class CallType>
setBitsAccordingToFunctionAttributes(const CallType & Call,llvm::SmallBitVector & AttrNonNull)525ffd83dbSDimitry Andric void setBitsAccordingToFunctionAttributes(const CallType &Call,
535ffd83dbSDimitry Andric llvm::SmallBitVector &AttrNonNull) {
540b57cec5SDimitry Andric const Decl *FD = Call.getDecl();
555ffd83dbSDimitry Andric
560b57cec5SDimitry Andric for (const auto *NonNull : FD->specific_attrs<NonNullAttr>()) {
570b57cec5SDimitry Andric if (!NonNull->args_size()) {
585ffd83dbSDimitry Andric // Lack of attribute parameters means that all of the parameters are
595ffd83dbSDimitry Andric // implicitly marked as non-null.
605ffd83dbSDimitry Andric AttrNonNull.set();
610b57cec5SDimitry Andric break;
620b57cec5SDimitry Andric }
635ffd83dbSDimitry Andric
640b57cec5SDimitry Andric for (const ParamIdx &Idx : NonNull->args()) {
655ffd83dbSDimitry Andric // 'nonnull' attribute's parameters are 1-based and should be adjusted to
665ffd83dbSDimitry Andric // match actual AST parameter/argument indices.
670b57cec5SDimitry Andric unsigned IdxAST = Idx.getASTIndex();
685ffd83dbSDimitry Andric if (IdxAST >= AttrNonNull.size())
690b57cec5SDimitry Andric continue;
700b57cec5SDimitry Andric AttrNonNull.set(IdxAST);
710b57cec5SDimitry Andric }
720b57cec5SDimitry Andric }
735ffd83dbSDimitry Andric }
745ffd83dbSDimitry Andric
755ffd83dbSDimitry Andric template <class CallType>
setBitsAccordingToParameterAttributes(const CallType & Call,llvm::SmallBitVector & AttrNonNull)765ffd83dbSDimitry Andric void setBitsAccordingToParameterAttributes(const CallType &Call,
775ffd83dbSDimitry Andric llvm::SmallBitVector &AttrNonNull) {
785ffd83dbSDimitry Andric for (const ParmVarDecl *Parameter : Call.parameters()) {
795ffd83dbSDimitry Andric unsigned ParameterIndex = Parameter->getFunctionScopeIndex();
805ffd83dbSDimitry Andric if (ParameterIndex == AttrNonNull.size())
815ffd83dbSDimitry Andric break;
825ffd83dbSDimitry Andric
835ffd83dbSDimitry Andric if (Parameter->hasAttr<NonNullAttr>())
845ffd83dbSDimitry Andric AttrNonNull.set(ParameterIndex);
855ffd83dbSDimitry Andric }
865ffd83dbSDimitry Andric }
875ffd83dbSDimitry Andric
885ffd83dbSDimitry Andric template <class CallType>
getNonNullAttrsImpl(const CallType & Call,unsigned ExpectedSize)895ffd83dbSDimitry Andric llvm::SmallBitVector getNonNullAttrsImpl(const CallType &Call,
905ffd83dbSDimitry Andric unsigned ExpectedSize) {
915ffd83dbSDimitry Andric llvm::SmallBitVector AttrNonNull(ExpectedSize);
925ffd83dbSDimitry Andric
935ffd83dbSDimitry Andric setBitsAccordingToFunctionAttributes(Call, AttrNonNull);
945ffd83dbSDimitry Andric setBitsAccordingToParameterAttributes(Call, AttrNonNull);
955ffd83dbSDimitry Andric
960b57cec5SDimitry Andric return AttrNonNull;
970b57cec5SDimitry Andric }
980b57cec5SDimitry Andric
995ffd83dbSDimitry Andric /// \return Bitvector marking non-null attributes.
getNonNullAttrs(const CallEvent & Call)1005ffd83dbSDimitry Andric llvm::SmallBitVector getNonNullAttrs(const CallEvent &Call) {
1015ffd83dbSDimitry Andric return getNonNullAttrsImpl(Call, Call.getNumArgs());
1025ffd83dbSDimitry Andric }
1035ffd83dbSDimitry Andric
1045ffd83dbSDimitry Andric /// \return Bitvector marking non-null attributes.
getNonNullAttrs(const AnyCall & Call)1055ffd83dbSDimitry Andric llvm::SmallBitVector getNonNullAttrs(const AnyCall &Call) {
1065ffd83dbSDimitry Andric return getNonNullAttrsImpl(Call, Call.param_size());
1075ffd83dbSDimitry Andric }
1085ffd83dbSDimitry Andric } // end anonymous namespace
1095ffd83dbSDimitry Andric
checkPreCall(const CallEvent & Call,CheckerContext & C) const1100b57cec5SDimitry Andric void NonNullParamChecker::checkPreCall(const CallEvent &Call,
1110b57cec5SDimitry Andric CheckerContext &C) const {
1120b57cec5SDimitry Andric if (!Call.getDecl())
1130b57cec5SDimitry Andric return;
1140b57cec5SDimitry Andric
1150b57cec5SDimitry Andric llvm::SmallBitVector AttrNonNull = getNonNullAttrs(Call);
1160b57cec5SDimitry Andric unsigned NumArgs = Call.getNumArgs();
1170b57cec5SDimitry Andric
1180b57cec5SDimitry Andric ProgramStateRef state = C.getState();
1190b57cec5SDimitry Andric ArrayRef<ParmVarDecl *> parms = Call.parameters();
1200b57cec5SDimitry Andric
1210b57cec5SDimitry Andric for (unsigned idx = 0; idx < NumArgs; ++idx) {
1220b57cec5SDimitry Andric // For vararg functions, a corresponding parameter decl may not exist.
1230b57cec5SDimitry Andric bool HasParam = idx < parms.size();
1240b57cec5SDimitry Andric
1250b57cec5SDimitry Andric // Check if the parameter is a reference. We want to report when reference
1260b57cec5SDimitry Andric // to a null pointer is passed as a parameter.
1275ffd83dbSDimitry Andric bool HasRefTypeParam =
1280b57cec5SDimitry Andric HasParam ? parms[idx]->getType()->isReferenceType() : false;
1295ffd83dbSDimitry Andric bool ExpectedToBeNonNull = AttrNonNull.test(idx);
1300b57cec5SDimitry Andric
1315ffd83dbSDimitry Andric if (!ExpectedToBeNonNull && !HasRefTypeParam)
1320b57cec5SDimitry Andric continue;
1330b57cec5SDimitry Andric
1340b57cec5SDimitry Andric // If the value is unknown or undefined, we can't perform this check.
1350b57cec5SDimitry Andric const Expr *ArgE = Call.getArgExpr(idx);
1360b57cec5SDimitry Andric SVal V = Call.getArgSVal(idx);
1370b57cec5SDimitry Andric auto DV = V.getAs<DefinedSVal>();
1380b57cec5SDimitry Andric if (!DV)
1390b57cec5SDimitry Andric continue;
1400b57cec5SDimitry Andric
141bdd1243dSDimitry Andric assert(!HasRefTypeParam || isa<Loc>(*DV));
1420b57cec5SDimitry Andric
1430b57cec5SDimitry Andric // Process the case when the argument is not a location.
144bdd1243dSDimitry Andric if (ExpectedToBeNonNull && !isa<Loc>(*DV)) {
1450b57cec5SDimitry Andric // If the argument is a union type, we want to handle a potential
1460b57cec5SDimitry Andric // transparent_union GCC extension.
1470b57cec5SDimitry Andric if (!ArgE)
1480b57cec5SDimitry Andric continue;
1490b57cec5SDimitry Andric
1500b57cec5SDimitry Andric QualType T = ArgE->getType();
1510b57cec5SDimitry Andric const RecordType *UT = T->getAsUnionType();
1520b57cec5SDimitry Andric if (!UT || !UT->getDecl()->hasAttr<TransparentUnionAttr>())
1530b57cec5SDimitry Andric continue;
1540b57cec5SDimitry Andric
1550b57cec5SDimitry Andric auto CSV = DV->getAs<nonloc::CompoundVal>();
1560b57cec5SDimitry Andric
1570b57cec5SDimitry Andric // FIXME: Handle LazyCompoundVals?
1580b57cec5SDimitry Andric if (!CSV)
1590b57cec5SDimitry Andric continue;
1600b57cec5SDimitry Andric
1610b57cec5SDimitry Andric V = *(CSV->begin());
1620b57cec5SDimitry Andric DV = V.getAs<DefinedSVal>();
1630b57cec5SDimitry Andric assert(++CSV->begin() == CSV->end());
1640b57cec5SDimitry Andric // FIXME: Handle (some_union){ some_other_union_val }, which turns into
1650b57cec5SDimitry Andric // a LazyCompoundVal inside a CompoundVal.
16681ad6265SDimitry Andric if (!isa<Loc>(V))
1670b57cec5SDimitry Andric continue;
1680b57cec5SDimitry Andric
1690b57cec5SDimitry Andric // Retrieve the corresponding expression.
1700b57cec5SDimitry Andric if (const auto *CE = dyn_cast<CompoundLiteralExpr>(ArgE))
1710b57cec5SDimitry Andric if (const auto *IE = dyn_cast<InitListExpr>(CE->getInitializer()))
1720b57cec5SDimitry Andric ArgE = dyn_cast<Expr>(*(IE->begin()));
1730b57cec5SDimitry Andric }
1740b57cec5SDimitry Andric
1750b57cec5SDimitry Andric ConstraintManager &CM = C.getConstraintManager();
1760b57cec5SDimitry Andric ProgramStateRef stateNotNull, stateNull;
1770b57cec5SDimitry Andric std::tie(stateNotNull, stateNull) = CM.assumeDual(state, *DV);
1780b57cec5SDimitry Andric
1790b57cec5SDimitry Andric // Generate an error node. Check for a null node in case
1800b57cec5SDimitry Andric // we cache out.
1810b57cec5SDimitry Andric if (stateNull && !stateNotNull) {
1820b57cec5SDimitry Andric if (ExplodedNode *errorNode = C.generateErrorNode(stateNull)) {
1830b57cec5SDimitry Andric
1840b57cec5SDimitry Andric std::unique_ptr<BugReport> R;
1855ffd83dbSDimitry Andric if (ExpectedToBeNonNull)
186a7dea167SDimitry Andric R = genReportNullAttrNonNull(errorNode, ArgE, idx + 1);
1875ffd83dbSDimitry Andric else if (HasRefTypeParam)
1880b57cec5SDimitry Andric R = genReportReferenceToNullPointer(errorNode, ArgE);
1890b57cec5SDimitry Andric
1900b57cec5SDimitry Andric // Highlight the range of the argument that was null.
1910b57cec5SDimitry Andric R->addRange(Call.getArgSourceRange(idx));
1920b57cec5SDimitry Andric
1930b57cec5SDimitry Andric // Emit the bug report.
1940b57cec5SDimitry Andric C.emitReport(std::move(R));
1950b57cec5SDimitry Andric }
1960b57cec5SDimitry Andric
1970b57cec5SDimitry Andric // Always return. Either we cached out or we just emitted an error.
1980b57cec5SDimitry Andric return;
1990b57cec5SDimitry Andric }
2000b57cec5SDimitry Andric
2010b57cec5SDimitry Andric if (stateNull) {
2020b57cec5SDimitry Andric if (ExplodedNode *N = C.generateSink(stateNull, C.getPredecessor())) {
2030b57cec5SDimitry Andric ImplicitNullDerefEvent event = {
2040b57cec5SDimitry Andric V, false, N, &C.getBugReporter(),
2055ffd83dbSDimitry Andric /*IsDirectDereference=*/HasRefTypeParam};
2060b57cec5SDimitry Andric dispatchEvent(event);
2070b57cec5SDimitry Andric }
2080b57cec5SDimitry Andric }
2090b57cec5SDimitry Andric
2100b57cec5SDimitry Andric // If a pointer value passed the check we should assume that it is
2110b57cec5SDimitry Andric // indeed not null from this point forward.
2120b57cec5SDimitry Andric state = stateNotNull;
2130b57cec5SDimitry Andric }
2140b57cec5SDimitry Andric
2150b57cec5SDimitry Andric // If we reach here all of the arguments passed the nonnull check.
2160b57cec5SDimitry Andric // If 'state' has been updated generated a new node.
2170b57cec5SDimitry Andric C.addTransition(state);
2180b57cec5SDimitry Andric }
2190b57cec5SDimitry Andric
2205ffd83dbSDimitry Andric /// We want to trust developer annotations and consider all 'nonnull' parameters
2215ffd83dbSDimitry Andric /// as non-null indeed. Each marked parameter will get a corresponding
2225ffd83dbSDimitry Andric /// constraint.
2235ffd83dbSDimitry Andric ///
2245ffd83dbSDimitry Andric /// This approach will not only help us to get rid of some false positives, but
2255ffd83dbSDimitry Andric /// remove duplicates and shorten warning traces as well.
2265ffd83dbSDimitry Andric ///
2275ffd83dbSDimitry Andric /// \code
2285ffd83dbSDimitry Andric /// void foo(int *x) [[gnu::nonnull]] {
2295ffd83dbSDimitry Andric /// // . . .
2305ffd83dbSDimitry Andric /// *x = 42; // we don't want to consider this as an error...
2315ffd83dbSDimitry Andric /// // . . .
2325ffd83dbSDimitry Andric /// }
2335ffd83dbSDimitry Andric ///
2345ffd83dbSDimitry Andric /// foo(nullptr); // ...and report here instead
2355ffd83dbSDimitry Andric /// \endcode
checkBeginFunction(CheckerContext & Context) const2365ffd83dbSDimitry Andric void NonNullParamChecker::checkBeginFunction(CheckerContext &Context) const {
2375ffd83dbSDimitry Andric // Planned assumption makes sense only for top-level functions.
2385ffd83dbSDimitry Andric // Inlined functions will get similar constraints as part of 'checkPreCall'.
2395ffd83dbSDimitry Andric if (!Context.inTopFrame())
2405ffd83dbSDimitry Andric return;
2415ffd83dbSDimitry Andric
2425ffd83dbSDimitry Andric const LocationContext *LocContext = Context.getLocationContext();
2435ffd83dbSDimitry Andric
2445ffd83dbSDimitry Andric const Decl *FD = LocContext->getDecl();
2455ffd83dbSDimitry Andric // AnyCall helps us here to avoid checking for FunctionDecl and ObjCMethodDecl
2465ffd83dbSDimitry Andric // separately and aggregates interfaces of these classes.
2475ffd83dbSDimitry Andric auto AbstractCall = AnyCall::forDecl(FD);
2485ffd83dbSDimitry Andric if (!AbstractCall)
2495ffd83dbSDimitry Andric return;
2505ffd83dbSDimitry Andric
2515ffd83dbSDimitry Andric ProgramStateRef State = Context.getState();
2525ffd83dbSDimitry Andric llvm::SmallBitVector ParameterNonNullMarks = getNonNullAttrs(*AbstractCall);
2535ffd83dbSDimitry Andric
2545ffd83dbSDimitry Andric for (const ParmVarDecl *Parameter : AbstractCall->parameters()) {
2555ffd83dbSDimitry Andric // 1. Check parameter if it is annotated as non-null
2565ffd83dbSDimitry Andric if (!ParameterNonNullMarks.test(Parameter->getFunctionScopeIndex()))
2575ffd83dbSDimitry Andric continue;
2585ffd83dbSDimitry Andric
2595ffd83dbSDimitry Andric // 2. Check that parameter is a pointer.
2605ffd83dbSDimitry Andric // Nonnull attribute can be applied to non-pointers (by default
2615ffd83dbSDimitry Andric // __attribute__(nonnull) implies "all parameters").
2625ffd83dbSDimitry Andric if (!Parameter->getType()->isPointerType())
2635ffd83dbSDimitry Andric continue;
2645ffd83dbSDimitry Andric
2655ffd83dbSDimitry Andric Loc ParameterLoc = State->getLValue(Parameter, LocContext);
2665ffd83dbSDimitry Andric // We never consider top-level function parameters undefined.
2675ffd83dbSDimitry Andric auto StoredVal =
2685ffd83dbSDimitry Andric State->getSVal(ParameterLoc).castAs<DefinedOrUnknownSVal>();
2695ffd83dbSDimitry Andric
2705ffd83dbSDimitry Andric // 3. Assume that it is indeed non-null
2715ffd83dbSDimitry Andric if (ProgramStateRef NewState = State->assume(StoredVal, true)) {
2725ffd83dbSDimitry Andric State = NewState;
2735ffd83dbSDimitry Andric }
2745ffd83dbSDimitry Andric }
2755ffd83dbSDimitry Andric
2765ffd83dbSDimitry Andric Context.addTransition(State);
2775ffd83dbSDimitry Andric }
2785ffd83dbSDimitry Andric
279a7dea167SDimitry Andric std::unique_ptr<PathSensitiveBugReport>
genReportNullAttrNonNull(const ExplodedNode * ErrorNode,const Expr * ArgE,unsigned IdxOfArg) const2800b57cec5SDimitry Andric NonNullParamChecker::genReportNullAttrNonNull(const ExplodedNode *ErrorNode,
281a7dea167SDimitry Andric const Expr *ArgE,
282a7dea167SDimitry Andric unsigned IdxOfArg) const {
283a7dea167SDimitry Andric llvm::SmallString<256> SBuf;
284a7dea167SDimitry Andric llvm::raw_svector_ostream OS(SBuf);
285a7dea167SDimitry Andric OS << "Null pointer passed to "
286a7dea167SDimitry Andric << IdxOfArg << llvm::getOrdinalSuffix(IdxOfArg)
287a7dea167SDimitry Andric << " parameter expecting 'nonnull'";
288a7dea167SDimitry Andric
289a7dea167SDimitry Andric auto R =
290*647cbc5dSDimitry Andric std::make_unique<PathSensitiveBugReport>(BTAttrNonNull, SBuf, ErrorNode);
2910b57cec5SDimitry Andric if (ArgE)
2920b57cec5SDimitry Andric bugreporter::trackExpressionValue(ErrorNode, ArgE, *R);
2930b57cec5SDimitry Andric
2940b57cec5SDimitry Andric return R;
2950b57cec5SDimitry Andric }
2960b57cec5SDimitry Andric
297a7dea167SDimitry Andric std::unique_ptr<PathSensitiveBugReport>
genReportReferenceToNullPointer(const ExplodedNode * ErrorNode,const Expr * ArgE) const298a7dea167SDimitry Andric NonNullParamChecker::genReportReferenceToNullPointer(
2990b57cec5SDimitry Andric const ExplodedNode *ErrorNode, const Expr *ArgE) const {
300a7dea167SDimitry Andric auto R = std::make_unique<PathSensitiveBugReport>(
301*647cbc5dSDimitry Andric BTNullRefArg, "Forming reference to null pointer", ErrorNode);
3020b57cec5SDimitry Andric if (ArgE) {
3030b57cec5SDimitry Andric const Expr *ArgEDeref = bugreporter::getDerefExpr(ArgE);
3040b57cec5SDimitry Andric if (!ArgEDeref)
3050b57cec5SDimitry Andric ArgEDeref = ArgE;
3060b57cec5SDimitry Andric bugreporter::trackExpressionValue(ErrorNode, ArgEDeref, *R);
3070b57cec5SDimitry Andric }
3080b57cec5SDimitry Andric return R;
3090b57cec5SDimitry Andric }
3100b57cec5SDimitry Andric
registerNonNullParamChecker(CheckerManager & mgr)3110b57cec5SDimitry Andric void ento::registerNonNullParamChecker(CheckerManager &mgr) {
3120b57cec5SDimitry Andric mgr.registerChecker<NonNullParamChecker>();
3130b57cec5SDimitry Andric }
3140b57cec5SDimitry Andric
shouldRegisterNonNullParamChecker(const CheckerManager & mgr)3155ffd83dbSDimitry Andric bool ento::shouldRegisterNonNullParamChecker(const CheckerManager &mgr) {
3160b57cec5SDimitry Andric return true;
3170b57cec5SDimitry Andric }
318