xref: /llvm-project/clang/lib/StaticAnalyzer/Checkers/MallocChecker.cpp (revision 67291b90f9c811045a97eba72a0af75baa028aae)
1 //=== MallocChecker.cpp - A malloc/free checker -------------------*- C++ -*--//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines malloc/free checker, which checks for potential memory
11 // leaks, double free, and use-after-free problems.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "ClangSACheckers.h"
16 #include "InterCheckerAPI.h"
17 #include "clang/StaticAnalyzer/Core/Checker.h"
18 #include "clang/StaticAnalyzer/Core/CheckerManager.h"
19 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
20 #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
21 #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h"
22 #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState.h"
23 #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramStateTrait.h"
24 #include "clang/StaticAnalyzer/Core/PathSensitive/SymbolManager.h"
25 #include "clang/Basic/SourceManager.h"
26 #include "llvm/ADT/ImmutableMap.h"
27 #include "llvm/ADT/SmallString.h"
28 #include "llvm/ADT/STLExtras.h"
29 #include "llvm/ADT/StringExtras.h"
30 #include <climits>
31 
32 using namespace clang;
33 using namespace ento;
34 
35 namespace {
36 
37 class RefState {
38   enum Kind { // Reference to allocated memory.
39               Allocated,
40               // Reference to released/freed memory.
41               Released,
42               // The responsibility for freeing resources has transfered from
43               // this reference. A relinquished symbol should not be freed.
44               Relinquished } K;
45   const Stmt *S;
46 
47 public:
48   RefState(Kind k, const Stmt *s) : K(k), S(s) {}
49 
50   bool isAllocated() const { return K == Allocated; }
51   bool isReleased() const { return K == Released; }
52   bool isRelinquished() const { return K == Relinquished; }
53 
54   const Stmt *getStmt() const { return S; }
55 
56   bool operator==(const RefState &X) const {
57     return K == X.K && S == X.S;
58   }
59 
60   static RefState getAllocated(const Stmt *s) {
61     return RefState(Allocated, s);
62   }
63   static RefState getReleased(const Stmt *s) { return RefState(Released, s); }
64   static RefState getRelinquished(const Stmt *s) {
65     return RefState(Relinquished, s);
66   }
67 
68   void Profile(llvm::FoldingSetNodeID &ID) const {
69     ID.AddInteger(K);
70     ID.AddPointer(S);
71   }
72 };
73 
74 enum ReallocPairKind {
75   RPToBeFreedAfterFailure,
76   // The symbol has been freed when reallocation failed.
77   RPIsFreeOnFailure,
78   // The symbol does not need to be freed after reallocation fails.
79   RPDoNotTrackAfterFailure
80 };
81 
82 /// \class ReallocPair
83 /// \brief Stores information about the symbol being reallocated by a call to
84 /// 'realloc' to allow modeling failed reallocation later in the path.
85 struct ReallocPair {
86   // \brief The symbol which realloc reallocated.
87   SymbolRef ReallocatedSym;
88   ReallocPairKind Kind;
89 
90   ReallocPair(SymbolRef S, ReallocPairKind K) :
91     ReallocatedSym(S), Kind(K) {}
92   void Profile(llvm::FoldingSetNodeID &ID) const {
93     ID.AddInteger(Kind);
94     ID.AddPointer(ReallocatedSym);
95   }
96   bool operator==(const ReallocPair &X) const {
97     return ReallocatedSym == X.ReallocatedSym &&
98            Kind == X.Kind;
99   }
100 };
101 
102 typedef std::pair<const Stmt*, const MemRegion*> LeakInfo;
103 
104 class MallocChecker : public Checker<check::DeadSymbols,
105                                      check::EndPath,
106                                      check::PreStmt<ReturnStmt>,
107                                      check::PreStmt<CallExpr>,
108                                      check::PostStmt<CallExpr>,
109                                      check::PostStmt<BlockExpr>,
110                                      check::PostObjCMessage,
111                                      check::Location,
112                                      check::Bind,
113                                      eval::Assume,
114                                      check::RegionChanges>
115 {
116   mutable OwningPtr<BugType> BT_DoubleFree;
117   mutable OwningPtr<BugType> BT_Leak;
118   mutable OwningPtr<BugType> BT_UseFree;
119   mutable OwningPtr<BugType> BT_BadFree;
120   mutable IdentifierInfo *II_malloc, *II_free, *II_realloc, *II_calloc,
121                          *II_valloc, *II_reallocf, *II_strndup, *II_strdup;
122 
123 public:
124   MallocChecker() : II_malloc(0), II_free(0), II_realloc(0), II_calloc(0),
125                     II_valloc(0), II_reallocf(0), II_strndup(0), II_strdup(0) {}
126 
127   /// In pessimistic mode, the checker assumes that it does not know which
128   /// functions might free the memory.
129   struct ChecksFilter {
130     DefaultBool CMallocPessimistic;
131     DefaultBool CMallocOptimistic;
132   };
133 
134   ChecksFilter Filter;
135 
136   void checkPreStmt(const CallExpr *S, CheckerContext &C) const;
137   void checkPostStmt(const CallExpr *CE, CheckerContext &C) const;
138   void checkPostObjCMessage(const ObjCMethodCall &Call, CheckerContext &C) const;
139   void checkPostStmt(const BlockExpr *BE, CheckerContext &C) const;
140   void checkDeadSymbols(SymbolReaper &SymReaper, CheckerContext &C) const;
141   void checkEndPath(CheckerContext &C) const;
142   void checkPreStmt(const ReturnStmt *S, CheckerContext &C) const;
143   ProgramStateRef evalAssume(ProgramStateRef state, SVal Cond,
144                             bool Assumption) const;
145   void checkLocation(SVal l, bool isLoad, const Stmt *S,
146                      CheckerContext &C) const;
147   void checkBind(SVal location, SVal val, const Stmt*S,
148                  CheckerContext &C) const;
149   ProgramStateRef
150   checkRegionChanges(ProgramStateRef state,
151                      const StoreManager::InvalidatedSymbols *invalidated,
152                      ArrayRef<const MemRegion *> ExplicitRegions,
153                      ArrayRef<const MemRegion *> Regions,
154                      const CallEvent *Call) const;
155   bool wantsRegionChangeUpdate(ProgramStateRef state) const {
156     return true;
157   }
158 
159   void printState(raw_ostream &Out, ProgramStateRef State,
160                   const char *NL, const char *Sep) const;
161 
162 private:
163   void initIdentifierInfo(ASTContext &C) const;
164 
165   /// Check if this is one of the functions which can allocate/reallocate memory
166   /// pointed to by one of its arguments.
167   bool isMemFunction(const FunctionDecl *FD, ASTContext &C) const;
168   bool isFreeFunction(const FunctionDecl *FD, ASTContext &C) const;
169   bool isAllocationFunction(const FunctionDecl *FD, ASTContext &C) const;
170 
171   static ProgramStateRef MallocMemReturnsAttr(CheckerContext &C,
172                                               const CallExpr *CE,
173                                               const OwnershipAttr* Att);
174   static ProgramStateRef MallocMemAux(CheckerContext &C, const CallExpr *CE,
175                                      const Expr *SizeEx, SVal Init,
176                                      ProgramStateRef state) {
177     return MallocMemAux(C, CE,
178                         state->getSVal(SizeEx, C.getLocationContext()),
179                         Init, state);
180   }
181 
182   static ProgramStateRef MallocMemAux(CheckerContext &C, const CallExpr *CE,
183                                      SVal SizeEx, SVal Init,
184                                      ProgramStateRef state);
185 
186   /// Update the RefState to reflect the new memory allocation.
187   static ProgramStateRef MallocUpdateRefState(CheckerContext &C,
188                                               const CallExpr *CE,
189                                               ProgramStateRef state);
190 
191   ProgramStateRef FreeMemAttr(CheckerContext &C, const CallExpr *CE,
192                               const OwnershipAttr* Att) const;
193   ProgramStateRef FreeMemAux(CheckerContext &C, const CallExpr *CE,
194                              ProgramStateRef state, unsigned Num,
195                              bool Hold,
196                              bool &ReleasedAllocated,
197                              bool ReturnsNullOnFailure = false) const;
198   ProgramStateRef FreeMemAux(CheckerContext &C, const Expr *Arg,
199                              const Expr *ParentExpr,
200                              ProgramStateRef State,
201                              bool Hold,
202                              bool &ReleasedAllocated,
203                              bool ReturnsNullOnFailure = false) const;
204 
205   ProgramStateRef ReallocMem(CheckerContext &C, const CallExpr *CE,
206                              bool FreesMemOnFailure) const;
207   static ProgramStateRef CallocMem(CheckerContext &C, const CallExpr *CE);
208 
209   ///\brief Check if the memory associated with this symbol was released.
210   bool isReleased(SymbolRef Sym, CheckerContext &C) const;
211 
212   bool checkUseAfterFree(SymbolRef Sym, CheckerContext &C,
213                          const Stmt *S = 0) const;
214 
215   /// Check if the function is not known to us. So, for example, we could
216   /// conservatively assume it can free/reallocate it's pointer arguments.
217   bool doesNotFreeMemory(const CallEvent *Call,
218                          ProgramStateRef State) const;
219 
220   static bool SummarizeValue(raw_ostream &os, SVal V);
221   static bool SummarizeRegion(raw_ostream &os, const MemRegion *MR);
222   void ReportBadFree(CheckerContext &C, SVal ArgVal, SourceRange range) const;
223 
224   /// Find the location of the allocation for Sym on the path leading to the
225   /// exploded node N.
226   LeakInfo getAllocationSite(const ExplodedNode *N, SymbolRef Sym,
227                              CheckerContext &C) const;
228 
229   void reportLeak(SymbolRef Sym, ExplodedNode *N, CheckerContext &C) const;
230 
231   /// The bug visitor which allows us to print extra diagnostics along the
232   /// BugReport path. For example, showing the allocation site of the leaked
233   /// region.
234   class MallocBugVisitor : public BugReporterVisitorImpl<MallocBugVisitor> {
235   protected:
236     enum NotificationMode {
237       Normal,
238       ReallocationFailed
239     };
240 
241     // The allocated region symbol tracked by the main analysis.
242     SymbolRef Sym;
243 
244     // The mode we are in, i.e. what kind of diagnostics will be emitted.
245     NotificationMode Mode;
246 
247     // A symbol from when the primary region should have been reallocated.
248     SymbolRef FailedReallocSymbol;
249 
250     bool IsLeak;
251 
252   public:
253     MallocBugVisitor(SymbolRef S, bool isLeak = false)
254        : Sym(S), Mode(Normal), FailedReallocSymbol(0), IsLeak(isLeak) {}
255 
256     virtual ~MallocBugVisitor() {}
257 
258     void Profile(llvm::FoldingSetNodeID &ID) const {
259       static int X = 0;
260       ID.AddPointer(&X);
261       ID.AddPointer(Sym);
262     }
263 
264     inline bool isAllocated(const RefState *S, const RefState *SPrev,
265                             const Stmt *Stmt) {
266       // Did not track -> allocated. Other state (released) -> allocated.
267       return (Stmt && isa<CallExpr>(Stmt) &&
268               (S && S->isAllocated()) && (!SPrev || !SPrev->isAllocated()));
269     }
270 
271     inline bool isReleased(const RefState *S, const RefState *SPrev,
272                            const Stmt *Stmt) {
273       // Did not track -> released. Other state (allocated) -> released.
274       return (Stmt && isa<CallExpr>(Stmt) &&
275               (S && S->isReleased()) && (!SPrev || !SPrev->isReleased()));
276     }
277 
278     inline bool isRelinquished(const RefState *S, const RefState *SPrev,
279                                const Stmt *Stmt) {
280       // Did not track -> relinquished. Other state (allocated) -> relinquished.
281       return (Stmt && (isa<CallExpr>(Stmt) || isa<ObjCMessageExpr>(Stmt) ||
282                                               isa<ObjCPropertyRefExpr>(Stmt)) &&
283               (S && S->isRelinquished()) &&
284               (!SPrev || !SPrev->isRelinquished()));
285     }
286 
287     inline bool isReallocFailedCheck(const RefState *S, const RefState *SPrev,
288                                      const Stmt *Stmt) {
289       // If the expression is not a call, and the state change is
290       // released -> allocated, it must be the realloc return value
291       // check. If we have to handle more cases here, it might be cleaner just
292       // to track this extra bit in the state itself.
293       return ((!Stmt || !isa<CallExpr>(Stmt)) &&
294               (S && S->isAllocated()) && (SPrev && !SPrev->isAllocated()));
295     }
296 
297     PathDiagnosticPiece *VisitNode(const ExplodedNode *N,
298                                    const ExplodedNode *PrevN,
299                                    BugReporterContext &BRC,
300                                    BugReport &BR);
301 
302     PathDiagnosticPiece* getEndPath(BugReporterContext &BRC,
303                                     const ExplodedNode *EndPathNode,
304                                     BugReport &BR) {
305       if (!IsLeak)
306         return 0;
307 
308       PathDiagnosticLocation L =
309         PathDiagnosticLocation::createEndOfPath(EndPathNode,
310                                                 BRC.getSourceManager());
311       // Do not add the statement itself as a range in case of leak.
312       return new PathDiagnosticEventPiece(L, BR.getDescription(), false);
313     }
314 
315   private:
316     class StackHintGeneratorForReallocationFailed
317         : public StackHintGeneratorForSymbol {
318     public:
319       StackHintGeneratorForReallocationFailed(SymbolRef S, StringRef M)
320         : StackHintGeneratorForSymbol(S, M) {}
321 
322       virtual std::string getMessageForArg(const Expr *ArgE, unsigned ArgIndex) {
323         // Printed parameters start at 1, not 0.
324         ++ArgIndex;
325 
326         SmallString<200> buf;
327         llvm::raw_svector_ostream os(buf);
328 
329         os << "Reallocation of " << ArgIndex << llvm::getOrdinalSuffix(ArgIndex)
330            << " parameter failed";
331 
332         return os.str();
333       }
334 
335       virtual std::string getMessageForReturn(const CallExpr *CallExpr) {
336         return "Reallocation of returned value failed";
337       }
338     };
339   };
340 };
341 } // end anonymous namespace
342 
343 REGISTER_MAP_WITH_PROGRAMSTATE(RegionState, SymbolRef, RefState)
344 REGISTER_MAP_WITH_PROGRAMSTATE(ReallocPairs, SymbolRef, ReallocPair)
345 
346 // A map from the freed symbol to the symbol representing the return value of
347 // the free function.
348 REGISTER_MAP_WITH_PROGRAMSTATE(FreeReturnValue, SymbolRef, SymbolRef)
349 
350 namespace {
351 class StopTrackingCallback : public SymbolVisitor {
352   ProgramStateRef state;
353 public:
354   StopTrackingCallback(ProgramStateRef st) : state(st) {}
355   ProgramStateRef getState() const { return state; }
356 
357   bool VisitSymbol(SymbolRef sym) {
358     state = state->remove<RegionState>(sym);
359     return true;
360   }
361 };
362 } // end anonymous namespace
363 
364 void MallocChecker::initIdentifierInfo(ASTContext &Ctx) const {
365   if (II_malloc)
366     return;
367   II_malloc = &Ctx.Idents.get("malloc");
368   II_free = &Ctx.Idents.get("free");
369   II_realloc = &Ctx.Idents.get("realloc");
370   II_reallocf = &Ctx.Idents.get("reallocf");
371   II_calloc = &Ctx.Idents.get("calloc");
372   II_valloc = &Ctx.Idents.get("valloc");
373   II_strdup = &Ctx.Idents.get("strdup");
374   II_strndup = &Ctx.Idents.get("strndup");
375 }
376 
377 bool MallocChecker::isMemFunction(const FunctionDecl *FD, ASTContext &C) const {
378   if (isFreeFunction(FD, C))
379     return true;
380 
381   if (isAllocationFunction(FD, C))
382     return true;
383 
384   return false;
385 }
386 
387 bool MallocChecker::isAllocationFunction(const FunctionDecl *FD,
388                                          ASTContext &C) const {
389   if (!FD)
390     return false;
391 
392   if (FD->getKind() == Decl::Function) {
393     IdentifierInfo *FunI = FD->getIdentifier();
394     initIdentifierInfo(C);
395 
396     if (FunI == II_malloc || FunI == II_realloc ||
397         FunI == II_reallocf || FunI == II_calloc || FunI == II_valloc ||
398         FunI == II_strdup || FunI == II_strndup)
399       return true;
400   }
401 
402   if (Filter.CMallocOptimistic && FD->hasAttrs())
403     for (specific_attr_iterator<OwnershipAttr>
404            i = FD->specific_attr_begin<OwnershipAttr>(),
405            e = FD->specific_attr_end<OwnershipAttr>();
406            i != e; ++i)
407       if ((*i)->getOwnKind() == OwnershipAttr::Returns)
408         return true;
409   return false;
410 }
411 
412 bool MallocChecker::isFreeFunction(const FunctionDecl *FD, ASTContext &C) const {
413   if (!FD)
414     return false;
415 
416   if (FD->getKind() == Decl::Function) {
417     IdentifierInfo *FunI = FD->getIdentifier();
418     initIdentifierInfo(C);
419 
420     if (FunI == II_free || FunI == II_realloc || FunI == II_reallocf)
421       return true;
422   }
423 
424   if (Filter.CMallocOptimistic && FD->hasAttrs())
425     for (specific_attr_iterator<OwnershipAttr>
426            i = FD->specific_attr_begin<OwnershipAttr>(),
427            e = FD->specific_attr_end<OwnershipAttr>();
428            i != e; ++i)
429       if ((*i)->getOwnKind() == OwnershipAttr::Takes ||
430           (*i)->getOwnKind() == OwnershipAttr::Holds)
431         return true;
432   return false;
433 }
434 
435 void MallocChecker::checkPostStmt(const CallExpr *CE, CheckerContext &C) const {
436   if (C.wasInlined)
437     return;
438 
439   const FunctionDecl *FD = C.getCalleeDecl(CE);
440   if (!FD)
441     return;
442 
443   ProgramStateRef State = C.getState();
444   bool ReleasedAllocatedMemory = false;
445 
446   if (FD->getKind() == Decl::Function) {
447     initIdentifierInfo(C.getASTContext());
448     IdentifierInfo *FunI = FD->getIdentifier();
449 
450     if (FunI == II_malloc || FunI == II_valloc) {
451       if (CE->getNumArgs() < 1)
452         return;
453       State = MallocMemAux(C, CE, CE->getArg(0), UndefinedVal(), State);
454     } else if (FunI == II_realloc) {
455       State = ReallocMem(C, CE, false);
456     } else if (FunI == II_reallocf) {
457       State = ReallocMem(C, CE, true);
458     } else if (FunI == II_calloc) {
459       State = CallocMem(C, CE);
460     } else if (FunI == II_free) {
461       State = FreeMemAux(C, CE, State, 0, false, ReleasedAllocatedMemory);
462     } else if (FunI == II_strdup) {
463       State = MallocUpdateRefState(C, CE, State);
464     } else if (FunI == II_strndup) {
465       State = MallocUpdateRefState(C, CE, State);
466     }
467   }
468 
469   if (Filter.CMallocOptimistic) {
470     // Check all the attributes, if there are any.
471     // There can be multiple of these attributes.
472     if (FD->hasAttrs())
473       for (specific_attr_iterator<OwnershipAttr>
474           i = FD->specific_attr_begin<OwnershipAttr>(),
475           e = FD->specific_attr_end<OwnershipAttr>();
476           i != e; ++i) {
477         switch ((*i)->getOwnKind()) {
478         case OwnershipAttr::Returns:
479           State = MallocMemReturnsAttr(C, CE, *i);
480           break;
481         case OwnershipAttr::Takes:
482         case OwnershipAttr::Holds:
483           State = FreeMemAttr(C, CE, *i);
484           break;
485         }
486       }
487   }
488   C.addTransition(State);
489 }
490 
491 static bool isFreeWhenDoneSetToZero(const ObjCMethodCall &Call) {
492   Selector S = Call.getSelector();
493   for (unsigned i = 1; i < S.getNumArgs(); ++i)
494     if (S.getNameForSlot(i).equals("freeWhenDone"))
495       if (Call.getArgSVal(i).isConstant(0))
496         return true;
497 
498   return false;
499 }
500 
501 void MallocChecker::checkPostObjCMessage(const ObjCMethodCall &Call,
502                                          CheckerContext &C) const {
503   // If the first selector is dataWithBytesNoCopy, assume that the memory will
504   // be released with 'free' by the new object.
505   // Ex:  [NSData dataWithBytesNoCopy:bytes length:10];
506   // Unless 'freeWhenDone' param set to 0.
507   // TODO: Check that the memory was allocated with malloc.
508   bool ReleasedAllocatedMemory = false;
509   Selector S = Call.getSelector();
510   if ((S.getNameForSlot(0) == "dataWithBytesNoCopy" ||
511        S.getNameForSlot(0) == "initWithBytesNoCopy" ||
512        S.getNameForSlot(0) == "initWithCharactersNoCopy") &&
513       !isFreeWhenDoneSetToZero(Call)){
514     unsigned int argIdx  = 0;
515     ProgramStateRef State = FreeMemAux(C, Call.getArgExpr(argIdx),
516                                        Call.getOriginExpr(), C.getState(), true,
517                                        ReleasedAllocatedMemory,
518                                        /* RetNullOnFailure*/ true);
519 
520     C.addTransition(State);
521   }
522 }
523 
524 ProgramStateRef MallocChecker::MallocMemReturnsAttr(CheckerContext &C,
525                                                     const CallExpr *CE,
526                                                     const OwnershipAttr* Att) {
527   if (Att->getModule() != "malloc")
528     return 0;
529 
530   OwnershipAttr::args_iterator I = Att->args_begin(), E = Att->args_end();
531   if (I != E) {
532     return MallocMemAux(C, CE, CE->getArg(*I), UndefinedVal(), C.getState());
533   }
534   return MallocMemAux(C, CE, UnknownVal(), UndefinedVal(), C.getState());
535 }
536 
537 ProgramStateRef MallocChecker::MallocMemAux(CheckerContext &C,
538                                            const CallExpr *CE,
539                                            SVal Size, SVal Init,
540                                            ProgramStateRef state) {
541 
542   // Bind the return value to the symbolic value from the heap region.
543   // TODO: We could rewrite post visit to eval call; 'malloc' does not have
544   // side effects other than what we model here.
545   unsigned Count = C.blockCount();
546   SValBuilder &svalBuilder = C.getSValBuilder();
547   const LocationContext *LCtx = C.getPredecessor()->getLocationContext();
548   DefinedSVal RetVal =
549     cast<DefinedSVal>(svalBuilder.getConjuredHeapSymbolVal(CE, LCtx, Count));
550   state = state->BindExpr(CE, C.getLocationContext(), RetVal);
551 
552   // We expect the malloc functions to return a pointer.
553   if (!isa<Loc>(RetVal))
554     return 0;
555 
556   // Fill the region with the initialization value.
557   state = state->bindDefault(RetVal, Init);
558 
559   // Set the region's extent equal to the Size parameter.
560   const SymbolicRegion *R =
561       dyn_cast_or_null<SymbolicRegion>(RetVal.getAsRegion());
562   if (!R)
563     return 0;
564   if (isa<DefinedOrUnknownSVal>(Size)) {
565     SValBuilder &svalBuilder = C.getSValBuilder();
566     DefinedOrUnknownSVal Extent = R->getExtent(svalBuilder);
567     DefinedOrUnknownSVal DefinedSize = cast<DefinedOrUnknownSVal>(Size);
568     DefinedOrUnknownSVal extentMatchesSize =
569         svalBuilder.evalEQ(state, Extent, DefinedSize);
570 
571     state = state->assume(extentMatchesSize, true);
572     assert(state);
573   }
574 
575   return MallocUpdateRefState(C, CE, state);
576 }
577 
578 ProgramStateRef MallocChecker::MallocUpdateRefState(CheckerContext &C,
579                                                     const CallExpr *CE,
580                                                     ProgramStateRef state) {
581   // Get the return value.
582   SVal retVal = state->getSVal(CE, C.getLocationContext());
583 
584   // We expect the malloc functions to return a pointer.
585   if (!isa<Loc>(retVal))
586     return 0;
587 
588   SymbolRef Sym = retVal.getAsLocSymbol();
589   assert(Sym);
590 
591   // Set the symbol's state to Allocated.
592   return state->set<RegionState>(Sym, RefState::getAllocated(CE));
593 
594 }
595 
596 ProgramStateRef MallocChecker::FreeMemAttr(CheckerContext &C,
597                                            const CallExpr *CE,
598                                            const OwnershipAttr* Att) const {
599   if (Att->getModule() != "malloc")
600     return 0;
601 
602   ProgramStateRef State = C.getState();
603   bool ReleasedAllocated = false;
604 
605   for (OwnershipAttr::args_iterator I = Att->args_begin(), E = Att->args_end();
606        I != E; ++I) {
607     ProgramStateRef StateI = FreeMemAux(C, CE, State, *I,
608                                Att->getOwnKind() == OwnershipAttr::Holds,
609                                ReleasedAllocated);
610     if (StateI)
611       State = StateI;
612   }
613   return State;
614 }
615 
616 ProgramStateRef MallocChecker::FreeMemAux(CheckerContext &C,
617                                           const CallExpr *CE,
618                                           ProgramStateRef state,
619                                           unsigned Num,
620                                           bool Hold,
621                                           bool &ReleasedAllocated,
622                                           bool ReturnsNullOnFailure) const {
623   if (CE->getNumArgs() < (Num + 1))
624     return 0;
625 
626   return FreeMemAux(C, CE->getArg(Num), CE, state, Hold,
627                     ReleasedAllocated, ReturnsNullOnFailure);
628 }
629 
630 /// Check if the previous call to free on the given symbol failed.
631 ///
632 /// For example, if free failed, returns true. In addition, cleans out the
633 /// state from the corresponding failure info. Retuns the cleaned out state
634 /// and the corresponding return value symbol.
635 static std::pair<bool, ProgramStateRef>
636 checkAndCleanFreeFailedInfo(ProgramStateRef State,
637                             SymbolRef Sym, const SymbolRef *Ret) {
638   Ret = State->get<FreeReturnValue>(Sym);
639   if (Ret) {
640     assert(*Ret && "We should not store the null return symbol");
641     ConstraintManager &CMgr = State->getConstraintManager();
642     ConditionTruthVal FreeFailed = CMgr.isNull(State, *Ret);
643     State = State->remove<FreeReturnValue>(Sym);
644     return std::pair<bool, ProgramStateRef>(FreeFailed.isConstrainedTrue(),
645                                             State);
646   }
647   return std::pair<bool, ProgramStateRef>(false, State);
648 }
649 
650 ProgramStateRef MallocChecker::FreeMemAux(CheckerContext &C,
651                                           const Expr *ArgExpr,
652                                           const Expr *ParentExpr,
653                                           ProgramStateRef State,
654                                           bool Hold,
655                                           bool &ReleasedAllocated,
656                                           bool ReturnsNullOnFailure) const {
657 
658   SVal ArgVal = State->getSVal(ArgExpr, C.getLocationContext());
659   if (!isa<DefinedOrUnknownSVal>(ArgVal))
660     return 0;
661   DefinedOrUnknownSVal location = cast<DefinedOrUnknownSVal>(ArgVal);
662 
663   // Check for null dereferences.
664   if (!isa<Loc>(location))
665     return 0;
666 
667   // The explicit NULL case, no operation is performed.
668   ProgramStateRef notNullState, nullState;
669   llvm::tie(notNullState, nullState) = State->assume(location);
670   if (nullState && !notNullState)
671     return 0;
672 
673   // Unknown values could easily be okay
674   // Undefined values are handled elsewhere
675   if (ArgVal.isUnknownOrUndef())
676     return 0;
677 
678   const MemRegion *R = ArgVal.getAsRegion();
679 
680   // Nonlocs can't be freed, of course.
681   // Non-region locations (labels and fixed addresses) also shouldn't be freed.
682   if (!R) {
683     ReportBadFree(C, ArgVal, ArgExpr->getSourceRange());
684     return 0;
685   }
686 
687   R = R->StripCasts();
688 
689   // Blocks might show up as heap data, but should not be free()d
690   if (isa<BlockDataRegion>(R)) {
691     ReportBadFree(C, ArgVal, ArgExpr->getSourceRange());
692     return 0;
693   }
694 
695   const MemSpaceRegion *MS = R->getMemorySpace();
696 
697   // Parameters, locals, statics, and globals shouldn't be freed.
698   if (!(isa<UnknownSpaceRegion>(MS) || isa<HeapSpaceRegion>(MS))) {
699     // FIXME: at the time this code was written, malloc() regions were
700     // represented by conjured symbols, which are all in UnknownSpaceRegion.
701     // This means that there isn't actually anything from HeapSpaceRegion
702     // that should be freed, even though we allow it here.
703     // Of course, free() can work on memory allocated outside the current
704     // function, so UnknownSpaceRegion is always a possibility.
705     // False negatives are better than false positives.
706 
707     ReportBadFree(C, ArgVal, ArgExpr->getSourceRange());
708     return 0;
709   }
710 
711   const SymbolicRegion *SR = dyn_cast<SymbolicRegion>(R);
712   // Various cases could lead to non-symbol values here.
713   // For now, ignore them.
714   if (!SR)
715     return 0;
716 
717   SymbolRef Sym = SR->getSymbol();
718   const RefState *RS = State->get<RegionState>(Sym);
719   bool FailedToFree = false;
720   const SymbolRef *RetStatusSymbolPtr = 0;
721   llvm::tie(FailedToFree, State) =
722       checkAndCleanFreeFailedInfo(State, Sym, RetStatusSymbolPtr);
723 
724   // Check double free.
725   if (RS &&
726       (RS->isReleased() || RS->isRelinquished()) &&
727       !FailedToFree) {
728 
729     if (ExplodedNode *N = C.generateSink()) {
730       if (!BT_DoubleFree)
731         BT_DoubleFree.reset(
732           new BugType("Double free", "Memory Error"));
733       BugReport *R = new BugReport(*BT_DoubleFree,
734         (RS->isReleased() ? "Attempt to free released memory" :
735                             "Attempt to free non-owned memory"), N);
736       R->addRange(ArgExpr->getSourceRange());
737       R->markInteresting(Sym);
738       if (RetStatusSymbolPtr)
739         R->markInteresting(*RetStatusSymbolPtr);
740       R->addVisitor(new MallocBugVisitor(Sym));
741       C.emitReport(R);
742     }
743     return 0;
744   }
745 
746   ReleasedAllocated = (RS != 0);
747 
748   // Keep track of the return value. If it is NULL, we will know that free
749   // failed.
750   if (ReturnsNullOnFailure) {
751     SVal RetVal = C.getSVal(ParentExpr);
752     SymbolRef RetStatusSymbol = RetVal.getAsSymbol();
753     if (RetStatusSymbol) {
754       C.getSymbolManager().addSymbolDependency(Sym, RetStatusSymbol);
755       State = State->set<FreeReturnValue>(Sym, RetStatusSymbol);
756     }
757   }
758 
759   // Normal free.
760   if (Hold)
761     return State->set<RegionState>(Sym, RefState::getRelinquished(ParentExpr));
762   return State->set<RegionState>(Sym, RefState::getReleased(ParentExpr));
763 }
764 
765 bool MallocChecker::SummarizeValue(raw_ostream &os, SVal V) {
766   if (nonloc::ConcreteInt *IntVal = dyn_cast<nonloc::ConcreteInt>(&V))
767     os << "an integer (" << IntVal->getValue() << ")";
768   else if (loc::ConcreteInt *ConstAddr = dyn_cast<loc::ConcreteInt>(&V))
769     os << "a constant address (" << ConstAddr->getValue() << ")";
770   else if (loc::GotoLabel *Label = dyn_cast<loc::GotoLabel>(&V))
771     os << "the address of the label '" << Label->getLabel()->getName() << "'";
772   else
773     return false;
774 
775   return true;
776 }
777 
778 bool MallocChecker::SummarizeRegion(raw_ostream &os,
779                                     const MemRegion *MR) {
780   switch (MR->getKind()) {
781   case MemRegion::FunctionTextRegionKind: {
782     const NamedDecl *FD = cast<FunctionTextRegion>(MR)->getDecl();
783     if (FD)
784       os << "the address of the function '" << *FD << '\'';
785     else
786       os << "the address of a function";
787     return true;
788   }
789   case MemRegion::BlockTextRegionKind:
790     os << "block text";
791     return true;
792   case MemRegion::BlockDataRegionKind:
793     // FIXME: where the block came from?
794     os << "a block";
795     return true;
796   default: {
797     const MemSpaceRegion *MS = MR->getMemorySpace();
798 
799     if (isa<StackLocalsSpaceRegion>(MS)) {
800       const VarRegion *VR = dyn_cast<VarRegion>(MR);
801       const VarDecl *VD;
802       if (VR)
803         VD = VR->getDecl();
804       else
805         VD = NULL;
806 
807       if (VD)
808         os << "the address of the local variable '" << VD->getName() << "'";
809       else
810         os << "the address of a local stack variable";
811       return true;
812     }
813 
814     if (isa<StackArgumentsSpaceRegion>(MS)) {
815       const VarRegion *VR = dyn_cast<VarRegion>(MR);
816       const VarDecl *VD;
817       if (VR)
818         VD = VR->getDecl();
819       else
820         VD = NULL;
821 
822       if (VD)
823         os << "the address of the parameter '" << VD->getName() << "'";
824       else
825         os << "the address of a parameter";
826       return true;
827     }
828 
829     if (isa<GlobalsSpaceRegion>(MS)) {
830       const VarRegion *VR = dyn_cast<VarRegion>(MR);
831       const VarDecl *VD;
832       if (VR)
833         VD = VR->getDecl();
834       else
835         VD = NULL;
836 
837       if (VD) {
838         if (VD->isStaticLocal())
839           os << "the address of the static variable '" << VD->getName() << "'";
840         else
841           os << "the address of the global variable '" << VD->getName() << "'";
842       } else
843         os << "the address of a global variable";
844       return true;
845     }
846 
847     return false;
848   }
849   }
850 }
851 
852 void MallocChecker::ReportBadFree(CheckerContext &C, SVal ArgVal,
853                                   SourceRange range) const {
854   if (ExplodedNode *N = C.generateSink()) {
855     if (!BT_BadFree)
856       BT_BadFree.reset(new BugType("Bad free", "Memory Error"));
857 
858     SmallString<100> buf;
859     llvm::raw_svector_ostream os(buf);
860 
861     const MemRegion *MR = ArgVal.getAsRegion();
862     if (MR) {
863       while (const ElementRegion *ER = dyn_cast<ElementRegion>(MR))
864         MR = ER->getSuperRegion();
865 
866       // Special case for alloca()
867       if (isa<AllocaRegion>(MR))
868         os << "Argument to free() was allocated by alloca(), not malloc()";
869       else {
870         os << "Argument to free() is ";
871         if (SummarizeRegion(os, MR))
872           os << ", which is not memory allocated by malloc()";
873         else
874           os << "not memory allocated by malloc()";
875       }
876     } else {
877       os << "Argument to free() is ";
878       if (SummarizeValue(os, ArgVal))
879         os << ", which is not memory allocated by malloc()";
880       else
881         os << "not memory allocated by malloc()";
882     }
883 
884     BugReport *R = new BugReport(*BT_BadFree, os.str(), N);
885     R->markInteresting(MR);
886     R->addRange(range);
887     C.emitReport(R);
888   }
889 }
890 
891 ProgramStateRef MallocChecker::ReallocMem(CheckerContext &C,
892                                           const CallExpr *CE,
893                                           bool FreesOnFail) const {
894   if (CE->getNumArgs() < 2)
895     return 0;
896 
897   ProgramStateRef state = C.getState();
898   const Expr *arg0Expr = CE->getArg(0);
899   const LocationContext *LCtx = C.getLocationContext();
900   SVal Arg0Val = state->getSVal(arg0Expr, LCtx);
901   if (!isa<DefinedOrUnknownSVal>(Arg0Val))
902     return 0;
903   DefinedOrUnknownSVal arg0Val = cast<DefinedOrUnknownSVal>(Arg0Val);
904 
905   SValBuilder &svalBuilder = C.getSValBuilder();
906 
907   DefinedOrUnknownSVal PtrEQ =
908     svalBuilder.evalEQ(state, arg0Val, svalBuilder.makeNull());
909 
910   // Get the size argument. If there is no size arg then give up.
911   const Expr *Arg1 = CE->getArg(1);
912   if (!Arg1)
913     return 0;
914 
915   // Get the value of the size argument.
916   SVal Arg1ValG = state->getSVal(Arg1, LCtx);
917   if (!isa<DefinedOrUnknownSVal>(Arg1ValG))
918     return 0;
919   DefinedOrUnknownSVal Arg1Val = cast<DefinedOrUnknownSVal>(Arg1ValG);
920 
921   // Compare the size argument to 0.
922   DefinedOrUnknownSVal SizeZero =
923     svalBuilder.evalEQ(state, Arg1Val,
924                        svalBuilder.makeIntValWithPtrWidth(0, false));
925 
926   ProgramStateRef StatePtrIsNull, StatePtrNotNull;
927   llvm::tie(StatePtrIsNull, StatePtrNotNull) = state->assume(PtrEQ);
928   ProgramStateRef StateSizeIsZero, StateSizeNotZero;
929   llvm::tie(StateSizeIsZero, StateSizeNotZero) = state->assume(SizeZero);
930   // We only assume exceptional states if they are definitely true; if the
931   // state is under-constrained, assume regular realloc behavior.
932   bool PrtIsNull = StatePtrIsNull && !StatePtrNotNull;
933   bool SizeIsZero = StateSizeIsZero && !StateSizeNotZero;
934 
935   // If the ptr is NULL and the size is not 0, the call is equivalent to
936   // malloc(size).
937   if ( PrtIsNull && !SizeIsZero) {
938     ProgramStateRef stateMalloc = MallocMemAux(C, CE, CE->getArg(1),
939                                                UndefinedVal(), StatePtrIsNull);
940     return stateMalloc;
941   }
942 
943   if (PrtIsNull && SizeIsZero)
944     return 0;
945 
946   // Get the from and to pointer symbols as in toPtr = realloc(fromPtr, size).
947   assert(!PrtIsNull);
948   SymbolRef FromPtr = arg0Val.getAsSymbol();
949   SVal RetVal = state->getSVal(CE, LCtx);
950   SymbolRef ToPtr = RetVal.getAsSymbol();
951   if (!FromPtr || !ToPtr)
952     return 0;
953 
954   bool ReleasedAllocated = false;
955 
956   // If the size is 0, free the memory.
957   if (SizeIsZero)
958     if (ProgramStateRef stateFree = FreeMemAux(C, CE, StateSizeIsZero, 0,
959                                                false, ReleasedAllocated)){
960       // The semantics of the return value are:
961       // If size was equal to 0, either NULL or a pointer suitable to be passed
962       // to free() is returned. We just free the input pointer and do not add
963       // any constrains on the output pointer.
964       return stateFree;
965     }
966 
967   // Default behavior.
968   if (ProgramStateRef stateFree =
969         FreeMemAux(C, CE, state, 0, false, ReleasedAllocated)) {
970 
971     ProgramStateRef stateRealloc = MallocMemAux(C, CE, CE->getArg(1),
972                                                 UnknownVal(), stateFree);
973     if (!stateRealloc)
974       return 0;
975 
976     ReallocPairKind Kind = RPToBeFreedAfterFailure;
977     if (FreesOnFail)
978       Kind = RPIsFreeOnFailure;
979     else if (!ReleasedAllocated)
980       Kind = RPDoNotTrackAfterFailure;
981 
982     // Record the info about the reallocated symbol so that we could properly
983     // process failed reallocation.
984     stateRealloc = stateRealloc->set<ReallocPairs>(ToPtr,
985                                                    ReallocPair(FromPtr, Kind));
986     // The reallocated symbol should stay alive for as long as the new symbol.
987     C.getSymbolManager().addSymbolDependency(ToPtr, FromPtr);
988     return stateRealloc;
989   }
990   return 0;
991 }
992 
993 ProgramStateRef MallocChecker::CallocMem(CheckerContext &C, const CallExpr *CE){
994   if (CE->getNumArgs() < 2)
995     return 0;
996 
997   ProgramStateRef state = C.getState();
998   SValBuilder &svalBuilder = C.getSValBuilder();
999   const LocationContext *LCtx = C.getLocationContext();
1000   SVal count = state->getSVal(CE->getArg(0), LCtx);
1001   SVal elementSize = state->getSVal(CE->getArg(1), LCtx);
1002   SVal TotalSize = svalBuilder.evalBinOp(state, BO_Mul, count, elementSize,
1003                                         svalBuilder.getContext().getSizeType());
1004   SVal zeroVal = svalBuilder.makeZeroVal(svalBuilder.getContext().CharTy);
1005 
1006   return MallocMemAux(C, CE, TotalSize, zeroVal, state);
1007 }
1008 
1009 LeakInfo
1010 MallocChecker::getAllocationSite(const ExplodedNode *N, SymbolRef Sym,
1011                                  CheckerContext &C) const {
1012   const LocationContext *LeakContext = N->getLocationContext();
1013   // Walk the ExplodedGraph backwards and find the first node that referred to
1014   // the tracked symbol.
1015   const ExplodedNode *AllocNode = N;
1016   const MemRegion *ReferenceRegion = 0;
1017 
1018   while (N) {
1019     ProgramStateRef State = N->getState();
1020     if (!State->get<RegionState>(Sym))
1021       break;
1022 
1023     // Find the most recent expression bound to the symbol in the current
1024     // context.
1025     if (!ReferenceRegion) {
1026       if (const MemRegion *MR = C.getLocationRegionIfPostStore(N)) {
1027         SVal Val = State->getSVal(MR);
1028         if (Val.getAsLocSymbol() == Sym)
1029           ReferenceRegion = MR;
1030       }
1031     }
1032 
1033     // Allocation node, is the last node in the current context in which the
1034     // symbol was tracked.
1035     if (N->getLocationContext() == LeakContext)
1036       AllocNode = N;
1037     N = N->pred_empty() ? NULL : *(N->pred_begin());
1038   }
1039 
1040   ProgramPoint P = AllocNode->getLocation();
1041   const Stmt *AllocationStmt = 0;
1042   if (CallExitEnd *Exit = dyn_cast<CallExitEnd>(&P))
1043     AllocationStmt = Exit->getCalleeContext()->getCallSite();
1044   else if (StmtPoint *SP = dyn_cast<StmtPoint>(&P))
1045     AllocationStmt = SP->getStmt();
1046 
1047   return LeakInfo(AllocationStmt, ReferenceRegion);
1048 }
1049 
1050 void MallocChecker::reportLeak(SymbolRef Sym, ExplodedNode *N,
1051                                CheckerContext &C) const {
1052   assert(N);
1053   if (!BT_Leak) {
1054     BT_Leak.reset(new BugType("Memory leak", "Memory Error"));
1055     // Leaks should not be reported if they are post-dominated by a sink:
1056     // (1) Sinks are higher importance bugs.
1057     // (2) NoReturnFunctionChecker uses sink nodes to represent paths ending
1058     //     with __noreturn functions such as assert() or exit(). We choose not
1059     //     to report leaks on such paths.
1060     BT_Leak->setSuppressOnSink(true);
1061   }
1062 
1063   // Most bug reports are cached at the location where they occurred.
1064   // With leaks, we want to unique them by the location where they were
1065   // allocated, and only report a single path.
1066   PathDiagnosticLocation LocUsedForUniqueing;
1067   const Stmt *AllocStmt = 0;
1068   const MemRegion *Region = 0;
1069   llvm::tie(AllocStmt, Region) = getAllocationSite(N, Sym, C);
1070   if (AllocStmt)
1071     LocUsedForUniqueing = PathDiagnosticLocation::createBegin(AllocStmt,
1072                             C.getSourceManager(), N->getLocationContext());
1073 
1074   SmallString<200> buf;
1075   llvm::raw_svector_ostream os(buf);
1076   os << "Memory is never released; potential leak";
1077   if (Region && Region->canPrintPretty()) {
1078     os << " of memory pointed to by '";
1079     Region->printPretty(os);
1080     os << '\'';
1081   }
1082 
1083   BugReport *R = new BugReport(*BT_Leak, os.str(), N, LocUsedForUniqueing);
1084   R->markInteresting(Sym);
1085   R->addVisitor(new MallocBugVisitor(Sym, true));
1086   C.emitReport(R);
1087 }
1088 
1089 void MallocChecker::checkDeadSymbols(SymbolReaper &SymReaper,
1090                                      CheckerContext &C) const
1091 {
1092   if (!SymReaper.hasDeadSymbols())
1093     return;
1094 
1095   ProgramStateRef state = C.getState();
1096   RegionStateTy RS = state->get<RegionState>();
1097   RegionStateTy::Factory &F = state->get_context<RegionState>();
1098 
1099   llvm::SmallVector<SymbolRef, 2> Errors;
1100   for (RegionStateTy::iterator I = RS.begin(), E = RS.end(); I != E; ++I) {
1101     if (SymReaper.isDead(I->first)) {
1102       if (I->second.isAllocated())
1103         Errors.push_back(I->first);
1104       // Remove the dead symbol from the map.
1105       RS = F.remove(RS, I->first);
1106 
1107     }
1108   }
1109 
1110   // Cleanup the Realloc Pairs Map.
1111   ReallocPairsTy RP = state->get<ReallocPairs>();
1112   for (ReallocPairsTy::iterator I = RP.begin(), E = RP.end(); I != E; ++I) {
1113     if (SymReaper.isDead(I->first) ||
1114         SymReaper.isDead(I->second.ReallocatedSym)) {
1115       state = state->remove<ReallocPairs>(I->first);
1116     }
1117   }
1118 
1119   // Cleanup the FreeReturnValue Map.
1120   FreeReturnValueTy FR = state->get<FreeReturnValue>();
1121   for (FreeReturnValueTy::iterator I = FR.begin(), E = FR.end(); I != E; ++I) {
1122     if (SymReaper.isDead(I->first) ||
1123         SymReaper.isDead(I->second)) {
1124       state = state->remove<FreeReturnValue>(I->first);
1125     }
1126   }
1127 
1128   // Generate leak node.
1129   ExplodedNode *N = C.getPredecessor();
1130   if (!Errors.empty()) {
1131     static SimpleProgramPointTag Tag("MallocChecker : DeadSymbolsLeak");
1132     N = C.addTransition(C.getState(), C.getPredecessor(), &Tag);
1133     for (llvm::SmallVector<SymbolRef, 2>::iterator
1134         I = Errors.begin(), E = Errors.end(); I != E; ++I) {
1135       reportLeak(*I, N, C);
1136     }
1137   }
1138 
1139   C.addTransition(state->set<RegionState>(RS), N);
1140 }
1141 
1142 void MallocChecker::checkEndPath(CheckerContext &C) const {
1143   ProgramStateRef state = C.getState();
1144   RegionStateTy M = state->get<RegionState>();
1145 
1146   // If inside inlined call, skip it.
1147   if (C.getLocationContext()->getParent() != 0)
1148     return;
1149 
1150   for (RegionStateTy::iterator I = M.begin(), E = M.end(); I != E; ++I) {
1151     RefState RS = I->second;
1152     if (RS.isAllocated()) {
1153       ExplodedNode *N = C.addTransition(state);
1154       if (N)
1155         reportLeak(I->first, N, C);
1156     }
1157   }
1158 }
1159 
1160 void MallocChecker::checkPreStmt(const CallExpr *CE, CheckerContext &C) const {
1161   // We will check for double free in the post visit.
1162   if (isFreeFunction(C.getCalleeDecl(CE), C.getASTContext()))
1163     return;
1164 
1165   // Check use after free, when a freed pointer is passed to a call.
1166   ProgramStateRef State = C.getState();
1167   for (CallExpr::const_arg_iterator I = CE->arg_begin(),
1168                                     E = CE->arg_end(); I != E; ++I) {
1169     const Expr *A = *I;
1170     if (A->getType().getTypePtr()->isAnyPointerType()) {
1171       SymbolRef Sym = State->getSVal(A, C.getLocationContext()).getAsSymbol();
1172       if (!Sym)
1173         continue;
1174       if (checkUseAfterFree(Sym, C, A))
1175         return;
1176     }
1177   }
1178 }
1179 
1180 void MallocChecker::checkPreStmt(const ReturnStmt *S, CheckerContext &C) const {
1181   const Expr *E = S->getRetValue();
1182   if (!E)
1183     return;
1184 
1185   // Check if we are returning a symbol.
1186   ProgramStateRef State = C.getState();
1187   SVal RetVal = State->getSVal(E, C.getLocationContext());
1188   SymbolRef Sym = RetVal.getAsSymbol();
1189   if (!Sym)
1190     // If we are returning a field of the allocated struct or an array element,
1191     // the callee could still free the memory.
1192     // TODO: This logic should be a part of generic symbol escape callback.
1193     if (const MemRegion *MR = RetVal.getAsRegion())
1194       if (isa<FieldRegion>(MR) || isa<ElementRegion>(MR))
1195         if (const SymbolicRegion *BMR =
1196               dyn_cast<SymbolicRegion>(MR->getBaseRegion()))
1197           Sym = BMR->getSymbol();
1198 
1199   // Check if we are returning freed memory.
1200   if (Sym)
1201     if (checkUseAfterFree(Sym, C, E))
1202       return;
1203 
1204   // If this function body is not inlined, stop tracking any returned symbols.
1205   if (C.getLocationContext()->getParent() == 0) {
1206     State =
1207       State->scanReachableSymbols<StopTrackingCallback>(RetVal).getState();
1208     C.addTransition(State);
1209   }
1210 }
1211 
1212 // TODO: Blocks should be either inlined or should call invalidate regions
1213 // upon invocation. After that's in place, special casing here will not be
1214 // needed.
1215 void MallocChecker::checkPostStmt(const BlockExpr *BE,
1216                                   CheckerContext &C) const {
1217 
1218   // Scan the BlockDecRefExprs for any object the retain count checker
1219   // may be tracking.
1220   if (!BE->getBlockDecl()->hasCaptures())
1221     return;
1222 
1223   ProgramStateRef state = C.getState();
1224   const BlockDataRegion *R =
1225     cast<BlockDataRegion>(state->getSVal(BE,
1226                                          C.getLocationContext()).getAsRegion());
1227 
1228   BlockDataRegion::referenced_vars_iterator I = R->referenced_vars_begin(),
1229                                             E = R->referenced_vars_end();
1230 
1231   if (I == E)
1232     return;
1233 
1234   SmallVector<const MemRegion*, 10> Regions;
1235   const LocationContext *LC = C.getLocationContext();
1236   MemRegionManager &MemMgr = C.getSValBuilder().getRegionManager();
1237 
1238   for ( ; I != E; ++I) {
1239     const VarRegion *VR = *I;
1240     if (VR->getSuperRegion() == R) {
1241       VR = MemMgr.getVarRegion(VR->getDecl(), LC);
1242     }
1243     Regions.push_back(VR);
1244   }
1245 
1246   state =
1247     state->scanReachableSymbols<StopTrackingCallback>(Regions.data(),
1248                                     Regions.data() + Regions.size()).getState();
1249   C.addTransition(state);
1250 }
1251 
1252 bool MallocChecker::isReleased(SymbolRef Sym, CheckerContext &C) const {
1253   assert(Sym);
1254   const RefState *RS = C.getState()->get<RegionState>(Sym);
1255   return (RS && RS->isReleased());
1256 }
1257 
1258 bool MallocChecker::checkUseAfterFree(SymbolRef Sym, CheckerContext &C,
1259                                       const Stmt *S) const {
1260   if (isReleased(Sym, C)) {
1261     if (ExplodedNode *N = C.generateSink()) {
1262       if (!BT_UseFree)
1263         BT_UseFree.reset(new BugType("Use-after-free", "Memory Error"));
1264 
1265       BugReport *R = new BugReport(*BT_UseFree,
1266                                    "Use of memory after it is freed",N);
1267       if (S)
1268         R->addRange(S->getSourceRange());
1269       R->markInteresting(Sym);
1270       R->addVisitor(new MallocBugVisitor(Sym));
1271       C.emitReport(R);
1272       return true;
1273     }
1274   }
1275   return false;
1276 }
1277 
1278 // Check if the location is a freed symbolic region.
1279 void MallocChecker::checkLocation(SVal l, bool isLoad, const Stmt *S,
1280                                   CheckerContext &C) const {
1281   SymbolRef Sym = l.getLocSymbolInBase();
1282   if (Sym)
1283     checkUseAfterFree(Sym, C, S);
1284 }
1285 
1286 //===----------------------------------------------------------------------===//
1287 // Check various ways a symbol can be invalidated.
1288 // TODO: This logic (the next 3 functions) is copied/similar to the
1289 // RetainRelease checker. We might want to factor this out.
1290 //===----------------------------------------------------------------------===//
1291 
1292 // Stop tracking symbols when a value escapes as a result of checkBind.
1293 // A value escapes in three possible cases:
1294 // (1) we are binding to something that is not a memory region.
1295 // (2) we are binding to a memregion that does not have stack storage
1296 // (3) we are binding to a memregion with stack storage that the store
1297 //     does not understand.
1298 void MallocChecker::checkBind(SVal loc, SVal val, const Stmt *S,
1299                               CheckerContext &C) const {
1300   // Are we storing to something that causes the value to "escape"?
1301   bool escapes = true;
1302   ProgramStateRef state = C.getState();
1303 
1304   if (loc::MemRegionVal *regionLoc = dyn_cast<loc::MemRegionVal>(&loc)) {
1305     escapes = !regionLoc->getRegion()->hasStackStorage();
1306 
1307     if (!escapes) {
1308       // To test (3), generate a new state with the binding added.  If it is
1309       // the same state, then it escapes (since the store cannot represent
1310       // the binding).
1311       // Do this only if we know that the store is not supposed to generate the
1312       // same state.
1313       SVal StoredVal = state->getSVal(regionLoc->getRegion());
1314       if (StoredVal != val)
1315         escapes = (state == (state->bindLoc(*regionLoc, val)));
1316     }
1317   }
1318 
1319   // If our store can represent the binding and we aren't storing to something
1320   // that doesn't have local storage then just return and have the simulation
1321   // state continue as is.
1322   if (!escapes)
1323       return;
1324 
1325   // Otherwise, find all symbols referenced by 'val' that we are tracking
1326   // and stop tracking them.
1327   state = state->scanReachableSymbols<StopTrackingCallback>(val).getState();
1328   C.addTransition(state);
1329 }
1330 
1331 // If a symbolic region is assumed to NULL (or another constant), stop tracking
1332 // it - assuming that allocation failed on this path.
1333 ProgramStateRef MallocChecker::evalAssume(ProgramStateRef state,
1334                                               SVal Cond,
1335                                               bool Assumption) const {
1336   RegionStateTy RS = state->get<RegionState>();
1337   for (RegionStateTy::iterator I = RS.begin(), E = RS.end(); I != E; ++I) {
1338     // If the symbol is assumed to be NULL, remove it from consideration.
1339     ConstraintManager &CMgr = state->getConstraintManager();
1340     ConditionTruthVal AllocFailed = CMgr.isNull(state, I.getKey());
1341     if (AllocFailed.isConstrainedTrue())
1342       state = state->remove<RegionState>(I.getKey());
1343   }
1344 
1345   // Realloc returns 0 when reallocation fails, which means that we should
1346   // restore the state of the pointer being reallocated.
1347   ReallocPairsTy RP = state->get<ReallocPairs>();
1348   for (ReallocPairsTy::iterator I = RP.begin(), E = RP.end(); I != E; ++I) {
1349     // If the symbol is assumed to be NULL, remove it from consideration.
1350     ConstraintManager &CMgr = state->getConstraintManager();
1351     ConditionTruthVal AllocFailed = CMgr.isNull(state, I.getKey());
1352     if (!AllocFailed.isConstrainedTrue())
1353       continue;
1354 
1355     SymbolRef ReallocSym = I.getData().ReallocatedSym;
1356     if (const RefState *RS = state->get<RegionState>(ReallocSym)) {
1357       if (RS->isReleased()) {
1358         if (I.getData().Kind == RPToBeFreedAfterFailure)
1359           state = state->set<RegionState>(ReallocSym,
1360               RefState::getAllocated(RS->getStmt()));
1361         else if (I.getData().Kind == RPDoNotTrackAfterFailure)
1362           state = state->remove<RegionState>(ReallocSym);
1363         else
1364           assert(I.getData().Kind == RPIsFreeOnFailure);
1365       }
1366     }
1367     state = state->remove<ReallocPairs>(I.getKey());
1368   }
1369 
1370   return state;
1371 }
1372 
1373 // Check if the function is known to us. So, for example, we could
1374 // conservatively assume it can free/reallocate its pointer arguments.
1375 // (We assume that the pointers cannot escape through calls to system
1376 // functions not handled by this checker.)
1377 bool MallocChecker::doesNotFreeMemory(const CallEvent *Call,
1378                                       ProgramStateRef State) const {
1379   assert(Call);
1380 
1381   // For now, assume that any C++ call can free memory.
1382   // TODO: If we want to be more optimistic here, we'll need to make sure that
1383   // regions escape to C++ containers. They seem to do that even now, but for
1384   // mysterious reasons.
1385   if (!(isa<FunctionCall>(Call) || isa<ObjCMethodCall>(Call)))
1386     return false;
1387 
1388   // Check Objective-C messages by selector name.
1389   if (const ObjCMethodCall *Msg = dyn_cast<ObjCMethodCall>(Call)) {
1390     // If it's not a framework call, or if it takes a callback, assume it
1391     // can free memory.
1392     if (!Call->isInSystemHeader() || Call->hasNonZeroCallbackArg())
1393       return false;
1394 
1395     Selector S = Msg->getSelector();
1396 
1397     // Whitelist the ObjC methods which do free memory.
1398     // - Anything containing 'freeWhenDone' param set to 1.
1399     //   Ex: dataWithBytesNoCopy:length:freeWhenDone.
1400     for (unsigned i = 1; i < S.getNumArgs(); ++i) {
1401       if (S.getNameForSlot(i).equals("freeWhenDone")) {
1402         if (Call->getArgSVal(i).isConstant(1))
1403           return false;
1404         else
1405           return true;
1406       }
1407     }
1408 
1409     // If the first selector ends with NoCopy, assume that the ownership is
1410     // transferred as well.
1411     // Ex:  [NSData dataWithBytesNoCopy:bytes length:10];
1412     StringRef FirstSlot = S.getNameForSlot(0);
1413     if (FirstSlot.endswith("NoCopy"))
1414       return false;
1415 
1416     // If the first selector starts with addPointer, insertPointer,
1417     // or replacePointer, assume we are dealing with NSPointerArray or similar.
1418     // This is similar to C++ containers (vector); we still might want to check
1419     // that the pointers get freed by following the container itself.
1420     if (FirstSlot.startswith("addPointer") ||
1421         FirstSlot.startswith("insertPointer") ||
1422         FirstSlot.startswith("replacePointer")) {
1423       return false;
1424     }
1425 
1426     // Otherwise, assume that the method does not free memory.
1427     // Most framework methods do not free memory.
1428     return true;
1429   }
1430 
1431   // At this point the only thing left to handle is straight function calls.
1432   const FunctionDecl *FD = cast<FunctionCall>(Call)->getDecl();
1433   if (!FD)
1434     return false;
1435 
1436   ASTContext &ASTC = State->getStateManager().getContext();
1437 
1438   // If it's one of the allocation functions we can reason about, we model
1439   // its behavior explicitly.
1440   if (isMemFunction(FD, ASTC))
1441     return true;
1442 
1443   // If it's not a system call, assume it frees memory.
1444   if (!Call->isInSystemHeader())
1445     return false;
1446 
1447   // White list the system functions whose arguments escape.
1448   const IdentifierInfo *II = FD->getIdentifier();
1449   if (!II)
1450     return false;
1451   StringRef FName = II->getName();
1452 
1453   // White list the 'XXXNoCopy' CoreFoundation functions.
1454   // We specifically check these before
1455   if (FName.endswith("NoCopy")) {
1456     // Look for the deallocator argument. We know that the memory ownership
1457     // is not transferred only if the deallocator argument is
1458     // 'kCFAllocatorNull'.
1459     for (unsigned i = 1; i < Call->getNumArgs(); ++i) {
1460       const Expr *ArgE = Call->getArgExpr(i)->IgnoreParenCasts();
1461       if (const DeclRefExpr *DE = dyn_cast<DeclRefExpr>(ArgE)) {
1462         StringRef DeallocatorName = DE->getFoundDecl()->getName();
1463         if (DeallocatorName == "kCFAllocatorNull")
1464           return true;
1465       }
1466     }
1467     return false;
1468   }
1469 
1470   // Associating streams with malloced buffers. The pointer can escape if
1471   // 'closefn' is specified (and if that function does free memory),
1472   // but it will not if closefn is not specified.
1473   // Currently, we do not inspect the 'closefn' function (PR12101).
1474   if (FName == "funopen")
1475     if (Call->getNumArgs() >= 4 && Call->getArgSVal(4).isConstant(0))
1476       return true;
1477 
1478   // Do not warn on pointers passed to 'setbuf' when used with std streams,
1479   // these leaks might be intentional when setting the buffer for stdio.
1480   // http://stackoverflow.com/questions/2671151/who-frees-setvbuf-buffer
1481   if (FName == "setbuf" || FName =="setbuffer" ||
1482       FName == "setlinebuf" || FName == "setvbuf") {
1483     if (Call->getNumArgs() >= 1) {
1484       const Expr *ArgE = Call->getArgExpr(0)->IgnoreParenCasts();
1485       if (const DeclRefExpr *ArgDRE = dyn_cast<DeclRefExpr>(ArgE))
1486         if (const VarDecl *D = dyn_cast<VarDecl>(ArgDRE->getDecl()))
1487           if (D->getCanonicalDecl()->getName().find("std") != StringRef::npos)
1488             return false;
1489     }
1490   }
1491 
1492   // A bunch of other functions which either take ownership of a pointer or
1493   // wrap the result up in a struct or object, meaning it can be freed later.
1494   // (See RetainCountChecker.) Not all the parameters here are invalidated,
1495   // but the Malloc checker cannot differentiate between them. The right way
1496   // of doing this would be to implement a pointer escapes callback.
1497   if (FName == "CGBitmapContextCreate" ||
1498       FName == "CGBitmapContextCreateWithData" ||
1499       FName == "CVPixelBufferCreateWithBytes" ||
1500       FName == "CVPixelBufferCreateWithPlanarBytes" ||
1501       FName == "OSAtomicEnqueue") {
1502     return false;
1503   }
1504 
1505   // Handle cases where we know a buffer's /address/ can escape.
1506   // Note that the above checks handle some special cases where we know that
1507   // even though the address escapes, it's still our responsibility to free the
1508   // buffer.
1509   if (Call->argumentsMayEscape())
1510     return false;
1511 
1512   // Otherwise, assume that the function does not free memory.
1513   // Most system calls do not free the memory.
1514   return true;
1515 }
1516 
1517 // If the symbol we are tracking is invalidated, but not explicitly (ex: the &p
1518 // escapes, when we are tracking p), do not track the symbol as we cannot reason
1519 // about it anymore.
1520 ProgramStateRef
1521 MallocChecker::checkRegionChanges(ProgramStateRef State,
1522                             const StoreManager::InvalidatedSymbols *invalidated,
1523                                     ArrayRef<const MemRegion *> ExplicitRegions,
1524                                     ArrayRef<const MemRegion *> Regions,
1525                                     const CallEvent *Call) const {
1526   if (!invalidated || invalidated->empty())
1527     return State;
1528   llvm::SmallPtrSet<SymbolRef, 8> WhitelistedSymbols;
1529 
1530   // If it's a call which might free or reallocate memory, we assume that all
1531   // regions (explicit and implicit) escaped.
1532 
1533   // Otherwise, whitelist explicit pointers; we still can track them.
1534   if (!Call || doesNotFreeMemory(Call, State)) {
1535     for (ArrayRef<const MemRegion *>::iterator I = ExplicitRegions.begin(),
1536         E = ExplicitRegions.end(); I != E; ++I) {
1537       if (const SymbolicRegion *R = (*I)->StripCasts()->getAs<SymbolicRegion>())
1538         WhitelistedSymbols.insert(R->getSymbol());
1539     }
1540   }
1541 
1542   for (StoreManager::InvalidatedSymbols::const_iterator I=invalidated->begin(),
1543        E = invalidated->end(); I!=E; ++I) {
1544     SymbolRef sym = *I;
1545     if (WhitelistedSymbols.count(sym))
1546       continue;
1547     // The symbol escaped. Note, we assume that if the symbol is released,
1548     // passing it out will result in a use after free. We also keep tracking
1549     // relinquished symbols.
1550     if (const RefState *RS = State->get<RegionState>(sym)) {
1551       if (RS->isAllocated())
1552         State = State->remove<RegionState>(sym);
1553     }
1554   }
1555   return State;
1556 }
1557 
1558 static SymbolRef findFailedReallocSymbol(ProgramStateRef currState,
1559                                          ProgramStateRef prevState) {
1560   ReallocPairsTy currMap = currState->get<ReallocPairs>();
1561   ReallocPairsTy prevMap = prevState->get<ReallocPairs>();
1562 
1563   for (ReallocPairsTy::iterator I = prevMap.begin(), E = prevMap.end();
1564        I != E; ++I) {
1565     SymbolRef sym = I.getKey();
1566     if (!currMap.lookup(sym))
1567       return sym;
1568   }
1569 
1570   return NULL;
1571 }
1572 
1573 PathDiagnosticPiece *
1574 MallocChecker::MallocBugVisitor::VisitNode(const ExplodedNode *N,
1575                                            const ExplodedNode *PrevN,
1576                                            BugReporterContext &BRC,
1577                                            BugReport &BR) {
1578   ProgramStateRef state = N->getState();
1579   ProgramStateRef statePrev = PrevN->getState();
1580 
1581   const RefState *RS = state->get<RegionState>(Sym);
1582   const RefState *RSPrev = statePrev->get<RegionState>(Sym);
1583   if (!RS)
1584     return 0;
1585 
1586   const Stmt *S = 0;
1587   const char *Msg = 0;
1588   StackHintGeneratorForSymbol *StackHint = 0;
1589 
1590   // Retrieve the associated statement.
1591   ProgramPoint ProgLoc = N->getLocation();
1592   if (StmtPoint *SP = dyn_cast<StmtPoint>(&ProgLoc))
1593     S = SP->getStmt();
1594   else if (CallExitEnd *Exit = dyn_cast<CallExitEnd>(&ProgLoc))
1595     S = Exit->getCalleeContext()->getCallSite();
1596   // If an assumption was made on a branch, it should be caught
1597   // here by looking at the state transition.
1598   else if (BlockEdge *Edge = dyn_cast<BlockEdge>(&ProgLoc)) {
1599     const CFGBlock *srcBlk = Edge->getSrc();
1600     S = srcBlk->getTerminator();
1601   }
1602   if (!S)
1603     return 0;
1604 
1605   // FIXME: We will eventually need to handle non-statement-based events
1606   // (__attribute__((cleanup))).
1607 
1608   // Find out if this is an interesting point and what is the kind.
1609   if (Mode == Normal) {
1610     if (isAllocated(RS, RSPrev, S)) {
1611       Msg = "Memory is allocated";
1612       StackHint = new StackHintGeneratorForSymbol(Sym,
1613                                                   "Returned allocated memory");
1614     } else if (isReleased(RS, RSPrev, S)) {
1615       Msg = "Memory is released";
1616       StackHint = new StackHintGeneratorForSymbol(Sym,
1617                                                   "Returned released memory");
1618     } else if (isRelinquished(RS, RSPrev, S)) {
1619       Msg = "Memory ownership is transfered";
1620       StackHint = new StackHintGeneratorForSymbol(Sym, "");
1621     } else if (isReallocFailedCheck(RS, RSPrev, S)) {
1622       Mode = ReallocationFailed;
1623       Msg = "Reallocation failed";
1624       StackHint = new StackHintGeneratorForReallocationFailed(Sym,
1625                                                        "Reallocation failed");
1626 
1627       if (SymbolRef sym = findFailedReallocSymbol(state, statePrev)) {
1628         // Is it possible to fail two reallocs WITHOUT testing in between?
1629         assert((!FailedReallocSymbol || FailedReallocSymbol == sym) &&
1630           "We only support one failed realloc at a time.");
1631         BR.markInteresting(sym);
1632         FailedReallocSymbol = sym;
1633       }
1634     }
1635 
1636   // We are in a special mode if a reallocation failed later in the path.
1637   } else if (Mode == ReallocationFailed) {
1638     assert(FailedReallocSymbol && "No symbol to look for.");
1639 
1640     // Is this is the first appearance of the reallocated symbol?
1641     if (!statePrev->get<RegionState>(FailedReallocSymbol)) {
1642       // We're at the reallocation point.
1643       Msg = "Attempt to reallocate memory";
1644       StackHint = new StackHintGeneratorForSymbol(Sym,
1645                                                  "Returned reallocated memory");
1646       FailedReallocSymbol = NULL;
1647       Mode = Normal;
1648     }
1649   }
1650 
1651   if (!Msg)
1652     return 0;
1653   assert(StackHint);
1654 
1655   // Generate the extra diagnostic.
1656   PathDiagnosticLocation Pos(S, BRC.getSourceManager(),
1657                              N->getLocationContext());
1658   return new PathDiagnosticEventPiece(Pos, Msg, true, StackHint);
1659 }
1660 
1661 void MallocChecker::printState(raw_ostream &Out, ProgramStateRef State,
1662                                const char *NL, const char *Sep) const {
1663 
1664   RegionStateTy RS = State->get<RegionState>();
1665 
1666   if (!RS.isEmpty())
1667     Out << "Has Malloc data" << NL;
1668 }
1669 
1670 #define REGISTER_CHECKER(name) \
1671 void ento::register##name(CheckerManager &mgr) {\
1672   registerCStringCheckerBasic(mgr); \
1673   mgr.registerChecker<MallocChecker>()->Filter.C##name = true;\
1674 }
1675 
1676 REGISTER_CHECKER(MallocPessimistic)
1677 REGISTER_CHECKER(MallocOptimistic)
1678