1 //===----- UninitializedObjectChecker.cpp ------------------------*- C++ -*-==//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines a checker that reports uninitialized fields in objects
11 // created after a constructor call.
12 //
13 // This checker has several options:
14 //   - "Pedantic" (boolean). If its not set or is set to false, the checker
15 //     won't emit warnings for objects that don't have at least one initialized
16 //     field. This may be set with
17 //
18 //     `-analyzer-config alpha.cplusplus.UninitializedObject:Pedantic=true`.
19 //
20 //   - "NotesAsWarnings" (boolean). If set to true, the checker will emit a
21 //     warning for each uninitalized field, as opposed to emitting one warning
22 //     per constructor call, and listing the uninitialized fields that belongs
23 //     to it in notes. Defaults to false.
24 //
25 //     `-analyzer-config \
26 //         alpha.cplusplus.UninitializedObject:NotesAsWarnings=true`.
27 //
28 //   - "CheckPointeeInitialization" (boolean). If set to false, the checker will
29 //     not analyze the pointee of pointer/reference fields, and will only check
30 //     whether the object itself is initialized. Defaults to false.
31 //
32 //     `-analyzer-config \
33 //         alpha.cplusplus.UninitializedObject:CheckPointeeInitialization=true`.
34 //
35 //     TODO: With some clever heuristics, some pointers should be dereferenced
36 //     by default. For example, if the pointee is constructed within the
37 //     constructor call, it's reasonable to say that no external object
38 //     references it, and we wouldn't generate multiple report on the same
39 //     pointee.
40 //
41 // To read about how the checker works, refer to the comments in
42 // UninitializedObject.h.
43 //
44 // Some of the logic is implemented in UninitializedPointee.cpp, to reduce the
45 // complexity of this file.
46 //
47 //===----------------------------------------------------------------------===//
48 
49 #include "ClangSACheckers.h"
50 #include "UninitializedObject.h"
51 #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
52 #include "clang/StaticAnalyzer/Core/Checker.h"
53 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
54 #include "clang/StaticAnalyzer/Core/PathSensitive/DynamicTypeMap.h"
55 
56 using namespace clang;
57 using namespace clang::ento;
58 
59 namespace {
60 
61 class UninitializedObjectChecker : public Checker<check::EndFunction> {
62   std::unique_ptr<BuiltinBug> BT_uninitField;
63 
64 public:
65   // These fields will be initialized when registering the checker.
66   bool IsPedantic;
67   bool ShouldConvertNotesToWarnings;
68   bool CheckPointeeInitialization;
69 
70   UninitializedObjectChecker()
71       : BT_uninitField(new BuiltinBug(this, "Uninitialized fields")) {}
72   void checkEndFunction(const ReturnStmt *RS, CheckerContext &C) const;
73 };
74 
75 /// A basic field type, that is not a pointer or a reference, it's dynamic and
76 /// static type is the same.
77 class RegularField : public FieldNode {
78 public:
79   RegularField(const FieldRegion *FR) : FieldNode(FR) {}
80 
81   virtual void printNoteMsg(llvm::raw_ostream &Out) const override {
82     Out << "uninitialized field ";
83   }
84 
85   virtual void printPrefix(llvm::raw_ostream &Out) const override {}
86 
87   virtual void printNode(llvm::raw_ostream &Out) const {
88     Out << getVariableName(getDecl());
89   }
90 
91   virtual void printSeparator(llvm::raw_ostream &Out) const override {
92     Out << '.';
93   }
94 };
95 
96 } // end of anonymous namespace
97 
98 // Utility function declarations.
99 
100 /// Returns the object that was constructed by CtorDecl, or None if that isn't
101 /// possible.
102 // TODO: Refactor this function so that it returns the constructed object's
103 // region.
104 static Optional<nonloc::LazyCompoundVal>
105 getObjectVal(const CXXConstructorDecl *CtorDecl, CheckerContext &Context);
106 
107 /// Checks whether the object constructed by \p Ctor will be analyzed later
108 /// (e.g. if the object is a field of another object, in which case we'd check
109 /// it multiple times).
110 static bool willObjectBeAnalyzedLater(const CXXConstructorDecl *Ctor,
111                                       CheckerContext &Context);
112 
113 //===----------------------------------------------------------------------===//
114 //                  Methods for UninitializedObjectChecker.
115 //===----------------------------------------------------------------------===//
116 
117 void UninitializedObjectChecker::checkEndFunction(
118     const ReturnStmt *RS, CheckerContext &Context) const {
119 
120   const auto *CtorDecl = dyn_cast_or_null<CXXConstructorDecl>(
121       Context.getLocationContext()->getDecl());
122   if (!CtorDecl)
123     return;
124 
125   if (!CtorDecl->isUserProvided())
126     return;
127 
128   if (CtorDecl->getParent()->isUnion())
129     return;
130 
131   // This avoids essentially the same error being reported multiple times.
132   if (willObjectBeAnalyzedLater(CtorDecl, Context))
133     return;
134 
135   Optional<nonloc::LazyCompoundVal> Object = getObjectVal(CtorDecl, Context);
136   if (!Object)
137     return;
138 
139   FindUninitializedFields F(Context.getState(), Object->getRegion(), IsPedantic,
140                             CheckPointeeInitialization);
141 
142   const UninitFieldMap &UninitFields = F.getUninitFields();
143 
144   if (UninitFields.empty())
145     return;
146 
147   // There are uninitialized fields in the record.
148 
149   ExplodedNode *Node = Context.generateNonFatalErrorNode(Context.getState());
150   if (!Node)
151     return;
152 
153   PathDiagnosticLocation LocUsedForUniqueing;
154   const Stmt *CallSite = Context.getStackFrame()->getCallSite();
155   if (CallSite)
156     LocUsedForUniqueing = PathDiagnosticLocation::createBegin(
157         CallSite, Context.getSourceManager(), Node->getLocationContext());
158 
159   // For Plist consumers that don't support notes just yet, we'll convert notes
160   // to warnings.
161   if (ShouldConvertNotesToWarnings) {
162     for (const auto &Pair : UninitFields) {
163 
164       auto Report = llvm::make_unique<BugReport>(
165           *BT_uninitField, Pair.second, Node, LocUsedForUniqueing,
166           Node->getLocationContext()->getDecl());
167       Context.emitReport(std::move(Report));
168     }
169     return;
170   }
171 
172   SmallString<100> WarningBuf;
173   llvm::raw_svector_ostream WarningOS(WarningBuf);
174   WarningOS << UninitFields.size() << " uninitialized field"
175             << (UninitFields.size() == 1 ? "" : "s")
176             << " at the end of the constructor call";
177 
178   auto Report = llvm::make_unique<BugReport>(
179       *BT_uninitField, WarningOS.str(), Node, LocUsedForUniqueing,
180       Node->getLocationContext()->getDecl());
181 
182   for (const auto &Pair : UninitFields) {
183     Report->addNote(Pair.second,
184                     PathDiagnosticLocation::create(Pair.first->getDecl(),
185                                                    Context.getSourceManager()));
186   }
187   Context.emitReport(std::move(Report));
188 }
189 
190 //===----------------------------------------------------------------------===//
191 //                   Methods for FindUninitializedFields.
192 //===----------------------------------------------------------------------===//
193 
194 FindUninitializedFields::FindUninitializedFields(
195     ProgramStateRef State, const TypedValueRegion *const R, bool IsPedantic,
196     bool CheckPointeeInitialization)
197     : State(State), ObjectR(R), IsPedantic(IsPedantic),
198       CheckPointeeInitialization(CheckPointeeInitialization) {}
199 
200 const UninitFieldMap &FindUninitializedFields::getUninitFields() {
201   isNonUnionUninit(ObjectR, FieldChainInfo(ChainFactory));
202 
203   if (!IsPedantic && !IsAnyFieldInitialized)
204     UninitFields.clear();
205 
206   return UninitFields;
207 }
208 
209 bool FindUninitializedFields::addFieldToUninits(FieldChainInfo Chain) {
210   if (State->getStateManager().getContext().getSourceManager().isInSystemHeader(
211           Chain.getUninitRegion()->getDecl()->getLocation()))
212     return false;
213 
214   UninitFieldMap::mapped_type NoteMsgBuf;
215   llvm::raw_svector_ostream OS(NoteMsgBuf);
216   Chain.printNoteMsg(OS);
217   return UninitFields
218       .insert(std::make_pair(Chain.getUninitRegion(), std::move(NoteMsgBuf)))
219       .second;
220 }
221 
222 bool FindUninitializedFields::isNonUnionUninit(const TypedValueRegion *R,
223                                                FieldChainInfo LocalChain) {
224   assert(R->getValueType()->isRecordType() &&
225          !R->getValueType()->isUnionType() &&
226          "This method only checks non-union record objects!");
227 
228   const RecordDecl *RD =
229       R->getValueType()->getAs<RecordType>()->getDecl()->getDefinition();
230   assert(RD && "Referred record has no definition");
231 
232   bool ContainsUninitField = false;
233 
234   // Are all of this non-union's fields initialized?
235   for (const FieldDecl *I : RD->fields()) {
236 
237     const auto FieldVal =
238         State->getLValue(I, loc::MemRegionVal(R)).castAs<loc::MemRegionVal>();
239     const auto *FR = FieldVal.getRegionAs<FieldRegion>();
240     QualType T = I->getType();
241 
242     // If LocalChain already contains FR, then we encountered a cyclic
243     // reference. In this case, region FR is already under checking at an
244     // earlier node in the directed tree.
245     if (LocalChain.contains(FR))
246       return false;
247 
248     if (T->isStructureOrClassType()) {
249       if (isNonUnionUninit(FR, LocalChain.add(RegularField(FR))))
250         ContainsUninitField = true;
251       continue;
252     }
253 
254     if (T->isUnionType()) {
255       if (isUnionUninit(FR)) {
256         if (addFieldToUninits(LocalChain.add(RegularField(FR))))
257           ContainsUninitField = true;
258       } else
259         IsAnyFieldInitialized = true;
260       continue;
261     }
262 
263     if (T->isArrayType()) {
264       IsAnyFieldInitialized = true;
265       continue;
266     }
267 
268     if (T->isPointerType() || T->isReferenceType() || T->isBlockPointerType()) {
269       if (isPointerOrReferenceUninit(FR, LocalChain))
270         ContainsUninitField = true;
271       continue;
272     }
273 
274     if (isPrimitiveType(T)) {
275       SVal V = State->getSVal(FieldVal);
276 
277       if (isPrimitiveUninit(V)) {
278         if (addFieldToUninits(LocalChain.add(RegularField(FR))))
279           ContainsUninitField = true;
280       }
281       continue;
282     }
283 
284     llvm_unreachable("All cases are handled!");
285   }
286 
287   // Checking bases.
288   // FIXME: As of now, because of `willObjectBeAnalyzedLater`, objects whose
289   // type is a descendant of another type will emit warnings for uninitalized
290   // inherited members.
291   // This is not the only way to analyze bases of an object -- if we didn't
292   // filter them out, and didn't analyze the bases, this checker would run for
293   // each base of the object in order of base initailization and in theory would
294   // find every uninitalized field. This approach could also make handling
295   // diamond inheritances more easily.
296   //
297   // This rule (that a descendant type's cunstructor is responsible for
298   // initializing inherited data members) is not obvious, and should it should
299   // be.
300   const auto *CXXRD = dyn_cast<CXXRecordDecl>(RD);
301   if (!CXXRD)
302     return ContainsUninitField;
303 
304   for (const CXXBaseSpecifier &BaseSpec : CXXRD->bases()) {
305     const auto *BaseRegion = State->getLValue(BaseSpec, R)
306                                  .castAs<loc::MemRegionVal>()
307                                  .getRegionAs<TypedValueRegion>();
308 
309     if (isNonUnionUninit(BaseRegion, LocalChain))
310       ContainsUninitField = true;
311   }
312 
313   return ContainsUninitField;
314 }
315 
316 bool FindUninitializedFields::isUnionUninit(const TypedValueRegion *R) {
317   assert(R->getValueType()->isUnionType() &&
318          "This method only checks union objects!");
319   // TODO: Implement support for union fields.
320   return false;
321 }
322 
323 bool FindUninitializedFields::isPrimitiveUninit(const SVal &V) {
324   if (V.isUndef())
325     return true;
326 
327   IsAnyFieldInitialized = true;
328   return false;
329 }
330 
331 //===----------------------------------------------------------------------===//
332 //                       Methods for FieldChainInfo.
333 //===----------------------------------------------------------------------===//
334 
335 const FieldRegion *FieldChainInfo::getUninitRegion() const {
336   assert(!Chain.isEmpty() && "Empty fieldchain!");
337   return (*Chain.begin()).getRegion();
338 }
339 
340 bool FieldChainInfo::contains(const FieldRegion *FR) const {
341   for (const FieldNode &Node : Chain) {
342     if (Node.isSameRegion(FR))
343       return true;
344   }
345   return false;
346 }
347 
348 /// Prints every element except the last to `Out`. Since ImmutableLists store
349 /// elements in reverse order, and have no reverse iterators, we use a
350 /// recursive function to print the fieldchain correctly. The last element in
351 /// the chain is to be printed by `print`.
352 static void printTail(llvm::raw_ostream &Out,
353                       const FieldChainInfo::FieldChainImpl *L);
354 
355 // TODO: This function constructs an incorrect string if a void pointer is a
356 // part of the chain:
357 //
358 //   struct B { int x; }
359 //
360 //   struct A {
361 //     void *vptr;
362 //     A(void* vptr) : vptr(vptr) {}
363 //   };
364 //
365 //   void f() {
366 //     B b;
367 //     A a(&b);
368 //   }
369 //
370 // The note message will be "uninitialized field 'this->vptr->x'", even though
371 // void pointers can't be dereferenced. This should be changed to "uninitialized
372 // field 'static_cast<B*>(this->vptr)->x'".
373 //
374 // TODO: This function constructs an incorrect fieldchain string in the
375 // following case:
376 //
377 //   struct Base { int x; };
378 //   struct D1 : Base {}; struct D2 : Base {};
379 //
380 //   struct MostDerived : D1, D2 {
381 //     MostDerived() {}
382 //   }
383 //
384 // A call to MostDerived::MostDerived() will cause two notes that say
385 // "uninitialized field 'this->x'", but we can't refer to 'x' directly,
386 // we need an explicit namespace resolution whether the uninit field was
387 // 'D1::x' or 'D2::x'.
388 void FieldChainInfo::printNoteMsg(llvm::raw_ostream &Out) const {
389   if (Chain.isEmpty())
390     return;
391 
392   const FieldChainImpl *L = Chain.getInternalPointer();
393   const FieldNode &LastField = L->getHead();
394 
395   LastField.printNoteMsg(Out);
396   Out << '\'';
397 
398   for (const FieldNode &Node : Chain)
399     Node.printPrefix(Out);
400 
401   Out << "this->";
402   printTail(Out, L->getTail());
403   LastField.printNode(Out);
404   Out << '\'';
405 }
406 
407 static void printTail(llvm::raw_ostream &Out,
408                       const FieldChainInfo::FieldChainImpl *L) {
409   if (!L)
410     return;
411 
412   printTail(Out, L->getTail());
413 
414   L->getHead().printNode(Out);
415   L->getHead().printSeparator(Out);
416 }
417 
418 //===----------------------------------------------------------------------===//
419 //                           Utility functions.
420 //===----------------------------------------------------------------------===//
421 
422 static Optional<nonloc::LazyCompoundVal>
423 getObjectVal(const CXXConstructorDecl *CtorDecl, CheckerContext &Context) {
424 
425   Loc ThisLoc = Context.getSValBuilder().getCXXThis(CtorDecl->getParent(),
426                                                     Context.getStackFrame());
427   // Getting the value for 'this'.
428   SVal This = Context.getState()->getSVal(ThisLoc);
429 
430   // Getting the value for '*this'.
431   SVal Object = Context.getState()->getSVal(This.castAs<Loc>());
432 
433   return Object.getAs<nonloc::LazyCompoundVal>();
434 }
435 
436 static bool willObjectBeAnalyzedLater(const CXXConstructorDecl *Ctor,
437                                       CheckerContext &Context) {
438 
439   Optional<nonloc::LazyCompoundVal> CurrentObject = getObjectVal(Ctor, Context);
440   if (!CurrentObject)
441     return false;
442 
443   const LocationContext *LC = Context.getLocationContext();
444   while ((LC = LC->getParent())) {
445 
446     // If \p Ctor was called by another constructor.
447     const auto *OtherCtor = dyn_cast<CXXConstructorDecl>(LC->getDecl());
448     if (!OtherCtor)
449       continue;
450 
451     Optional<nonloc::LazyCompoundVal> OtherObject =
452         getObjectVal(OtherCtor, Context);
453     if (!OtherObject)
454       continue;
455 
456     // If the CurrentObject is a subregion of OtherObject, it will be analyzed
457     // during the analysis of OtherObject.
458     if (CurrentObject->getRegion()->isSubRegionOf(OtherObject->getRegion()))
459       return true;
460   }
461 
462   return false;
463 }
464 
465 StringRef clang::ento::getVariableName(const FieldDecl *Field) {
466   // If Field is a captured lambda variable, Field->getName() will return with
467   // an empty string. We can however acquire it's name from the lambda's
468   // captures.
469   const auto *CXXParent = dyn_cast<CXXRecordDecl>(Field->getParent());
470 
471   if (CXXParent && CXXParent->isLambda()) {
472     assert(CXXParent->captures_begin());
473     auto It = CXXParent->captures_begin() + Field->getFieldIndex();
474     return It->getCapturedVar()->getName();
475   }
476 
477   return Field->getName();
478 }
479 
480 void ento::registerUninitializedObjectChecker(CheckerManager &Mgr) {
481   auto Chk = Mgr.registerChecker<UninitializedObjectChecker>();
482   Chk->IsPedantic = Mgr.getAnalyzerOptions().getBooleanOption(
483       "Pedantic", /*DefaultVal*/ false, Chk);
484   Chk->ShouldConvertNotesToWarnings = Mgr.getAnalyzerOptions().getBooleanOption(
485       "NotesAsWarnings", /*DefaultVal*/ false, Chk);
486   Chk->CheckPointeeInitialization = Mgr.getAnalyzerOptions().getBooleanOption(
487       "CheckPointeeInitialization", /*DefaultVal*/ false, Chk);
488 }
489