xref: /llvm-project/clang/lib/Serialization/ModuleManager.cpp (revision 9a9efbafa701f7c6a2c6732b4e8e2a4e0adc23e1)
1 //===--- ModuleManager.cpp - Module Manager ---------------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 //  This file defines the ModuleManager class, which manages a set of loaded
11 //  modules for the ASTReader.
12 //
13 //===----------------------------------------------------------------------===//
14 #include "clang/Frontend/PCHContainerOperations.h"
15 #include "clang/Lex/HeaderSearch.h"
16 #include "clang/Lex/ModuleMap.h"
17 #include "clang/Serialization/GlobalModuleIndex.h"
18 #include "clang/Serialization/ModuleManager.h"
19 #include "llvm/Support/MemoryBuffer.h"
20 #include "llvm/Support/Path.h"
21 #include "llvm/Support/raw_ostream.h"
22 #include <system_error>
23 
24 #ifndef NDEBUG
25 #include "llvm/Support/GraphWriter.h"
26 #endif
27 
28 using namespace clang;
29 using namespace serialization;
30 
31 ModuleFile *ModuleManager::lookup(StringRef Name) {
32   const FileEntry *Entry = FileMgr.getFile(Name, /*openFile=*/false,
33                                            /*cacheFailure=*/false);
34   if (Entry)
35     return lookup(Entry);
36 
37   return nullptr;
38 }
39 
40 ModuleFile *ModuleManager::lookup(const FileEntry *File) {
41   llvm::DenseMap<const FileEntry *, ModuleFile *>::iterator Known
42     = Modules.find(File);
43   if (Known == Modules.end())
44     return nullptr;
45 
46   return Known->second;
47 }
48 
49 std::unique_ptr<llvm::MemoryBuffer>
50 ModuleManager::lookupBuffer(StringRef Name) {
51   const FileEntry *Entry = FileMgr.getFile(Name, /*openFile=*/false,
52                                            /*cacheFailure=*/false);
53   return std::move(InMemoryBuffers[Entry]);
54 }
55 
56 ModuleManager::AddModuleResult
57 ModuleManager::addModule(StringRef FileName, ModuleKind Type,
58                          SourceLocation ImportLoc, ModuleFile *ImportedBy,
59                          unsigned Generation,
60                          off_t ExpectedSize, time_t ExpectedModTime,
61                          ASTFileSignature ExpectedSignature,
62                          ASTFileSignatureReader ReadSignature,
63                          ModuleFile *&Module,
64                          std::string &ErrorStr) {
65   Module = nullptr;
66 
67   // Look for the file entry. This only fails if the expected size or
68   // modification time differ.
69   const FileEntry *Entry;
70   if (Type == MK_ExplicitModule) {
71     // If we're not expecting to pull this file out of the module cache, it
72     // might have a different mtime due to being moved across filesystems in
73     // a distributed build. The size must still match, though. (As must the
74     // contents, but we can't check that.)
75     ExpectedModTime = 0;
76   }
77   if (lookupModuleFile(FileName, ExpectedSize, ExpectedModTime, Entry)) {
78     ErrorStr = "module file out of date";
79     return OutOfDate;
80   }
81 
82   if (!Entry && FileName != "-") {
83     ErrorStr = "module file not found";
84     return Missing;
85   }
86 
87   // Check whether we already loaded this module, before
88   ModuleFile *&ModuleEntry = Modules[Entry];
89   bool NewModule = false;
90   if (!ModuleEntry) {
91     // Allocate a new module.
92     ModuleFile *New = new ModuleFile(Type, Generation);
93     New->Index = Chain.size();
94     New->FileName = FileName.str();
95     New->File = Entry;
96     New->ImportLoc = ImportLoc;
97     Chain.push_back(New);
98     if (!New->isModule())
99       PCHChain.push_back(New);
100     if (!ImportedBy)
101       Roots.push_back(New);
102     NewModule = true;
103     ModuleEntry = New;
104 
105     New->InputFilesValidationTimestamp = 0;
106     if (New->Kind == MK_ImplicitModule) {
107       std::string TimestampFilename = New->getTimestampFilename();
108       vfs::Status Status;
109       // A cached stat value would be fine as well.
110       if (!FileMgr.getNoncachedStatValue(TimestampFilename, Status))
111         New->InputFilesValidationTimestamp =
112             Status.getLastModificationTime().toEpochTime();
113     }
114 
115     // Load the contents of the module
116     if (std::unique_ptr<llvm::MemoryBuffer> Buffer = lookupBuffer(FileName)) {
117       // The buffer was already provided for us.
118       New->Buffer = std::move(Buffer);
119     } else {
120       // Open the AST file.
121       llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Buf(
122           (std::error_code()));
123       if (FileName == "-") {
124         Buf = llvm::MemoryBuffer::getSTDIN();
125       } else {
126         // Leave the FileEntry open so if it gets read again by another
127         // ModuleManager it must be the same underlying file.
128         // FIXME: Because FileManager::getFile() doesn't guarantee that it will
129         // give us an open file, this may not be 100% reliable.
130         Buf = FileMgr.getBufferForFile(New->File,
131                                        /*IsVolatile=*/false,
132                                        /*ShouldClose=*/false);
133       }
134 
135       if (!Buf) {
136         ErrorStr = Buf.getError().message();
137         return Missing;
138       }
139 
140       New->Buffer = std::move(*Buf);
141     }
142 
143     // Initialize the stream.
144     PCHContainerRdr.ExtractPCH(New->Buffer->getMemBufferRef(), New->StreamFile);
145   }
146 
147   if (ExpectedSignature) {
148     if (NewModule)
149       ModuleEntry->Signature = ReadSignature(ModuleEntry->StreamFile);
150     else
151       assert(ModuleEntry->Signature == ReadSignature(ModuleEntry->StreamFile));
152 
153     if (ModuleEntry->Signature != ExpectedSignature) {
154       ErrorStr = ModuleEntry->Signature ? "signature mismatch"
155                                         : "could not read module signature";
156 
157       if (NewModule) {
158         // Remove the module file immediately, since removeModules might try to
159         // invalidate the file cache for Entry, and that is not safe if this
160         // module is *itself* up to date, but has an out-of-date importer.
161         Modules.erase(Entry);
162         assert(Chain.back() == ModuleEntry);
163         Chain.pop_back();
164         if (!ModuleEntry->isModule())
165           PCHChain.pop_back();
166         if (Roots.back() == ModuleEntry)
167           Roots.pop_back();
168         else
169           assert(ImportedBy);
170         delete ModuleEntry;
171       }
172       return OutOfDate;
173     }
174   }
175 
176   if (ImportedBy) {
177     ModuleEntry->ImportedBy.insert(ImportedBy);
178     ImportedBy->Imports.insert(ModuleEntry);
179   } else {
180     if (!ModuleEntry->DirectlyImported)
181       ModuleEntry->ImportLoc = ImportLoc;
182 
183     ModuleEntry->DirectlyImported = true;
184   }
185 
186   Module = ModuleEntry;
187   return NewModule? NewlyLoaded : AlreadyLoaded;
188 }
189 
190 void ModuleManager::removeModules(
191     ModuleIterator first, ModuleIterator last,
192     llvm::SmallPtrSetImpl<ModuleFile *> &LoadedSuccessfully,
193     ModuleMap *modMap) {
194   if (first == last)
195     return;
196 
197   // Collect the set of module file pointers that we'll be removing.
198   llvm::SmallPtrSet<ModuleFile *, 4> victimSet(first, last);
199 
200   auto IsVictim = [&](ModuleFile *MF) {
201     return victimSet.count(MF);
202   };
203   // Remove any references to the now-destroyed modules.
204   for (unsigned i = 0, n = Chain.size(); i != n; ++i) {
205     Chain[i]->ImportedBy.remove_if(IsVictim);
206   }
207   Roots.erase(std::remove_if(Roots.begin(), Roots.end(), IsVictim),
208               Roots.end());
209 
210   // Remove the modules from the PCH chain.
211   for (auto I = first; I != last; ++I) {
212     if (!(*I)->isModule()) {
213       PCHChain.erase(std::find(PCHChain.begin(), PCHChain.end(), *I),
214                      PCHChain.end());
215       break;
216     }
217   }
218 
219   // Delete the modules and erase them from the various structures.
220   for (ModuleIterator victim = first; victim != last; ++victim) {
221     Modules.erase((*victim)->File);
222 
223     if (modMap) {
224       StringRef ModuleName = (*victim)->ModuleName;
225       if (Module *mod = modMap->findModule(ModuleName)) {
226         mod->setASTFile(nullptr);
227       }
228     }
229 
230     // Files that didn't make it through ReadASTCore successfully will be
231     // rebuilt (or there was an error). Invalidate them so that we can load the
232     // new files that will be renamed over the old ones.
233     if (LoadedSuccessfully.count(*victim) == 0)
234       FileMgr.invalidateCache((*victim)->File);
235 
236     delete *victim;
237   }
238 
239   // Remove the modules from the chain.
240   Chain.erase(first, last);
241 }
242 
243 void
244 ModuleManager::addInMemoryBuffer(StringRef FileName,
245                                  std::unique_ptr<llvm::MemoryBuffer> Buffer) {
246 
247   const FileEntry *Entry =
248       FileMgr.getVirtualFile(FileName, Buffer->getBufferSize(), 0);
249   InMemoryBuffers[Entry] = std::move(Buffer);
250 }
251 
252 bool ModuleManager::addKnownModuleFile(StringRef FileName) {
253   const FileEntry *File;
254   if (lookupModuleFile(FileName, 0, 0, File))
255     return true;
256   if (!Modules.count(File))
257     AdditionalKnownModuleFiles.insert(File);
258   return false;
259 }
260 
261 ModuleManager::VisitState *ModuleManager::allocateVisitState() {
262   // Fast path: if we have a cached state, use it.
263   if (FirstVisitState) {
264     VisitState *Result = FirstVisitState;
265     FirstVisitState = FirstVisitState->NextState;
266     Result->NextState = nullptr;
267     return Result;
268   }
269 
270   // Allocate and return a new state.
271   return new VisitState(size());
272 }
273 
274 void ModuleManager::returnVisitState(VisitState *State) {
275   assert(State->NextState == nullptr && "Visited state is in list?");
276   State->NextState = FirstVisitState;
277   FirstVisitState = State;
278 }
279 
280 void ModuleManager::setGlobalIndex(GlobalModuleIndex *Index) {
281   GlobalIndex = Index;
282   if (!GlobalIndex) {
283     ModulesInCommonWithGlobalIndex.clear();
284     return;
285   }
286 
287   // Notify the global module index about all of the modules we've already
288   // loaded.
289   for (unsigned I = 0, N = Chain.size(); I != N; ++I) {
290     if (!GlobalIndex->loadedModuleFile(Chain[I])) {
291       ModulesInCommonWithGlobalIndex.push_back(Chain[I]);
292     }
293   }
294 }
295 
296 void ModuleManager::moduleFileAccepted(ModuleFile *MF) {
297   AdditionalKnownModuleFiles.remove(MF->File);
298 
299   if (!GlobalIndex || GlobalIndex->loadedModuleFile(MF))
300     return;
301 
302   ModulesInCommonWithGlobalIndex.push_back(MF);
303 }
304 
305 ModuleManager::ModuleManager(FileManager &FileMgr,
306                              const PCHContainerReader &PCHContainerRdr)
307     : FileMgr(FileMgr), PCHContainerRdr(PCHContainerRdr), GlobalIndex(),
308       FirstVisitState(nullptr) {}
309 
310 ModuleManager::~ModuleManager() {
311   for (unsigned i = 0, e = Chain.size(); i != e; ++i)
312     delete Chain[e - i - 1];
313   delete FirstVisitState;
314 }
315 
316 void ModuleManager::visit(llvm::function_ref<bool(ModuleFile &M)> Visitor,
317                           llvm::SmallPtrSetImpl<ModuleFile *> *ModuleFilesHit) {
318   // If the visitation order vector is the wrong size, recompute the order.
319   if (VisitOrder.size() != Chain.size()) {
320     unsigned N = size();
321     VisitOrder.clear();
322     VisitOrder.reserve(N);
323 
324     // Record the number of incoming edges for each module. When we
325     // encounter a module with no incoming edges, push it into the queue
326     // to seed the queue.
327     SmallVector<ModuleFile *, 4> Queue;
328     Queue.reserve(N);
329     llvm::SmallVector<unsigned, 4> UnusedIncomingEdges;
330     UnusedIncomingEdges.resize(size());
331     for (auto M = rbegin(), MEnd = rend(); M != MEnd; ++M) {
332       unsigned Size = (*M)->ImportedBy.size();
333       UnusedIncomingEdges[(*M)->Index] = Size;
334       if (!Size)
335         Queue.push_back(*M);
336     }
337 
338     // Traverse the graph, making sure to visit a module before visiting any
339     // of its dependencies.
340     while (!Queue.empty()) {
341       ModuleFile *CurrentModule = Queue.pop_back_val();
342       VisitOrder.push_back(CurrentModule);
343 
344       // For any module that this module depends on, push it on the
345       // stack (if it hasn't already been marked as visited).
346       for (auto M = CurrentModule->Imports.rbegin(),
347                 MEnd = CurrentModule->Imports.rend();
348            M != MEnd; ++M) {
349         // Remove our current module as an impediment to visiting the
350         // module we depend on. If we were the last unvisited module
351         // that depends on this particular module, push it into the
352         // queue to be visited.
353         unsigned &NumUnusedEdges = UnusedIncomingEdges[(*M)->Index];
354         if (NumUnusedEdges && (--NumUnusedEdges == 0))
355           Queue.push_back(*M);
356       }
357     }
358 
359     assert(VisitOrder.size() == N && "Visitation order is wrong?");
360 
361     delete FirstVisitState;
362     FirstVisitState = nullptr;
363   }
364 
365   VisitState *State = allocateVisitState();
366   unsigned VisitNumber = State->NextVisitNumber++;
367 
368   // If the caller has provided us with a hit-set that came from the global
369   // module index, mark every module file in common with the global module
370   // index that is *not* in that set as 'visited'.
371   if (ModuleFilesHit && !ModulesInCommonWithGlobalIndex.empty()) {
372     for (unsigned I = 0, N = ModulesInCommonWithGlobalIndex.size(); I != N; ++I)
373     {
374       ModuleFile *M = ModulesInCommonWithGlobalIndex[I];
375       if (!ModuleFilesHit->count(M))
376         State->VisitNumber[M->Index] = VisitNumber;
377     }
378   }
379 
380   for (unsigned I = 0, N = VisitOrder.size(); I != N; ++I) {
381     ModuleFile *CurrentModule = VisitOrder[I];
382     // Should we skip this module file?
383     if (State->VisitNumber[CurrentModule->Index] == VisitNumber)
384       continue;
385 
386     // Visit the module.
387     assert(State->VisitNumber[CurrentModule->Index] == VisitNumber - 1);
388     State->VisitNumber[CurrentModule->Index] = VisitNumber;
389     if (!Visitor(*CurrentModule))
390       continue;
391 
392     // The visitor has requested that cut off visitation of any
393     // module that the current module depends on. To indicate this
394     // behavior, we mark all of the reachable modules as having been visited.
395     ModuleFile *NextModule = CurrentModule;
396     do {
397       // For any module that this module depends on, push it on the
398       // stack (if it hasn't already been marked as visited).
399       for (llvm::SetVector<ModuleFile *>::iterator
400              M = NextModule->Imports.begin(),
401              MEnd = NextModule->Imports.end();
402            M != MEnd; ++M) {
403         if (State->VisitNumber[(*M)->Index] != VisitNumber) {
404           State->Stack.push_back(*M);
405           State->VisitNumber[(*M)->Index] = VisitNumber;
406         }
407       }
408 
409       if (State->Stack.empty())
410         break;
411 
412       // Pop the next module off the stack.
413       NextModule = State->Stack.pop_back_val();
414     } while (true);
415   }
416 
417   returnVisitState(State);
418 }
419 
420 static void markVisitedDepthFirst(ModuleFile &M,
421                                   SmallVectorImpl<bool> &Visited) {
422   for (llvm::SetVector<ModuleFile *>::iterator IM = M.Imports.begin(),
423                                                IMEnd = M.Imports.end();
424        IM != IMEnd; ++IM) {
425     if (Visited[(*IM)->Index])
426       continue;
427     Visited[(*IM)->Index] = true;
428     if (!M.DirectlyImported)
429       markVisitedDepthFirst(**IM, Visited);
430   }
431 }
432 
433 /// \brief Perform a depth-first visit of the current module.
434 static bool visitDepthFirst(
435     ModuleFile &M,
436     ModuleManager::DFSPreorderControl (*PreorderVisitor)(ModuleFile &M,
437                                                          void *UserData),
438     bool (*PostorderVisitor)(ModuleFile &M, void *UserData), void *UserData,
439     SmallVectorImpl<bool> &Visited) {
440   if (PreorderVisitor) {
441     switch (PreorderVisitor(M, UserData)) {
442     case ModuleManager::Abort:
443       return true;
444     case ModuleManager::SkipImports:
445       markVisitedDepthFirst(M, Visited);
446       return false;
447     case ModuleManager::Continue:
448       break;
449     }
450   }
451 
452   // Visit children
453   for (llvm::SetVector<ModuleFile *>::iterator IM = M.Imports.begin(),
454                                             IMEnd = M.Imports.end();
455        IM != IMEnd; ++IM) {
456     if (Visited[(*IM)->Index])
457       continue;
458     Visited[(*IM)->Index] = true;
459 
460     if (visitDepthFirst(**IM, PreorderVisitor, PostorderVisitor, UserData, Visited))
461       return true;
462   }
463 
464   if (PostorderVisitor)
465     return PostorderVisitor(M, UserData);
466 
467   return false;
468 }
469 
470 void ModuleManager::visitDepthFirst(
471     ModuleManager::DFSPreorderControl (*PreorderVisitor)(ModuleFile &M,
472                                                          void *UserData),
473     bool (*PostorderVisitor)(ModuleFile &M, void *UserData), void *UserData) {
474   SmallVector<bool, 16> Visited(size(), false);
475   for (unsigned I = 0, N = Roots.size(); I != N; ++I) {
476     if (Visited[Roots[I]->Index])
477       continue;
478     Visited[Roots[I]->Index] = true;
479 
480     if (::visitDepthFirst(*Roots[I], PreorderVisitor, PostorderVisitor, UserData, Visited))
481       return;
482   }
483 }
484 
485 bool ModuleManager::lookupModuleFile(StringRef FileName,
486                                      off_t ExpectedSize,
487                                      time_t ExpectedModTime,
488                                      const FileEntry *&File) {
489   // Open the file immediately to ensure there is no race between stat'ing and
490   // opening the file.
491   File = FileMgr.getFile(FileName, /*openFile=*/true, /*cacheFailure=*/false);
492 
493   if (!File && FileName != "-") {
494     return false;
495   }
496 
497   if ((ExpectedSize && ExpectedSize != File->getSize()) ||
498       (ExpectedModTime && ExpectedModTime != File->getModificationTime()))
499     // Do not destroy File, as it may be referenced. If we need to rebuild it,
500     // it will be destroyed by removeModules.
501     return true;
502 
503   return false;
504 }
505 
506 #ifndef NDEBUG
507 namespace llvm {
508   template<>
509   struct GraphTraits<ModuleManager> {
510     typedef ModuleFile NodeType;
511     typedef llvm::SetVector<ModuleFile *>::const_iterator ChildIteratorType;
512     typedef ModuleManager::ModuleConstIterator nodes_iterator;
513 
514     static ChildIteratorType child_begin(NodeType *Node) {
515       return Node->Imports.begin();
516     }
517 
518     static ChildIteratorType child_end(NodeType *Node) {
519       return Node->Imports.end();
520     }
521 
522     static nodes_iterator nodes_begin(const ModuleManager &Manager) {
523       return Manager.begin();
524     }
525 
526     static nodes_iterator nodes_end(const ModuleManager &Manager) {
527       return Manager.end();
528     }
529   };
530 
531   template<>
532   struct DOTGraphTraits<ModuleManager> : public DefaultDOTGraphTraits {
533     explicit DOTGraphTraits(bool IsSimple = false)
534       : DefaultDOTGraphTraits(IsSimple) { }
535 
536     static bool renderGraphFromBottomUp() {
537       return true;
538     }
539 
540     std::string getNodeLabel(ModuleFile *M, const ModuleManager&) {
541       return M->ModuleName;
542     }
543   };
544 }
545 
/// \brief Passes this module manager to llvm::ViewGraph under the name
/// "Modules". Only compiled when NDEBUG is not defined.
void ModuleManager::viewGraph() {
  llvm::ViewGraph(*this, "Modules");
}
549 #endif
550