19dba64beSDimitry Andric //===-- CppModuleConfiguration.cpp ----------------------------------------===//
29dba64beSDimitry Andric //
39dba64beSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
49dba64beSDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
59dba64beSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
69dba64beSDimitry Andric //
79dba64beSDimitry Andric //===----------------------------------------------------------------------===//
89dba64beSDimitry Andric 
99dba64beSDimitry Andric #include "CppModuleConfiguration.h"
109dba64beSDimitry Andric 
119dba64beSDimitry Andric #include "ClangHost.h"
129dba64beSDimitry Andric #include "lldb/Host/FileSystem.h"
1306c3fb27SDimitry Andric #include "llvm/TargetParser/Triple.h"
14bdd1243dSDimitry Andric #include <optional>
159dba64beSDimitry Andric 
169dba64beSDimitry Andric using namespace lldb_private;
179dba64beSDimitry Andric 
189dba64beSDimitry Andric bool CppModuleConfiguration::SetOncePath::TrySet(llvm::StringRef path) {
199dba64beSDimitry Andric   // Setting for the first time always works.
209dba64beSDimitry Andric   if (m_first) {
219dba64beSDimitry Andric     m_path = path.str();
229dba64beSDimitry Andric     m_valid = true;
239dba64beSDimitry Andric     m_first = false;
249dba64beSDimitry Andric     return true;
259dba64beSDimitry Andric   }
269dba64beSDimitry Andric   // Changing the path to the same value is fine.
279dba64beSDimitry Andric   if (m_path == path)
289dba64beSDimitry Andric     return true;
299dba64beSDimitry Andric 
309dba64beSDimitry Andric   // Changing the path after it was already set is not allowed.
319dba64beSDimitry Andric   m_valid = false;
329dba64beSDimitry Andric   return false;
339dba64beSDimitry Andric }
349dba64beSDimitry Andric 
354824e7fdSDimitry Andric static llvm::SmallVector<std::string, 2>
364824e7fdSDimitry Andric getTargetIncludePaths(const llvm::Triple &triple) {
374824e7fdSDimitry Andric   llvm::SmallVector<std::string, 2> paths;
384824e7fdSDimitry Andric   if (!triple.str().empty()) {
394824e7fdSDimitry Andric     paths.push_back("/usr/include/" + triple.str());
404824e7fdSDimitry Andric     if (!triple.getArchName().empty() ||
414824e7fdSDimitry Andric         triple.getOSAndEnvironmentName().empty())
424824e7fdSDimitry Andric       paths.push_back(("/usr/include/" + triple.getArchName() + "-" +
434824e7fdSDimitry Andric                        triple.getOSAndEnvironmentName())
444824e7fdSDimitry Andric                           .str());
454824e7fdSDimitry Andric   }
464824e7fdSDimitry Andric   return paths;
474824e7fdSDimitry Andric }
484824e7fdSDimitry Andric 
494824e7fdSDimitry Andric /// Returns the include path matching the given pattern for the given file
50bdd1243dSDimitry Andric /// path (or std::nullopt if the path doesn't match the pattern).
51bdd1243dSDimitry Andric static std::optional<llvm::StringRef>
524824e7fdSDimitry Andric guessIncludePath(llvm::StringRef path_to_file, llvm::StringRef pattern) {
534824e7fdSDimitry Andric   if (pattern.empty())
54bdd1243dSDimitry Andric     return std::nullopt;
554824e7fdSDimitry Andric   size_t pos = path_to_file.find(pattern);
564824e7fdSDimitry Andric   if (pos == llvm::StringRef::npos)
57bdd1243dSDimitry Andric     return std::nullopt;
584824e7fdSDimitry Andric 
594824e7fdSDimitry Andric   return path_to_file.substr(0, pos + pattern.size());
604824e7fdSDimitry Andric }
614824e7fdSDimitry Andric 
624824e7fdSDimitry Andric bool CppModuleConfiguration::analyzeFile(const FileSpec &f,
634824e7fdSDimitry Andric                                          const llvm::Triple &triple) {
649dba64beSDimitry Andric   using namespace llvm::sys::path;
659dba64beSDimitry Andric   // Convert to slashes to make following operations simpler.
669dba64beSDimitry Andric   std::string dir_buffer = convert_to_slash(f.GetDirectory().GetStringRef());
679dba64beSDimitry Andric   llvm::StringRef posix_dir(dir_buffer);
689dba64beSDimitry Andric 
699dba64beSDimitry Andric   // Check for /c++/vX/ that is used by libc++.
709dba64beSDimitry Andric   static llvm::Regex libcpp_regex(R"regex(/c[+][+]/v[0-9]/)regex");
71e8d8bef9SDimitry Andric   // If the path is in the libc++ include directory use it as the found libc++
72e8d8bef9SDimitry Andric   // path. Ignore subdirectories such as /c++/v1/experimental as those don't
73e8d8bef9SDimitry Andric   // need to be specified in the header search.
74*0fca6ea1SDimitry Andric   if (libcpp_regex.match(convert_to_slash(f.GetPath())) &&
755f757f3fSDimitry Andric       parent_path(posix_dir, Style::posix).ends_with("c++")) {
764824e7fdSDimitry Andric     if (!m_std_inc.TrySet(posix_dir))
774824e7fdSDimitry Andric       return false;
784824e7fdSDimitry Andric     if (triple.str().empty())
794824e7fdSDimitry Andric       return true;
804824e7fdSDimitry Andric 
814824e7fdSDimitry Andric     posix_dir.consume_back("c++/v1");
824824e7fdSDimitry Andric     // Check if this is a target-specific libc++ include directory.
834824e7fdSDimitry Andric     return m_std_target_inc.TrySet(
844824e7fdSDimitry Andric         (posix_dir + triple.str() + "/c++/v1").str());
859dba64beSDimitry Andric   }
869dba64beSDimitry Andric 
87bdd1243dSDimitry Andric   std::optional<llvm::StringRef> inc_path;
884824e7fdSDimitry Andric   // Target specific paths contains /usr/include, so we check them first
894824e7fdSDimitry Andric   for (auto &path : getTargetIncludePaths(triple)) {
904824e7fdSDimitry Andric     if ((inc_path = guessIncludePath(posix_dir, path)))
914824e7fdSDimitry Andric       return m_c_target_inc.TrySet(*inc_path);
924824e7fdSDimitry Andric   }
934824e7fdSDimitry Andric   if ((inc_path = guessIncludePath(posix_dir, "/usr/include")))
944824e7fdSDimitry Andric     return m_c_inc.TrySet(*inc_path);
959dba64beSDimitry Andric 
969dba64beSDimitry Andric   // File wasn't interesting, continue analyzing.
979dba64beSDimitry Andric   return true;
989dba64beSDimitry Andric }
999dba64beSDimitry Andric 
100e8d8bef9SDimitry Andric /// Utility function for just appending two paths.
101e8d8bef9SDimitry Andric static std::string MakePath(llvm::StringRef lhs, llvm::StringRef rhs) {
102e8d8bef9SDimitry Andric   llvm::SmallString<256> result(lhs);
103e8d8bef9SDimitry Andric   llvm::sys::path::append(result, rhs);
104e8d8bef9SDimitry Andric   return std::string(result);
105e8d8bef9SDimitry Andric }
106e8d8bef9SDimitry Andric 
1079dba64beSDimitry Andric bool CppModuleConfiguration::hasValidConfig() {
108e8d8bef9SDimitry Andric   // We need to have a C and C++ include dir for a valid configuration.
109e8d8bef9SDimitry Andric   if (!m_c_inc.Valid() || !m_std_inc.Valid())
110e8d8bef9SDimitry Andric     return false;
111e8d8bef9SDimitry Andric 
112e8d8bef9SDimitry Andric   // Do some basic sanity checks on the directories that we don't activate
113e8d8bef9SDimitry Andric   // the module when it's clear that it's not usable.
114e8d8bef9SDimitry Andric   const std::vector<std::string> files_to_check = {
115e8d8bef9SDimitry Andric       // * Check that the C library contains at least one random C standard
116e8d8bef9SDimitry Andric       //   library header.
117e8d8bef9SDimitry Andric       MakePath(m_c_inc.Get(), "stdio.h"),
118e8d8bef9SDimitry Andric       // * Without a libc++ modulemap file we can't have a 'std' module that
119e8d8bef9SDimitry Andric       //   could be imported.
120e8d8bef9SDimitry Andric       MakePath(m_std_inc.Get(), "module.modulemap"),
121e8d8bef9SDimitry Andric       // * Check for a random libc++ header (vector in this case) that has to
122e8d8bef9SDimitry Andric       //   exist in a working libc++ setup.
123e8d8bef9SDimitry Andric       MakePath(m_std_inc.Get(), "vector"),
124e8d8bef9SDimitry Andric   };
125e8d8bef9SDimitry Andric 
126e8d8bef9SDimitry Andric   for (llvm::StringRef file_to_check : files_to_check) {
127e8d8bef9SDimitry Andric     if (!FileSystem::Instance().Exists(file_to_check))
128e8d8bef9SDimitry Andric       return false;
129e8d8bef9SDimitry Andric   }
130e8d8bef9SDimitry Andric 
131e8d8bef9SDimitry Andric   return true;
1329dba64beSDimitry Andric }
1339dba64beSDimitry Andric 
1349dba64beSDimitry Andric CppModuleConfiguration::CppModuleConfiguration(
1354824e7fdSDimitry Andric     const FileSpecList &support_files, const llvm::Triple &triple) {
1369dba64beSDimitry Andric   // Analyze all files we were given to build the configuration.
1371db9f3b2SDimitry Andric   bool error = !llvm::all_of(support_files, [&](auto &file) {
1381db9f3b2SDimitry Andric     return CppModuleConfiguration::analyzeFile(file, triple);
1391db9f3b2SDimitry Andric   });
1409dba64beSDimitry Andric   // If we have a valid configuration at this point, set the
1419dba64beSDimitry Andric   // include directories and module list that should be used.
1429dba64beSDimitry Andric   if (!error && hasValidConfig()) {
1439dba64beSDimitry Andric     // Calculate the resource directory for LLDB.
1449dba64beSDimitry Andric     llvm::SmallString<256> resource_dir;
1459dba64beSDimitry Andric     llvm::sys::path::append(resource_dir, GetClangResourceDir().GetPath(),
1469dba64beSDimitry Andric                             "include");
1475ffd83dbSDimitry Andric     m_resource_inc = std::string(resource_dir.str());
1489dba64beSDimitry Andric 
1499dba64beSDimitry Andric     // This order matches the way Clang orders these directories.
150e8d8bef9SDimitry Andric     m_include_dirs = {m_std_inc.Get().str(), m_resource_inc,
151e8d8bef9SDimitry Andric                       m_c_inc.Get().str()};
1524824e7fdSDimitry Andric     if (m_c_target_inc.Valid())
1534824e7fdSDimitry Andric       m_include_dirs.push_back(m_c_target_inc.Get().str());
1544824e7fdSDimitry Andric     if (m_std_target_inc.Valid())
1554824e7fdSDimitry Andric       m_include_dirs.push_back(m_std_target_inc.Get().str());
1569dba64beSDimitry Andric     m_imported_modules = {"std"};
1579dba64beSDimitry Andric   }
1589dba64beSDimitry Andric }
159