1 //===--- ModuleDependencyCollector.cpp - Collect module dependencies ------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Collect the dependencies of a set of modules.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "clang/Basic/CharInfo.h"
15 #include "clang/Frontend/Utils.h"
16 #include "clang/Lex/Preprocessor.h"
17 #include "clang/Serialization/ASTReader.h"
18 #include "llvm/ADT/StringMap.h"
19 #include "llvm/ADT/iterator_range.h"
20 #include "llvm/Support/FileSystem.h"
21 #include "llvm/Support/Path.h"
22 #include "llvm/Support/raw_ostream.h"
23 
24 using namespace clang;
25 
26 namespace {
27 /// Private implementations for ModuleDependencyCollector
28 class ModuleDependencyListener : public ASTReaderListener {
29   ModuleDependencyCollector &Collector;
30 public:
ModuleDependencyListener(ModuleDependencyCollector & Collector)31   ModuleDependencyListener(ModuleDependencyCollector &Collector)
32       : Collector(Collector) {}
needsInputFileVisitation()33   bool needsInputFileVisitation() override { return true; }
needsSystemInputFileVisitation()34   bool needsSystemInputFileVisitation() override { return true; }
visitInputFile(StringRef Filename,bool IsSystem,bool IsOverridden,bool IsExplicitModule)35   bool visitInputFile(StringRef Filename, bool IsSystem, bool IsOverridden,
36                       bool IsExplicitModule) override {
37     Collector.addFile(Filename);
38     return true;
39   }
40 };
41 
42 struct ModuleDependencyMMCallbacks : public ModuleMapCallbacks {
43   ModuleDependencyCollector &Collector;
ModuleDependencyMMCallbacks__anonaae4e8570111::ModuleDependencyMMCallbacks44   ModuleDependencyMMCallbacks(ModuleDependencyCollector &Collector)
45       : Collector(Collector) {}
46 
moduleMapAddHeader__anonaae4e8570111::ModuleDependencyMMCallbacks47   void moduleMapAddHeader(StringRef HeaderPath) override {
48     if (llvm::sys::path::is_absolute(HeaderPath))
49       Collector.addFile(HeaderPath);
50   }
moduleMapAddUmbrellaHeader__anonaae4e8570111::ModuleDependencyMMCallbacks51   void moduleMapAddUmbrellaHeader(FileManager *FileMgr,
52                                   const FileEntry *Header) override {
53     StringRef HeaderFilename = Header->getName();
54     moduleMapAddHeader(HeaderFilename);
55     // The FileManager can find and cache the symbolic link for a framework
56     // header before its real path, this means a module can have some of its
57     // headers to use other paths. Although this is usually not a problem, it's
58     // inconsistent, and not collecting the original path header leads to
59     // umbrella clashes while rebuilding modules in the crash reproducer. For
60     // example:
61     //    ApplicationServices.framework/Frameworks/ImageIO.framework/ImageIO.h
62     // instead of:
63     //    ImageIO.framework/ImageIO.h
64     //
65     // FIXME: this shouldn't be necessary once we have FileName instances
66     // around instead of FileEntry ones. For now, make sure we collect all
67     // that we need for the reproducer to work correctly.
68     StringRef UmbreallDirFromHeader =
69         llvm::sys::path::parent_path(HeaderFilename);
70     StringRef UmbrellaDir = Header->getDir()->getName();
71     if (!UmbrellaDir.equals(UmbreallDirFromHeader)) {
72       SmallString<128> AltHeaderFilename;
73       llvm::sys::path::append(AltHeaderFilename, UmbrellaDir,
74                               llvm::sys::path::filename(HeaderFilename));
75       if (FileMgr->getFile(AltHeaderFilename))
76         moduleMapAddHeader(AltHeaderFilename);
77     }
78   }
79 };
80 
81 }
82 
83 // TODO: move this to Support/Path.h and check for HAVE_REALPATH?
real_path(StringRef SrcPath,SmallVectorImpl<char> & RealPath)84 static bool real_path(StringRef SrcPath, SmallVectorImpl<char> &RealPath) {
85 #ifdef LLVM_ON_UNIX
86   char CanonicalPath[PATH_MAX];
87 
88   // TODO: emit a warning in case this fails...?
89   if (!realpath(SrcPath.str().c_str(), CanonicalPath))
90     return false;
91 
92   SmallString<256> RPath(CanonicalPath);
93   RealPath.swap(RPath);
94   return true;
95 #else
96   // FIXME: Add support for systems without realpath.
97   return false;
98 #endif
99 }
100 
attachToASTReader(ASTReader & R)101 void ModuleDependencyCollector::attachToASTReader(ASTReader &R) {
102   R.addListener(llvm::make_unique<ModuleDependencyListener>(*this));
103 }
104 
attachToPreprocessor(Preprocessor & PP)105 void ModuleDependencyCollector::attachToPreprocessor(Preprocessor &PP) {
106   PP.getHeaderSearchInfo().getModuleMap().addModuleMapCallbacks(
107       llvm::make_unique<ModuleDependencyMMCallbacks>(*this));
108 }
109 
isCaseSensitivePath(StringRef Path)110 static bool isCaseSensitivePath(StringRef Path) {
111   SmallString<256> TmpDest = Path, UpperDest, RealDest;
112   // Remove component traversals, links, etc.
113   if (!real_path(Path, TmpDest))
114     return true; // Current default value in vfs.yaml
115   Path = TmpDest;
116 
117   // Change path to all upper case and ask for its real path, if the latter
118   // exists and is equal to Path, it's not case sensitive. Default to case
119   // sensitive in the absense of realpath, since this is what the VFSWriter
120   // already expects when sensitivity isn't setup.
121   for (auto &C : Path)
122     UpperDest.push_back(toUppercase(C));
123   if (real_path(UpperDest, RealDest) && Path.equals(RealDest))
124     return false;
125   return true;
126 }
127 
writeFileMap()128 void ModuleDependencyCollector::writeFileMap() {
129   if (Seen.empty())
130     return;
131 
132   StringRef VFSDir = getDest();
133 
134   // Default to use relative overlay directories in the VFS yaml file. This
135   // allows crash reproducer scripts to work across machines.
136   VFSWriter.setOverlayDir(VFSDir);
137 
138   // Explicitly set case sensitivity for the YAML writer. For that, find out
139   // the sensitivity at the path where the headers all collected to.
140   VFSWriter.setCaseSensitivity(isCaseSensitivePath(VFSDir));
141 
142   // Do not rely on real path names when executing the crash reproducer scripts
143   // since we only want to actually use the files we have on the VFS cache.
144   VFSWriter.setUseExternalNames(false);
145 
146   std::error_code EC;
147   SmallString<256> YAMLPath = VFSDir;
148   llvm::sys::path::append(YAMLPath, "vfs.yaml");
149   llvm::raw_fd_ostream OS(YAMLPath, EC, llvm::sys::fs::F_Text);
150   if (EC) {
151     HasErrors = true;
152     return;
153   }
154   VFSWriter.write(OS);
155 }
156 
getRealPath(StringRef SrcPath,SmallVectorImpl<char> & Result)157 bool ModuleDependencyCollector::getRealPath(StringRef SrcPath,
158                                             SmallVectorImpl<char> &Result) {
159   using namespace llvm::sys;
160   SmallString<256> RealPath;
161   StringRef FileName = path::filename(SrcPath);
162   std::string Dir = path::parent_path(SrcPath).str();
163   auto DirWithSymLink = SymLinkMap.find(Dir);
164 
165   // Use real_path to fix any symbolic link component present in a path.
166   // Computing the real path is expensive, cache the search through the
167   // parent path directory.
168   if (DirWithSymLink == SymLinkMap.end()) {
169     if (!real_path(Dir, RealPath))
170       return false;
171     SymLinkMap[Dir] = RealPath.str();
172   } else {
173     RealPath = DirWithSymLink->second;
174   }
175 
176   path::append(RealPath, FileName);
177   Result.swap(RealPath);
178   return true;
179 }
180 
copyToRoot(StringRef Src)181 std::error_code ModuleDependencyCollector::copyToRoot(StringRef Src) {
182   using namespace llvm::sys;
183 
184   // We need an absolute src path to append to the root.
185   SmallString<256> AbsoluteSrc = Src;
186   fs::make_absolute(AbsoluteSrc);
187   // Canonicalize src to a native path to avoid mixed separator styles.
188   path::native(AbsoluteSrc);
189   // Remove redundant leading "./" pieces and consecutive separators.
190   AbsoluteSrc = path::remove_leading_dotslash(AbsoluteSrc);
191 
192   // Canonicalize the source path by removing "..", "." components.
193   SmallString<256> CanonicalPath = AbsoluteSrc;
194   path::remove_dots(CanonicalPath, /*remove_dot_dot=*/true);
195 
196   // If a ".." component is present after a symlink component, remove_dots may
197   // lead to the wrong real destination path. Let the source be canonicalized
198   // like that but make sure we always use the real path for the destination.
199   SmallString<256> RealPath;
200   if (!getRealPath(AbsoluteSrc, RealPath))
201     RealPath = CanonicalPath;
202   SmallString<256> Dest = getDest();
203   path::append(Dest, path::relative_path(RealPath));
204 
205   // Copy the file into place.
206   if (std::error_code EC = fs::create_directories(path::parent_path(Dest),
207                                                    /*IgnoreExisting=*/true))
208     return EC;
209   if (std::error_code EC = fs::copy_file(RealPath, Dest))
210     return EC;
211 
212   // Always map a canonical src path to its real path into the YAML, by doing
213   // this we map different virtual src paths to the same entry in the VFS
214   // overlay, which is a way to emulate symlink inside the VFS; this is also
215   // needed for correctness, not doing that can lead to module redifinition
216   // errors.
217   addFileMapping(CanonicalPath, Dest);
218   return std::error_code();
219 }
220 
addFile(StringRef Filename)221 void ModuleDependencyCollector::addFile(StringRef Filename) {
222   if (insertSeen(Filename))
223     if (copyToRoot(Filename))
224       HasErrors = true;
225 }
226