1 //===- DependencyScanningFilesystem.h - clang-scan-deps fs ===---*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #ifndef LLVM_CLANG_TOOLING_DEPENDENCY_SCANNING_FILESYSTEM_H
10 #define LLVM_CLANG_TOOLING_DEPENDENCY_SCANNING_FILESYSTEM_H
11 
12 #include "clang/Basic/LLVM.h"
13 #include "clang/Lex/PreprocessorExcludedConditionalDirectiveSkipMapping.h"
14 #include "llvm/ADT/StringMap.h"
15 #include "llvm/ADT/StringSet.h"
16 #include "llvm/Support/Allocator.h"
17 #include "llvm/Support/ErrorOr.h"
18 #include "llvm/Support/VirtualFileSystem.h"
19 #include <mutex>
20 
21 namespace clang {
22 namespace tooling {
23 namespace dependencies {
24 
25 /// An in-memory representation of a file system entity that is of interest to
26 /// the dependency scanning filesystem.
27 ///
28 /// It represents one of the following:
29 /// - an opened source file with minimized contents and a stat value.
30 /// - an opened source file with original contents and a stat value.
31 /// - a directory entry with its stat value.
32 /// - an error value to represent a file system error.
33 /// - a placeholder with an invalid stat indicating a not yet initialized entry.
34 class CachedFileSystemEntry {
35 public:
36   /// Default constructor creates an entry with an invalid stat.
CachedFileSystemEntry()37   CachedFileSystemEntry() : MaybeStat(llvm::vfs::Status()) {}
38 
CachedFileSystemEntry(std::error_code Error)39   CachedFileSystemEntry(std::error_code Error) : MaybeStat(std::move(Error)) {}
40 
41   /// Create an entry that represents an opened source file with minimized or
42   /// original contents.
43   ///
44   /// The filesystem opens the file even for `stat` calls open to avoid the
45   /// issues with stat + open of minimized files that might lead to a
46   /// mismatching size of the file. If file is not minimized, the full file is
47   /// read and copied into memory to ensure that it's not memory mapped to avoid
48   /// running out of file descriptors.
49   static CachedFileSystemEntry createFileEntry(StringRef Filename,
50                                                llvm::vfs::FileSystem &FS,
51                                                bool Minimize = true);
52 
53   /// Create an entry that represents a directory on the filesystem.
54   static CachedFileSystemEntry createDirectoryEntry(llvm::vfs::Status &&Stat);
55 
56   /// \returns True if the entry is valid.
isValid()57   bool isValid() const { return !MaybeStat || MaybeStat->isStatusKnown(); }
58 
59   /// \returns True if the current entry points to a directory.
isDirectory()60   bool isDirectory() const { return MaybeStat && MaybeStat->isDirectory(); }
61 
62   /// \returns The error or the file's contents.
getContents()63   llvm::ErrorOr<StringRef> getContents() const {
64     if (!MaybeStat)
65       return MaybeStat.getError();
66     assert(!MaybeStat->isDirectory() && "not a file");
67     assert(isValid() && "not initialized");
68     return StringRef(Contents);
69   }
70 
71   /// \returns The error or the status of the entry.
getStatus()72   llvm::ErrorOr<llvm::vfs::Status> getStatus() const {
73     assert(isValid() && "not initialized");
74     return MaybeStat;
75   }
76 
77   /// \returns the name of the file.
getName()78   StringRef getName() const {
79     assert(isValid() && "not initialized");
80     return MaybeStat->getName();
81   }
82 
83   /// Return the mapping between location -> distance that is used to speed up
84   /// the block skipping in the preprocessor.
getPPSkippedRangeMapping()85   const PreprocessorSkippedRangeMapping &getPPSkippedRangeMapping() const {
86     return PPSkippedRangeMapping;
87   }
88 
89   CachedFileSystemEntry(CachedFileSystemEntry &&) = default;
90   CachedFileSystemEntry &operator=(CachedFileSystemEntry &&) = default;
91 
92   CachedFileSystemEntry(const CachedFileSystemEntry &) = delete;
93   CachedFileSystemEntry &operator=(const CachedFileSystemEntry &) = delete;
94 
95 private:
96   llvm::ErrorOr<llvm::vfs::Status> MaybeStat;
97   // Store the contents in a small string to allow a
98   // move from the small string for the minimized contents.
99   // Note: small size of 1 allows us to store an empty string with an implicit
100   // null terminator without any allocations.
101   llvm::SmallString<1> Contents;
102   PreprocessorSkippedRangeMapping PPSkippedRangeMapping;
103 };
104 
105 /// This class is a shared cache, that caches the 'stat' and 'open' calls to the
106 /// underlying real file system.
107 ///
108 /// It is sharded based on the hash of the key to reduce the lock contention for
109 /// the worker threads.
110 class DependencyScanningFilesystemSharedCache {
111 public:
112   struct SharedFileSystemEntry {
113     std::mutex ValueLock;
114     CachedFileSystemEntry Value;
115   };
116 
117   DependencyScanningFilesystemSharedCache();
118 
119   /// Returns a cache entry for the corresponding key.
120   ///
121   /// A new cache entry is created if the key is not in the cache. This is a
122   /// thread safe call.
123   SharedFileSystemEntry &get(StringRef Key);
124 
125 private:
126   struct CacheShard {
127     std::mutex CacheLock;
128     llvm::StringMap<SharedFileSystemEntry, llvm::BumpPtrAllocator> Cache;
129   };
130   std::unique_ptr<CacheShard[]> CacheShards;
131   unsigned NumShards;
132 };
133 
134 /// A virtual file system optimized for the dependency discovery.
135 ///
136 /// It is primarily designed to work with source files whose contents was was
137 /// preprocessed to remove any tokens that are unlikely to affect the dependency
138 /// computation.
139 ///
140 /// This is not a thread safe VFS. A single instance is meant to be used only in
141 /// one thread. Multiple instances are allowed to service multiple threads
142 /// running in parallel.
143 class DependencyScanningWorkerFilesystem : public llvm::vfs::ProxyFileSystem {
144 public:
DependencyScanningWorkerFilesystem(DependencyScanningFilesystemSharedCache & SharedCache,IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS,ExcludedPreprocessorDirectiveSkipMapping * PPSkipMappings)145   DependencyScanningWorkerFilesystem(
146       DependencyScanningFilesystemSharedCache &SharedCache,
147       IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS,
148       ExcludedPreprocessorDirectiveSkipMapping *PPSkipMappings)
149       : ProxyFileSystem(std::move(FS)), SharedCache(SharedCache),
150         PPSkipMappings(PPSkipMappings) {}
151 
152   llvm::ErrorOr<llvm::vfs::Status> status(const Twine &Path) override;
153   llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>>
154   openFileForRead(const Twine &Path) override;
155 
156   /// The set of files that should not be minimized.
157   llvm::StringSet<> IgnoredFiles;
158 
159 private:
setCachedEntry(StringRef Filename,const CachedFileSystemEntry * Entry)160   void setCachedEntry(StringRef Filename, const CachedFileSystemEntry *Entry) {
161     bool IsInserted = Cache.try_emplace(Filename, Entry).second;
162     (void)IsInserted;
163     assert(IsInserted && "local cache is updated more than once");
164   }
165 
getCachedEntry(StringRef Filename)166   const CachedFileSystemEntry *getCachedEntry(StringRef Filename) {
167     auto It = Cache.find(Filename);
168     return It == Cache.end() ? nullptr : It->getValue();
169   }
170 
171   llvm::ErrorOr<const CachedFileSystemEntry *>
172   getOrCreateFileSystemEntry(const StringRef Filename);
173 
174   DependencyScanningFilesystemSharedCache &SharedCache;
175   /// The local cache is used by the worker thread to cache file system queries
176   /// locally instead of querying the global cache every time.
177   llvm::StringMap<const CachedFileSystemEntry *, llvm::BumpPtrAllocator> Cache;
178   /// The optional mapping structure which records information about the
179   /// excluded conditional directive skip mappings that are used by the
180   /// currently active preprocessor.
181   ExcludedPreprocessorDirectiveSkipMapping *PPSkipMappings;
182 };
183 
184 } // end namespace dependencies
185 } // end namespace tooling
186 } // end namespace clang
187 
188 #endif // LLVM_CLANG_TOOLING_DEPENDENCY_SCANNING_FILESYSTEM_H
189