1 //===--- GlobalModuleIndex.h - Global Module Index --------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines the GlobalModuleIndex class, which manages a global index
11 // containing all of the identifiers known to the various modules within a given
12 // subdirectory of the module cache. It is used to improve the performance of
13 // queries such as "do any modules know about this identifier?"
14 //
15 //===----------------------------------------------------------------------===//
16 #ifndef LLVM_CLANG_SERIALIZATION_GLOBALMODULEINDEX_H
17 #define LLVM_CLANG_SERIALIZATION_GLOBALMODULEINDEX_H
18 
19 #include "llvm/ADT/DenseMap.h"
20 #include "llvm/ADT/SmallPtrSet.h"
21 #include "llvm/ADT/SmallVector.h"
22 #include "llvm/ADT/StringMap.h"
23 #include "llvm/ADT/StringRef.h"
24 #include <memory>
25 #include <utility>
26 
// Forward declarations of the LLVM types that the class below names only in
// declarations (a constructor parameter and a std::unique_ptr member), so
// their defining headers are not included from here.
namespace llvm {
class BitstreamCursor;
class MemoryBuffer;
}
31 
32 namespace clang {
33 
// Forward declarations of Clang types, so that this header does not have to
// include the headers that define them.
// NOTE(review): DirectoryEntry and FileEntry are not referenced anywhere else
// in this header -- confirm whether these two declarations are still needed.
class DirectoryEntry;
class FileEntry;
class FileManager;
class IdentifierIterator;

namespace serialization {
  class ModuleFile;
}

// Make these LLVM and serialization names usable without qualification inside
// the clang namespace; the declarations below rely on the short spellings.
using llvm::SmallVector;
using llvm::SmallVectorImpl;
using llvm::StringRef;
using serialization::ModuleFile;
47 
48 /// \brief A global index for a set of module files, providing information about
49 /// the identifiers within those module files.
50 ///
51 /// The global index is an aid for name lookup into modules, offering a central
52 /// place where one can look for identifiers determine which
53 /// module files contain any information about that identifier. This
54 /// allows the client to restrict the search to only those module files known
55 /// to have a information about that identifier, improving performance. Moreover,
56 /// the global module index may know about module files that have not been
57 /// imported, and can be queried to determine which modules the current
58 /// translation could or should load to fix a problem.
59 class GlobalModuleIndex {
60   /// \brief Buffer containing the index file, which is lazily accessed so long
61   /// as the global module index is live.
62   std::unique_ptr<llvm::MemoryBuffer> Buffer;
63 
64   /// \brief The hash table.
65   ///
66   /// This pointer actually points to a IdentifierIndexTable object,
67   /// but that type is only accessible within the implementation of
68   /// GlobalModuleIndex.
69   void *IdentifierIndex;
70 
71   /// \brief Information about a given module file.
72   struct ModuleInfo {
ModuleInfoModuleInfo73     ModuleInfo() : File(), Size(), ModTime() { }
74 
75     /// \brief The module file, once it has been resolved.
76     ModuleFile *File;
77 
78     /// \brief The module file name.
79     std::string FileName;
80 
81     /// \brief Size of the module file at the time the global index was built.
82     off_t Size;
83 
84     /// \brief Modification time of the module file at the time the global
85     /// index was built.
86     time_t ModTime;
87 
88     /// \brief The module IDs on which this module directly depends.
89     /// FIXME: We don't really need a vector here.
90     llvm::SmallVector<unsigned, 4> Dependencies;
91   };
92 
93   /// \brief A mapping from module IDs to information about each module.
94   ///
95   /// This vector may have gaps, if module files have been removed or have
96   /// been updated since the index was built. A gap is indicated by an empty
97   /// file name.
98   llvm::SmallVector<ModuleInfo, 16> Modules;
99 
100   /// \brief Lazily-populated mapping from module files to their
101   /// corresponding index into the \c Modules vector.
102   llvm::DenseMap<ModuleFile *, unsigned> ModulesByFile;
103 
104   /// \brief The set of modules that have not yet been resolved.
105   ///
106   /// The string is just the name of the module itself, which maps to the
107   /// module ID.
108   llvm::StringMap<unsigned> UnresolvedModules;
109 
110   /// \brief The number of identifier lookups we performed.
111   unsigned NumIdentifierLookups;
112 
113   /// \brief The number of identifier lookup hits, where we recognize the
114   /// identifier.
115   unsigned NumIdentifierLookupHits;
116 
117   /// \brief Internal constructor. Use \c readIndex() to read an index.
118   explicit GlobalModuleIndex(std::unique_ptr<llvm::MemoryBuffer> Buffer,
119                              llvm::BitstreamCursor Cursor);
120 
121   GlobalModuleIndex(const GlobalModuleIndex &) = delete;
122   GlobalModuleIndex &operator=(const GlobalModuleIndex &) = delete;
123 
124 public:
125   ~GlobalModuleIndex();
126 
127   /// \brief An error code returned when trying to read an index.
128   enum ErrorCode {
129     /// \brief No error occurred.
130     EC_None,
131     /// \brief No index was found.
132     EC_NotFound,
133     /// \brief Some other process is currently building the index; it is not
134     /// available yet.
135     EC_Building,
136     /// \brief There was an unspecified I/O error reading or writing the index.
137     EC_IOError
138   };
139 
140   /// \brief Read a global index file for the given directory.
141   ///
142   /// \param Path The path to the specific module cache where the module files
143   /// for the intended configuration reside.
144   ///
145   /// \returns A pair containing the global module index (if it exists) and
146   /// the error code.
147   static std::pair<GlobalModuleIndex *, ErrorCode>
148   readIndex(StringRef Path);
149 
150   /// \brief Returns an iterator for identifiers stored in the index table.
151   ///
152   /// The caller accepts ownership of the returned object.
153   IdentifierIterator *createIdentifierIterator() const;
154 
155   /// \brief Retrieve the set of modules that have up-to-date indexes.
156   ///
157   /// \param ModuleFiles Will be populated with the set of module files that
158   /// have been indexed.
159   void getKnownModules(SmallVectorImpl<ModuleFile *> &ModuleFiles);
160 
161   /// \brief Retrieve the set of module files on which the given module file
162   /// directly depends.
163   void getModuleDependencies(ModuleFile *File,
164                              SmallVectorImpl<ModuleFile *> &Dependencies);
165 
166   /// \brief A set of module files in which we found a result.
167   typedef llvm::SmallPtrSet<ModuleFile *, 4> HitSet;
168 
169   /// \brief Look for all of the module files with information about the given
170   /// identifier, e.g., a global function, variable, or type with that name.
171   ///
172   /// \param Name The identifier to look for.
173   ///
174   /// \param Hits Will be populated with the set of module files that have
175   /// information about this name.
176   ///
177   /// \returns true if the identifier is known to the index, false otherwise.
178   bool lookupIdentifier(StringRef Name, HitSet &Hits);
179 
180   /// \brief Note that the given module file has been loaded.
181   ///
182   /// \returns false if the global module index has information about this
183   /// module file, and true otherwise.
184   bool loadedModuleFile(ModuleFile *File);
185 
186   /// \brief Print statistics to standard error.
187   void printStats();
188 
189   /// \brief Print debugging view to standard error.
190   void dump();
191 
192   /// \brief Write a global index into the given
193   ///
194   /// \param FileMgr The file manager to use to load module files.
195   ///
196   /// \param Path The path to the directory containing module files, into
197   /// which the global index will be written.
198   static ErrorCode writeIndex(FileManager &FileMgr, StringRef Path);
199 };
200 
201 }
202 
203 #endif
204