1 //===--- Module.h - Module description --------------------------*- C++ -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines the Module class, which describes a module that has
11 // been loaded from an AST file.
13 //===----------------------------------------------------------------------===//
15 #ifndef LLVM_CLANG_SERIALIZATION_MODULE_H
16 #define LLVM_CLANG_SERIALIZATION_MODULE_H
18 #include "clang/Basic/FileManager.h"
19 #include "clang/Basic/Module.h"
20 #include "clang/Basic/SourceLocation.h"
21 #include "clang/Serialization/ASTBitCodes.h"
22 #include "clang/Serialization/ContinuousRangeMap.h"
23 #include "clang/Serialization/ModuleFileExtension.h"
24 #include "llvm/ADT/SetVector.h"
25 #include "llvm/Bitcode/BitstreamReader.h"
26 #include "llvm/Support/Endian.h"
// Forward declarations of two class templates, each parameterized on an Info
// type. Neither is referenced by name in the visible part of this header.
31 template <typename Info> class OnDiskChainedHashTable;
32 template <typename Info> class OnDiskIterableChainedHashTable;
40 namespace serialization {
// Forward declaration only; no definition appears in the visible part of this
// header.
43 class ASTDeclContextNameLookupTrait;
46 /// \brief Specifies the kind of module that has been loaded.
///
/// isModule() reports true for MK_ImplicitModule, MK_ExplicitModule and
/// MK_PrebuiltModule; the remaining kinds describe PCH files.
48 MK_ImplicitModule, ///< File is an implicitly-loaded module.
49 MK_ExplicitModule, ///< File is an explicitly-loaded module.
50 MK_PCH, ///< File is a PCH file treated as such.
51 MK_Preamble, ///< File is a PCH file treated as the preamble.
52 MK_MainFile, ///< File is a PCH file treated as the actual main file.
53 MK_PrebuiltModule ///< File is from a prebuilt module path.
56 /// \brief The input file that has been loaded from this AST file, along with
57 /// bools indicating whether this was an overridden buffer or if it was
58 /// out-of-date or not-found.
// The file entry pointer and a 2-bit state value are packed together; the
// accessors compare that state against Overridden, OutOfDate and NotFound.
65 llvm::PointerIntPair<const FileEntry *, 2, unsigned> Val;
/// \brief Construct an entry for \p File.
///
/// \param File the file entry to record.
/// \param isOverridden whether the file was an overridden buffer.
/// \param isOutOfDate whether the file was out-of-date.
///
/// The two flags are mutually exclusive, which the assertion below enforces.
/// The pointer and the state value are stored together in Val.
69 InputFile(const FileEntry *File,
70 bool isOverridden = false, bool isOutOfDate = false) {
71 assert(!(isOverridden && isOutOfDate) &&
72 "an overridden cannot be out-of-date");
// NOTE(review): the computation of intVal is not visible in this excerpt;
// presumably it maps the two flags to Overridden / OutOfDate -- confirm.
78 Val.setPointerAndInt(File, intVal);
/// \brief Produce an InputFile whose state is set to NotFound.
// NOTE(review): the declaration of the local File and the return statement
// are not visible in this excerpt; presumably File is what is returned.
81 static InputFile getNotFound() {
83 File.Val.setInt(NotFound);
/// \brief The file entry stored in Val (the pointer half of the pair).
87 const FileEntry *getFile() const { return Val.getPointer(); }
/// \brief Whether the state stored in Val equals Overridden.
88 bool isOverridden() const { return Val.getInt() == Overridden; }
/// \brief Whether the state stored in Val equals OutOfDate.
89 bool isOutOfDate() const { return Val.getInt() == OutOfDate; }
/// \brief Whether the state stored in Val equals NotFound.
90 bool isNotFound() const { return Val.getInt() == NotFound; }
93 /// \brief Information about a module that has been loaded by the ASTReader.
95 /// Each instance of the Module class corresponds to a single AST file, which
96 /// may be a precompiled header, precompiled preamble, a module, or an AST file
97 /// of some sort loaded as the main file, all of which are specific formulations
98 /// of the general notion of a "module". A module may depend on any number of
/// other modules.
/// \brief Create a module file description.
///
/// \param Kind the kind of module file; stored in the Kind member.
/// \param Generation the generation this module file is a part of; stored in
/// the Generation member.
102 ModuleFile(ModuleKind Kind, unsigned Generation)
103 : Kind(Kind), Generation(Generation) {}
106 // === General information ===
108 /// \brief The index of this module in the list of modules.
// NOTE(review): the declaration this comment documents is not present in
// this excerpt.
111 /// \brief The type of this module.
// NOTE(review): no declaration follows this comment here; the constructor
// initializes a member named Kind, which is presumably what it documents.
114 /// \brief The file name of the module file.
115 std::string FileName;
117 /// \brief The name of the module.
118 std::string ModuleName;
120 /// \brief The base directory of the module.
121 std::string BaseDirectory;
/// \brief Returns FileName with the suffix ".timestamp" appended.
123 std::string getTimestampFilename() const {
124 return FileName + ".timestamp";
127 /// \brief The original source file name that was used to build the
128 /// primary AST file, which may have been modified for
129 /// relocatable-pch support.
130 std::string OriginalSourceFileName;
132 /// \brief The actual original source file name that was used to
133 /// build this AST file.
134 std::string ActualOriginalSourceFileName;
136 /// \brief The file ID for the original source file that was used to
137 /// build this AST file.
138 FileID OriginalSourceFileID;
140 /// \brief The directory that the PCH was originally created in. Used to
141 /// allow resolving headers even after headers+PCH was moved to a new path.
142 std::string OriginalDir;
// NOTE(review): undocumented in the original; presumably the path of the
// module map associated with this module file -- TODO confirm.
144 std::string ModuleMapPath;
146 /// \brief Whether this precompiled header is a relocatable PCH file.
147 bool RelocatablePCH = false;
149 /// \brief Whether timestamps are included in this module file.
150 bool HasTimestamps = false;
152 /// \brief The file entry for the module file.
153 const FileEntry *File = nullptr;
155 /// \brief The signature of the module file, which may be used instead of the size
156 /// and modification time to identify this particular file.
157 ASTFileSignature Signature;
159 /// \brief Whether this module has been directly imported at some point
/// during translation (the value returned by isDirectlyImported()).
161 bool DirectlyImported = false;
163 /// \brief The generation of which this module file is a part.
// NOTE(review): no declaration follows this comment in this excerpt; the
// constructor initializes a member named Generation, which is presumably what
// it documents.
166 /// \brief The memory buffer that stores the data associated with
167 /// this AST file, owned by the PCMCache in the ModuleManager.
///
/// This is a non-owning pointer. It is initialized to null, like the other
/// pointer members of this class, so that it has a determinate value until a
/// buffer is assigned.
168 llvm::MemoryBuffer *Buffer = nullptr;
170 /// \brief The size of this file, in bits.
171 uint64_t SizeInBits = 0;
173 /// \brief The global bit offset (or base) of this module.
174 uint64_t GlobalBitOffset = 0;
176 /// \brief The serialized bitstream data for this file.
// NOTE(review): no declaration follows this comment in this excerpt.
179 /// \brief The main bitstream cursor for the main block.
180 llvm::BitstreamCursor Stream;
182 /// \brief The source location where the module was explicitly or implicitly
183 /// imported in the local translation unit.
///
185 /// If module A depends on and imports module B, both modules will have the
186 /// same DirectImportLoc, but different ImportLoc (B's ImportLoc will be a
187 /// source location inside module A).
///
189 /// WARNING: This is largely useless. It doesn't tell you when a module was
190 /// made visible, just when the first submodule of that module was imported.
191 SourceLocation DirectImportLoc;
193 /// \brief The source location where this module was first imported.
194 SourceLocation ImportLoc;
196 /// \brief The first source location in this module.
197 SourceLocation FirstLoc;
199 /// \brief The list of extension readers that are attached to this module
/// file.
201 std::vector<std::unique_ptr<ModuleFileExtensionReader>> ExtensionReaders;
203 /// \brief The module offset map data for this file. If non-empty, the various
204 /// ContinuousRangeMaps described below have not yet been populated.
205 StringRef ModuleOffsetMap;
207 // === Input Files ===
208 /// \brief The cursor to the start of the input-files block.
209 llvm::BitstreamCursor InputFilesCursor;
211 /// \brief Offsets for all of the input file entries in the AST file.
///
/// The element type is an unaligned 64-bit unsigned integer.
212 const llvm::support::unaligned_uint64_t *InputFileOffsets = nullptr;
214 /// \brief The input files that have been loaded from this AST file.
215 std::vector<InputFile> InputFilesLoaded;
217 // All user input files reside at the index range [0, NumUserInputFiles), and
218 // system input files reside at [NumUserInputFiles, InputFilesLoaded.size()).
219 unsigned NumUserInputFiles = 0;
221 /// \brief If non-zero, specifies the time when we last validated input
222 /// files. Zero means we never validated them.
///
224 /// The time is specified in seconds since the start of the Epoch.
225 uint64_t InputFilesValidationTimestamp = 0;
227 // === Source Locations ===
229 /// \brief Cursor used to read source location entries.
230 llvm::BitstreamCursor SLocEntryCursor;
232 /// \brief The number of source location entries in this AST file.
233 unsigned LocalNumSLocEntries = 0;
235 /// \brief The base ID in the source manager's view of this module.
236 int SLocEntryBaseID = 0;
238 /// \brief The base offset in the source manager's view of this module.
239 unsigned SLocEntryBaseOffset = 0;
241 /// \brief Offsets for all of the source location entries in the
/// AST file.
243 const uint32_t *SLocEntryOffsets = nullptr;
245 /// \brief SLocEntries that we're going to preload.
246 SmallVector<uint64_t, 4> PreloadSLocEntries;
248 /// \brief Remapping table for source locations in this module.
249 ContinuousRangeMap<uint32_t, int, 2> SLocRemap;
251 // === Identifiers ===
253 /// \brief The number of identifiers in this AST file.
254 unsigned LocalNumIdentifiers = 0;
256 /// \brief Offsets into the identifier table data.
///
258 /// This array is indexed by the identifier ID (-1), and provides
259 /// the offset into IdentifierTableData where the string data is
/// stored.
261 const uint32_t *IdentifierOffsets = nullptr;
263 /// \brief Base identifier ID for identifiers local to this module.
264 serialization::IdentID BaseIdentifierID = 0;
266 /// \brief Remapping table for identifier IDs in this module.
267 ContinuousRangeMap<uint32_t, int, 2> IdentifierRemap;
269 /// \brief Actual data for the on-disk hash table of identifiers.
///
271 /// This pointer points into a memory buffer, where the on-disk hash
272 /// table for identifiers actually lives.
273 const char *IdentifierTableData = nullptr;
275 /// \brief A pointer to an on-disk hash table of opaque type
276 /// IdentifierHashTable.
277 void *IdentifierLookupTable = nullptr;
279 /// \brief Offsets of identifiers that we're going to preload within
280 /// IdentifierTableData.
281 std::vector<unsigned> PreloadIdentifierOffsets;
// === Macros ===
285 /// \brief The cursor to the start of the preprocessor block, which stores
286 /// all of the macro definitions.
287 llvm::BitstreamCursor MacroCursor;
289 /// \brief The number of macros in this AST file.
290 unsigned LocalNumMacros = 0;
292 /// \brief Offsets of macros in the preprocessor block.
///
294 /// This array is indexed by the macro ID (-1), and provides
295 /// the offset into the preprocessor block where macro definitions are
/// stored.
297 const uint32_t *MacroOffsets = nullptr;
299 /// \brief Base macro ID for macros local to this module.
300 serialization::MacroID BaseMacroID = 0;
302 /// \brief Remapping table for macro IDs in this module.
303 ContinuousRangeMap<uint32_t, int, 2> MacroRemap;
305 /// \brief The offset of the start of the set of defined macros.
306 uint64_t MacroStartOffset = 0;
308 // === Detailed PreprocessingRecord ===
310 /// \brief The cursor to the start of the (optional) detailed preprocessing
/// record.
312 llvm::BitstreamCursor PreprocessorDetailCursor;
314 /// \brief The offset of the start of the preprocessor detail cursor.
315 uint64_t PreprocessorDetailStartOffset = 0;
317 /// \brief Base preprocessed entity ID for preprocessed entities local to
/// this module.
319 serialization::PreprocessedEntityID BasePreprocessedEntityID = 0;
321 /// \brief Remapping table for preprocessed entity IDs in this module.
322 ContinuousRangeMap<uint32_t, int, 2> PreprocessedEntityRemap;
// NOTE(review): undocumented in the original; presumably an array of offsets
// for the preprocessed entities of this module -- TODO confirm.
324 const PPEntityOffset *PreprocessedEntityOffsets = nullptr;
// NOTE(review): presumably the number of entries in
// PreprocessedEntityOffsets -- TODO confirm.
325 unsigned NumPreprocessedEntities = 0;
327 // === Header search information ===
329 /// \brief The number of local HeaderFileInfo structures.
330 unsigned LocalNumHeaderFileInfos = 0;
332 /// \brief Actual data for the on-disk hash table of header file
/// information.
///
335 /// This pointer points into a memory buffer, where the on-disk hash
336 /// table for header file information actually lives.
337 const char *HeaderFileInfoTableData = nullptr;
339 /// \brief The on-disk hash table that contains information about each of
340 /// the header files.
///
/// Stored as an opaque void pointer.
341 void *HeaderFileInfoTable = nullptr;
343 // === Submodule information ===
344 /// \brief The number of submodules in this module.
345 unsigned LocalNumSubmodules = 0;
347 /// \brief Base submodule ID for submodules local to this module.
348 serialization::SubmoduleID BaseSubmoduleID = 0;
350 /// \brief Remapping table for submodule IDs in this module.
351 ContinuousRangeMap<uint32_t, int, 2> SubmoduleRemap;
// === Selectors ===
355 /// \brief The number of selectors new to this file.
///
357 /// This is the number of entries in SelectorOffsets.
358 unsigned LocalNumSelectors = 0;
360 /// \brief Offsets into the selector lookup table's data array
361 /// where each selector resides.
362 const uint32_t *SelectorOffsets = nullptr;
364 /// \brief Base selector ID for selectors local to this module.
365 serialization::SelectorID BaseSelectorID = 0;
367 /// \brief Remapping table for selector IDs in this module.
368 ContinuousRangeMap<uint32_t, int, 2> SelectorRemap;
370 /// \brief A pointer to the character data that comprises the selector table.
///
372 /// The SelectorOffsets table refers into this memory.
373 const unsigned char *SelectorLookupTableData = nullptr;
375 /// \brief A pointer to an on-disk hash table of opaque type
376 /// ASTSelectorLookupTable.
///
378 /// This hash table provides the IDs of all selectors, and the associated
379 /// instance and factory methods.
380 void *SelectorLookupTable = nullptr;
382 // === Declarations ===
384 /// DeclsCursor - This is a cursor to the start of the DECLS_BLOCK block. It
385 /// has read all the abbreviations at the start of the block and is ready to
386 /// jump around with these in context.
387 llvm::BitstreamCursor DeclsCursor;
389 /// \brief The number of declarations in this AST file.
390 unsigned LocalNumDecls = 0;
392 /// \brief Offset of each declaration within the bitstream, indexed
393 /// by the declaration ID (-1).
394 const DeclOffset *DeclOffsets = nullptr;
396 /// \brief Base declaration ID for declarations local to this module.
397 serialization::DeclID BaseDeclID = 0;
399 /// \brief Remapping table for declaration IDs in this module.
400 ContinuousRangeMap<uint32_t, int, 2> DeclRemap;
402 /// \brief Mapping from the module files that this module file depends on
403 /// to the base declaration ID for that module as it is understood within this
/// module.
///
406 /// This is effectively a reverse global-to-local mapping for declaration
407 /// IDs, so that we can interpret a true global ID (for this translation unit)
408 /// as a local ID (for this module file).
409 llvm::DenseMap<ModuleFile *, serialization::DeclID> GlobalToLocalDeclIDs;
411 /// \brief Array of file-level DeclIDs sorted by file.
412 const serialization::DeclID *FileSortedDecls = nullptr;
// NOTE(review): undocumented in the original; presumably the number of
// entries in FileSortedDecls -- TODO confirm.
413 unsigned NumFileSortedDecls = 0;
415 /// \brief Array of category list location information within this
416 /// module file, sorted by the definition ID.
417 const serialization::ObjCCategoriesInfo *ObjCCategoriesMap = nullptr;
419 /// \brief The number of redeclaration info entries in ObjCCategoriesMap.
420 unsigned LocalNumObjCCategoriesInMap = 0;
422 /// \brief The Objective-C category lists for categories known to this
/// module.
424 SmallVector<uint64_t, 1> ObjCCategories;
// === Types ===
428 /// \brief The number of types in this AST file.
429 unsigned LocalNumTypes = 0;
431 /// \brief Offset of each type within the bitstream, indexed by the
432 /// type ID, or the representation of a Type*.
433 const uint32_t *TypeOffsets = nullptr;
435 /// \brief Base type ID for types local to this module as represented in
436 /// the global type ID space.
437 serialization::TypeID BaseTypeIndex = 0;
439 /// \brief Remapping table for type IDs in this module.
440 ContinuousRangeMap<uint32_t, int, 2> TypeRemap;
442 // === Miscellaneous ===
444 /// \brief Diagnostic IDs and their mappings that the user changed.
445 SmallVector<uint64_t, 8> PragmaDiagMappings;
447 /// \brief List of modules which depend on this module.
448 llvm::SetVector<ModuleFile *> ImportedBy;
450 /// \brief List of modules which this module depends on.
451 llvm::SetVector<ModuleFile *> Imports;
453 /// \brief Determine whether this module was directly imported at
454 /// any point during translation.
///
/// \returns the current value of the DirectlyImported flag.
455 bool isDirectlyImported() const { return DirectlyImported; }
457 /// \brief Is this a module file for a module (rather than a PCH or similar).
///
/// \returns true when Kind is MK_ImplicitModule, MK_ExplicitModule or
/// MK_PrebuiltModule, and false for every other kind.
458 bool isModule() const {
459 return Kind == MK_ImplicitModule || Kind == MK_ExplicitModule ||
460 Kind == MK_PrebuiltModule;
463 /// \brief Dump debugging output for this module.
467 } // end namespace serialization
469 } // end namespace clang