Coverage Report

Created: 2024-01-17 10:31

/src/llvm-project/clang/include/clang/Serialization/ASTWriter.h
Line
Count
Source (jump to first uncovered line)
1
//===- ASTWriter.h - AST File Writer ----------------------------*- C++ -*-===//
2
//
3
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4
// See https://llvm.org/LICENSE.txt for license information.
5
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6
//
7
//===----------------------------------------------------------------------===//
8
//
9
//  This file defines the ASTWriter class, which writes an AST file
10
//  containing a serialized representation of a translation unit.
11
//
12
//===----------------------------------------------------------------------===//
13
14
#ifndef LLVM_CLANG_SERIALIZATION_ASTWRITER_H
15
#define LLVM_CLANG_SERIALIZATION_ASTWRITER_H
16
17
#include "clang/AST/ASTMutationListener.h"
18
#include "clang/AST/Decl.h"
19
#include "clang/AST/Type.h"
20
#include "clang/Basic/LLVM.h"
21
#include "clang/Basic/Module.h"
22
#include "clang/Basic/SourceLocation.h"
23
#include "clang/Sema/Sema.h"
24
#include "clang/Sema/SemaConsumer.h"
25
#include "clang/Serialization/ASTBitCodes.h"
26
#include "clang/Serialization/ASTDeserializationListener.h"
27
#include "clang/Serialization/PCHContainerOperations.h"
28
#include "clang/Serialization/SourceLocationEncoding.h"
29
#include "llvm/ADT/ArrayRef.h"
30
#include "llvm/ADT/DenseMap.h"
31
#include "llvm/ADT/DenseSet.h"
32
#include "llvm/ADT/MapVector.h"
33
#include "llvm/ADT/STLExtras.h"
34
#include "llvm/ADT/SetVector.h"
35
#include "llvm/ADT/SmallVector.h"
36
#include "llvm/ADT/StringRef.h"
37
#include "llvm/Bitstream/BitstreamWriter.h"
38
#include <cassert>
39
#include <cstddef>
40
#include <cstdint>
41
#include <ctime>
42
#include <memory>
43
#include <queue>
44
#include <string>
45
#include <utility>
46
#include <vector>
47
48
namespace clang {
49
50
class ASTContext;
51
class ASTReader;
52
class Attr;
53
class CXXRecordDecl;
54
class FileEntry;
55
class FPOptionsOverride;
56
class FunctionDecl;
57
class HeaderSearch;
58
class HeaderSearchOptions;
59
class IdentifierResolver;
60
class LangOptions;
61
class MacroDefinitionRecord;
62
class MacroInfo;
63
class Module;
64
class InMemoryModuleCache;
65
class ModuleFileExtension;
66
class ModuleFileExtensionWriter;
67
class NamedDecl;
68
class ObjCInterfaceDecl;
69
class PreprocessingRecord;
70
class Preprocessor;
71
class RecordDecl;
72
class Sema;
73
class SourceManager;
74
class Stmt;
75
class StoredDeclsList;
76
class SwitchCase;
77
class Token;
78
79
/// Writes an AST file containing the contents of a translation unit.
80
///
81
/// The ASTWriter class produces a bitstream containing the serialized
82
/// representation of a given abstract syntax tree and its supporting
83
/// data structures. This bitstream can be de-serialized via an
84
/// instance of the ASTReader class.
85
class ASTWriter : public ASTDeserializationListener,
86
                  public ASTMutationListener {
87
public:
88
  friend class ASTDeclWriter;
89
  friend class ASTRecordWriter;
90
91
  using RecordData = SmallVector<uint64_t, 64>;
92
  using RecordDataImpl = SmallVectorImpl<uint64_t>;
93
  using RecordDataRef = ArrayRef<uint64_t>;
94
95
private:
96
  /// Map that provides the ID numbers of each type within the
97
  /// output stream, plus those deserialized from a chained PCH.
98
  ///
99
  /// The ID numbers of types are consecutive (in order of discovery)
100
  /// and start at 1. 0 is reserved for NULL. When types are actually
101
  /// stored in the stream, the ID number is shifted by 2 bits to
102
  /// allow for the const/volatile qualifiers.
103
  ///
104
  /// Keys in the map never have const/volatile qualifiers.
105
  using TypeIdxMap = llvm::DenseMap<QualType, serialization::TypeIdx,
106
                                    serialization::UnsafeQualTypeDenseMapInfo>;
107
108
  using LocSeq = SourceLocationSequence;
109
110
  /// The bitstream writer used to emit this precompiled header.
111
  llvm::BitstreamWriter &Stream;
112
113
  /// The buffer associated with the bitstream.
114
  const SmallVectorImpl<char> &Buffer;
115
116
  /// The PCM manager which manages memory buffers for pcm files.
117
  InMemoryModuleCache &ModuleCache;
118
119
  /// The ASTContext we're writing.
120
  ASTContext *Context = nullptr;
121
122
  /// The preprocessor we're writing.
123
  Preprocessor *PP = nullptr;
124
125
  /// The reader of existing AST files, if we're chaining.
126
  ASTReader *Chain = nullptr;
127
128
  /// The module we're currently writing, if any.
129
  Module *WritingModule = nullptr;
130
131
  /// The byte range representing all the UNHASHED_CONTROL_BLOCK.
132
  std::pair<uint64_t, uint64_t> UnhashedControlBlockRange;
133
  /// The bit offset of the AST block hash blob.
134
  uint64_t ASTBlockHashOffset = 0;
135
  /// The bit offset of the signature blob.
136
  uint64_t SignatureOffset = 0;
137
138
  /// The bit offset of the first bit inside the AST_BLOCK.
139
  uint64_t ASTBlockStartOffset = 0;
140
141
  /// The byte range representing all the AST_BLOCK.
142
  std::pair<uint64_t, uint64_t> ASTBlockRange;
143
144
  /// The base directory for any relative paths we emit.
145
  std::string BaseDirectory;
146
147
  /// Indicates whether timestamps should be written to the produced
148
  /// module file. This is the case for files implicitly written to the
149
  /// module cache, where we need the timestamps to determine if the module
150
  /// file is up to date, but not otherwise.
151
  bool IncludeTimestamps;
152
153
  /// Indicates whether the AST file being written is an implicit module.
154
  /// If that's the case, we may be able to skip writing some information that
155
  /// is guaranteed to be the same in the importer by the context hash.
156
  bool BuildingImplicitModule = false;
157
158
  /// Indicates when the AST writing is actively performing
159
  /// serialization, rather than just queueing updates.
160
  bool WritingAST = false;
161
162
  /// Indicates that we are done serializing the collection of decls
163
  /// and types to emit.
164
  bool DoneWritingDeclsAndTypes = false;
165
166
  /// Indicates that the AST contained compiler errors.
167
  bool ASTHasCompilerErrors = false;
168
169
  /// Mapping from input file entries to the index into the
170
  /// offset table where information about that input file is stored.
171
  llvm::DenseMap<const FileEntry *, uint32_t> InputFileIDs;
172
173
  /// Stores a declaration or a type to be written to the AST file.
174
  class DeclOrType { // Holds either a Decl* or a QualType in one opaque slot.
175
  public:
176
0
    DeclOrType(Decl *D) : Stored(D), IsType(false) {} // Wraps a declaration.
177
0
    DeclOrType(QualType T) : Stored(T.getAsOpaquePtr()), IsType(true) {} // Wraps a type via its opaque pointer.
178
179
0
    bool isType() const { return IsType; }
180
0
    bool isDecl() const { return !IsType; }
181
182
0
    QualType getType() const { // Asserts that a type is stored.
183
0
      assert(isType() && "Not a type!");
184
0
      return QualType::getFromOpaquePtr(Stored);
185
0
    }
186
187
0
    Decl *getDecl() const { // Asserts that a declaration is stored.
188
0
      assert(isDecl() && "Not a decl!");
189
0
      return static_cast<Decl *>(Stored);
190
0
    }
191
192
  private:
193
    void *Stored; // Decl pointer, or the QualType's opaque pointer when IsType is true.
194
    bool IsType; // Tells which of the two interpretations of Stored applies.
195
  };
196
197
  /// The declarations and types to emit.
198
  std::queue<DeclOrType> DeclTypesToEmit;
199
200
  /// The first ID number we can use for our own declarations.
201
  serialization::DeclID FirstDeclID = serialization::NUM_PREDEF_DECL_IDS;
202
203
  /// The decl ID that will be assigned to the next new decl.
204
  serialization::DeclID NextDeclID = FirstDeclID;
205
206
  /// Map that provides the ID numbers of each declaration within
207
  /// the output stream, as well as those deserialized from a chained PCH.
208
  ///
209
  /// The ID numbers of declarations are consecutive (in order of
210
  /// discovery) and start at 2. 1 is reserved for the translation
211
  /// unit, while 0 is reserved for NULL.
212
  llvm::DenseMap<const Decl *, serialization::DeclID> DeclIDs;
213
214
  /// Offset of each declaration in the bitstream, indexed by
215
  /// the declaration's ID.
216
  std::vector<serialization::DeclOffset> DeclOffsets;
217
218
  /// The offset of the DECLTYPES_BLOCK. The offsets in DeclOffsets
219
  /// are relative to this value.
220
  uint64_t DeclTypesBlockStartOffset = 0;
221
222
  /// Sorted (by file offset) vector of pairs of file offset/DeclID.
223
  using LocDeclIDsTy =
224
      SmallVector<std::pair<unsigned, serialization::DeclID>, 64>;
225
  struct DeclIDInFileInfo {
226
    LocDeclIDsTy DeclIDs;
227
228
    /// Set when the DeclIDs vectors from all files are joined, this
229
    /// indicates the index that this particular vector has in the global one.
230
    unsigned FirstDeclIndex;
231
  };
232
  using FileDeclIDsTy =
233
      llvm::DenseMap<FileID, std::unique_ptr<DeclIDInFileInfo>>;
234
235
  /// Map from file SLocEntries to info about the file-level declarations
236
  /// that it contains.
237
  FileDeclIDsTy FileDeclIDs;
238
239
  void associateDeclWithFile(const Decl *D, serialization::DeclID);
240
241
  /// The first ID number we can use for our own types.
242
  serialization::TypeID FirstTypeID = serialization::NUM_PREDEF_TYPE_IDS;
243
244
  /// The type ID that will be assigned to the next new type.
245
  serialization::TypeID NextTypeID = FirstTypeID;
246
247
  /// Map that provides the ID numbers of each type within the
248
  /// output stream, plus those deserialized from a chained PCH.
249
  ///
250
  /// The ID numbers of types are consecutive (in order of discovery)
251
  /// and start at 1. 0 is reserved for NULL. When types are actually
252
  /// stored in the stream, the ID number is shifted by 2 bits to
253
  /// allow for the const/volatile qualifiers.
254
  ///
255
  /// Keys in the map never have const/volatile qualifiers.
256
  TypeIdxMap TypeIdxs;
257
258
  /// Offset of each type in the bitstream, indexed by
259
  /// the type's ID.
260
  std::vector<serialization::UnderalignedInt64> TypeOffsets;
261
262
  /// The first ID number we can use for our own identifiers.
263
  serialization::IdentID FirstIdentID = serialization::NUM_PREDEF_IDENT_IDS;
264
265
  /// The identifier ID that will be assigned to the next new identifier.
266
  serialization::IdentID NextIdentID = FirstIdentID;
267
268
  /// Map that provides the ID numbers of each identifier in
269
  /// the output stream.
270
  ///
271
  /// The ID numbers for identifiers are consecutive (in order of
272
  /// discovery), starting at 1. An ID of zero refers to a NULL
273
  /// IdentifierInfo.
274
  llvm::MapVector<const IdentifierInfo *, serialization::IdentID> IdentifierIDs;
275
276
  /// The first ID number we can use for our own macros.
277
  serialization::MacroID FirstMacroID = serialization::NUM_PREDEF_MACRO_IDS;
278
279
  /// The macro ID that will be assigned to the next new macro.
280
  serialization::MacroID NextMacroID = FirstMacroID;
281
282
  /// Map that provides the ID numbers of each macro.
283
  llvm::DenseMap<MacroInfo *, serialization::MacroID> MacroIDs;
284
285
  struct MacroInfoToEmitData {
286
    const IdentifierInfo *Name;
287
    MacroInfo *MI;
288
    serialization::MacroID ID;
289
  };
290
291
  /// The macro infos to emit.
292
  std::vector<MacroInfoToEmitData> MacroInfosToEmit;
293
294
  llvm::DenseMap<const IdentifierInfo *, uint32_t>
295
      IdentMacroDirectivesOffsetMap;
296
297
  /// @name FlushStmt Caches
298
  /// @{
299
300
  /// Set of parent Stmts for the currently serializing sub-stmt.
301
  llvm::DenseSet<Stmt *> ParentStmts;
302
303
  /// Offsets of sub-stmts already serialized. The offset points
304
  /// just after the stmt record.
305
  llvm::DenseMap<Stmt *, uint64_t> SubStmtEntries;
306
307
  /// @}
308
309
  /// Offsets of each of the identifier IDs into the identifier
310
  /// table.
311
  std::vector<uint32_t> IdentifierOffsets;
312
313
  /// The first ID number we can use for our own submodules.
314
  serialization::SubmoduleID FirstSubmoduleID =
315
      serialization::NUM_PREDEF_SUBMODULE_IDS;
316
317
  /// The submodule ID that will be assigned to the next new submodule.
318
  serialization::SubmoduleID NextSubmoduleID = FirstSubmoduleID;
319
320
  /// The first ID number we can use for our own selectors.
321
  serialization::SelectorID FirstSelectorID =
322
      serialization::NUM_PREDEF_SELECTOR_IDS;
323
324
  /// The selector ID that will be assigned to the next new selector.
325
  serialization::SelectorID NextSelectorID = FirstSelectorID;
326
327
  /// Map that provides the ID numbers of each Selector.
328
  llvm::MapVector<Selector, serialization::SelectorID> SelectorIDs;
329
330
  /// Offset of each selector within the method pool/selector
331
  /// table, indexed by the Selector ID (-1).
332
  std::vector<uint32_t> SelectorOffsets;
333
334
  /// Mapping from macro definitions (as they occur in the preprocessing
335
  /// record) to the macro IDs.
336
  llvm::DenseMap<const MacroDefinitionRecord *,
337
                 serialization::PreprocessedEntityID> MacroDefinitions;
338
339
  /// Cache of indices of anonymous declarations within their lexical
340
  /// contexts.
341
  llvm::DenseMap<const Decl *, unsigned> AnonymousDeclarationNumbers;
342
343
  /// An update to a Decl.
344
  class DeclUpdate { // A kind tag plus one payload value stored in an anonymous union.
345
    /// A DeclUpdateKind.
346
    unsigned Kind;
347
    union { // Exactly one member is initialized, chosen by the constructor used.
348
      const Decl *Dcl;
349
      void *Type; // Opaque pointer form of a QualType (see getType()).
350
      SourceLocation::UIntTy Loc; // Raw encoding of a SourceLocation (see getLoc()).
351
      unsigned Val;
352
      Module *Mod;
353
      const Attr *Attribute;
354
    };
355
356
  public:
357
0
    DeclUpdate(unsigned Kind) : Kind(Kind), Dcl(nullptr) {} // No payload: Dcl is set to null.
358
0
    DeclUpdate(unsigned Kind, const Decl *Dcl) : Kind(Kind), Dcl(Dcl) {}
359
    DeclUpdate(unsigned Kind, QualType Type)
360
0
        : Kind(Kind), Type(Type.getAsOpaquePtr()) {}
361
    DeclUpdate(unsigned Kind, SourceLocation Loc)
362
0
        : Kind(Kind), Loc(Loc.getRawEncoding()) {}
363
0
    DeclUpdate(unsigned Kind, unsigned Val) : Kind(Kind), Val(Val) {}
364
0
    DeclUpdate(unsigned Kind, Module *M) : Kind(Kind), Mod(M) {}
365
    DeclUpdate(unsigned Kind, const Attr *Attribute)
366
0
          : Kind(Kind), Attribute(Attribute) {}
367
368
0
    unsigned getKind() const { return Kind; }
369
0
    const Decl *getDecl() const { return Dcl; } // The accessors below do not check Kind; callers must read the member that was stored.
370
0
    QualType getType() const { return QualType::getFromOpaquePtr(Type); }
371
372
0
    SourceLocation getLoc() const { // Rebuilds the location from its raw encoding.
373
0
      return SourceLocation::getFromRawEncoding(Loc);
374
0
    }
375
376
0
    unsigned getNumber() const { return Val; }
377
0
    Module *getModule() const { return Mod; }
378
0
    const Attr *getAttr() const { return Attribute; }
379
  };
380
381
  using UpdateRecord = SmallVector<DeclUpdate, 1>;
382
  using DeclUpdateMap = llvm::MapVector<const Decl *, UpdateRecord>;
383
384
  /// Mapping from declarations that came from a chained PCH to the
385
  /// record containing modifications to them.
386
  DeclUpdateMap DeclUpdates;
387
388
  using FirstLatestDeclMap = llvm::DenseMap<Decl *, Decl *>;
389
390
  /// Map of first declarations from a chained PCH that point to the
391
  /// most recent declarations in another PCH.
392
  FirstLatestDeclMap FirstLatestDecls;
393
394
  /// Declarations encountered that might be external
395
  /// definitions.
396
  ///
397
  /// We keep track of external definitions and other 'interesting' declarations
398
  /// as we are emitting declarations to the AST file. The AST file contains a
399
  /// separate record for these declarations, which are provided to the AST
400
  /// consumer by the AST reader. This behavior is required to properly cope with,
401
  /// e.g., tentative variable definitions that occur within
402
  /// headers. The declarations themselves are stored as declaration
403
  /// IDs, since they will be written out to an EAGERLY_DESERIALIZED_DECLS
404
  /// record.
405
  SmallVector<serialization::DeclID, 16> EagerlyDeserializedDecls;
406
  SmallVector<serialization::DeclID, 16> ModularCodegenDecls;
407
408
  /// DeclContexts that have received extensions since their serialized
409
  /// form.
410
  ///
411
  /// For namespaces, when we're chaining and encountering a namespace, we check
412
  /// if its primary namespace comes from the chain. If it does, we add the
413
  /// primary to this set, so that we can write out lexical content updates for
414
  /// it.
415
  llvm::SmallSetVector<const DeclContext *, 16> UpdatedDeclContexts;
416
417
  /// Keeps track of declarations that we must emit, even though we're
418
  /// not guaranteed to be able to find them by walking the AST starting at the
419
  /// translation unit.
420
  SmallVector<const Decl *, 16> DeclsToEmitEvenIfUnreferenced;
421
422
  /// The set of Objective-C classes that have categories we
423
  /// should serialize.
424
  llvm::SetVector<ObjCInterfaceDecl *> ObjCClassesWithCategories;
425
426
  /// The set of declarations that may have redeclaration chains that
427
  /// need to be serialized.
428
  llvm::SmallVector<const Decl *, 16> Redeclarations;
429
430
  /// A cache of the first local declaration for "interesting"
431
  /// redeclaration chains.
432
  llvm::DenseMap<const Decl *, const Decl *> FirstLocalDeclCache;
433
434
  /// Mapping from SwitchCase statements to IDs.
435
  llvm::DenseMap<SwitchCase *, unsigned> SwitchCaseIDs;
436
437
  /// The number of statements written to the AST file.
438
  unsigned NumStatements = 0;
439
440
  /// The number of macros written to the AST file.
441
  unsigned NumMacros = 0;
442
443
  /// The number of lexical declcontexts written to the AST
444
  /// file.
445
  unsigned NumLexicalDeclContexts = 0;
446
447
  /// The number of visible declcontexts written to the AST
448
  /// file.
449
  unsigned NumVisibleDeclContexts = 0;
450
451
  /// A mapping from each known submodule to its ID number, which will
452
  /// be a positive integer.
453
  llvm::DenseMap<const Module *, unsigned> SubmoduleIDs;
454
455
  /// A list of the module file extension writers.
456
  std::vector<std::unique_ptr<ModuleFileExtensionWriter>>
457
      ModuleFileExtensionWriters;
458
459
  /// Mapping from a source location entry to whether it is affecting or not.
460
  llvm::BitVector IsSLocAffecting;
461
462
  /// Mapping from \c FileID to an index into the FileID adjustment table.
463
  std::vector<FileID> NonAffectingFileIDs;
464
  std::vector<unsigned> NonAffectingFileIDAdjustments;
465
466
  /// Mapping from an offset to an index into the offset adjustment table.
467
  std::vector<SourceRange> NonAffectingRanges;
468
  std::vector<SourceLocation::UIntTy> NonAffectingOffsetAdjustments;
469
470
  /// Collects input files that didn't affect compilation of the current module,
471
  /// and initializes data structures necessary for leaving those files out
472
  /// during \c SourceManager serialization.
473
  void collectNonAffectingInputFiles();
474
475
  /// Returns an adjusted \c FileID, accounting for any non-affecting input
476
  /// files.
477
  FileID getAdjustedFileID(FileID FID) const;
478
  /// Returns an adjusted number of \c FileIDs created within the specified \c
479
  /// FileID, accounting for any non-affecting input files.
480
  unsigned getAdjustedNumCreatedFIDs(FileID FID) const;
481
  /// Returns an adjusted \c SourceLocation, accounting for any non-affecting
482
  /// input files.
483
  SourceLocation getAdjustedLocation(SourceLocation Loc) const;
484
  /// Returns an adjusted \c SourceRange, accounting for any non-affecting input
485
  /// files.
486
  SourceRange getAdjustedRange(SourceRange Range) const;
487
  /// Returns an adjusted \c SourceLocation offset, accounting for any
488
  /// non-affecting input files.
489
  SourceLocation::UIntTy getAdjustedOffset(SourceLocation::UIntTy Offset) const;
490
  /// Returns an adjustment for offset into SourceManager, accounting for any
491
  /// non-affecting input files.
492
  SourceLocation::UIntTy getAdjustment(SourceLocation::UIntTy Offset) const;
493
494
  /// Retrieve or create a submodule ID for this module.
495
  unsigned getSubmoduleID(Module *Mod);
496
497
  /// Write the given subexpression to the bitstream.
498
  void WriteSubStmt(Stmt *S);
499
500
  void WriteBlockInfoBlock();
501
  void WriteControlBlock(Preprocessor &PP, ASTContext &Context,
502
                         StringRef isysroot);
503
504
  /// Write out the signature and diagnostic options (no value is returned
  /// here; see backpatchSignature()).
505
  void writeUnhashedControlBlock(Preprocessor &PP, ASTContext &Context);
506
  ASTFileSignature backpatchSignature();
507
508
  /// Calculate hash of the pcm content.
509
  std::pair<ASTFileSignature, ASTFileSignature> createSignature() const;
510
511
  void WriteInputFiles(SourceManager &SourceMgr, HeaderSearchOptions &HSOpts);
512
  void WriteSourceManagerBlock(SourceManager &SourceMgr,
513
                               const Preprocessor &PP);
514
  void WritePreprocessor(const Preprocessor &PP, bool IsModule);
515
  void WriteHeaderSearch(const HeaderSearch &HS);
516
  void WritePreprocessorDetail(PreprocessingRecord &PPRec,
517
                               uint64_t MacroOffsetsBase);
518
  void WriteSubmodules(Module *WritingModule);
519
520
  void WritePragmaDiagnosticMappings(const DiagnosticsEngine &Diag,
521
                                     bool isModule);
522
523
  unsigned TypeExtQualAbbrev = 0;
524
  void WriteTypeAbbrevs();
525
  void WriteType(QualType T);
526
527
  bool isLookupResultExternal(StoredDeclsList &Result, DeclContext *DC);
528
  bool isLookupResultEntirelyExternal(StoredDeclsList &Result, DeclContext *DC);
529
530
  void GenerateNameLookupTable(const DeclContext *DC,
531
                               llvm::SmallVectorImpl<char> &LookupTable);
532
  uint64_t WriteDeclContextLexicalBlock(ASTContext &Context, DeclContext *DC);
533
  uint64_t WriteDeclContextVisibleBlock(ASTContext &Context, DeclContext *DC);
534
  void WriteTypeDeclOffsets();
535
  void WriteFileDeclIDsMap();
536
  void WriteComments();
537
  void WriteSelectors(Sema &SemaRef);
538
  void WriteReferencedSelectorsPool(Sema &SemaRef);
539
  void WriteIdentifierTable(Preprocessor &PP, IdentifierResolver &IdResolver,
540
                            bool IsModule);
541
  void WriteDeclUpdatesBlocks(RecordDataImpl &OffsetsRecord);
542
  void WriteDeclContextVisibleUpdate(const DeclContext *DC);
543
  void WriteFPPragmaOptions(const FPOptionsOverride &Opts);
544
  void WriteOpenCLExtensions(Sema &SemaRef);
545
  void WriteCUDAPragmas(Sema &SemaRef);
546
  void WriteObjCCategories();
547
  void WriteLateParsedTemplates(Sema &SemaRef);
548
  void WriteOptimizePragmaOptions(Sema &SemaRef);
549
  void WriteMSStructPragmaOptions(Sema &SemaRef);
550
  void WriteMSPointersToMembersPragmaOptions(Sema &SemaRef);
551
  void WritePackPragmaOptions(Sema &SemaRef);
552
  void WriteFloatControlPragmaOptions(Sema &SemaRef);
553
  void WriteModuleFileExtension(Sema &SemaRef,
554
                                ModuleFileExtensionWriter &Writer);
555
556
  unsigned DeclParmVarAbbrev = 0;
557
  unsigned DeclContextLexicalAbbrev = 0;
558
  unsigned DeclContextVisibleLookupAbbrev = 0;
559
  unsigned UpdateVisibleAbbrev = 0;
560
  unsigned DeclRecordAbbrev = 0;
561
  unsigned DeclTypedefAbbrev = 0;
562
  unsigned DeclVarAbbrev = 0;
563
  unsigned DeclFieldAbbrev = 0;
564
  unsigned DeclEnumAbbrev = 0;
565
  unsigned DeclObjCIvarAbbrev = 0;
566
  unsigned DeclCXXMethodAbbrev = 0;
567
  unsigned DeclDependentNonTemplateCXXMethodAbbrev = 0;
568
  unsigned DeclTemplateCXXMethodAbbrev = 0;
569
  unsigned DeclMemberSpecializedCXXMethodAbbrev = 0;
570
  unsigned DeclTemplateSpecializedCXXMethodAbbrev = 0;
571
  unsigned DeclDependentSpecializationCXXMethodAbbrev = 0;
572
  unsigned DeclTemplateTypeParmAbbrev = 0;
573
  unsigned DeclUsingShadowAbbrev = 0;
574
575
  unsigned DeclRefExprAbbrev = 0;
576
  unsigned CharacterLiteralAbbrev = 0;
577
  unsigned IntegerLiteralAbbrev = 0;
578
  unsigned ExprImplicitCastAbbrev = 0;
579
  unsigned BinaryOperatorAbbrev = 0;
580
  unsigned CompoundAssignOperatorAbbrev = 0;
581
  unsigned CallExprAbbrev = 0;
582
  unsigned CXXOperatorCallExprAbbrev = 0;
583
  unsigned CXXMemberCallExprAbbrev = 0;
584
585
  unsigned CompoundStmtAbbrev = 0;
586
587
  void WriteDeclAbbrevs();
588
  void WriteDecl(ASTContext &Context, Decl *D);
589
590
  ASTFileSignature WriteASTCore(Sema &SemaRef, StringRef isysroot,
591
                                Module *WritingModule);
592
593
public:
594
  /// Create a new precompiled header writer that outputs to
595
  /// the given bitstream.
596
  ASTWriter(llvm::BitstreamWriter &Stream, SmallVectorImpl<char> &Buffer,
597
            InMemoryModuleCache &ModuleCache,
598
            ArrayRef<std::shared_ptr<ModuleFileExtension>> Extensions,
599
            bool IncludeTimestamps = true, bool BuildingImplicitModule = false);
600
  ~ASTWriter() override;
601
602
0
  ASTContext &getASTContext() const {
603
0
    assert(Context && "requested AST context when not writing AST");
604
0
    return *Context;
605
0
  }
606
607
  const LangOptions &getLangOpts() const;
608
609
  /// Get a timestamp for output into the AST file. The actual timestamp
610
  /// of the specified file may be ignored if we have been instructed to not
611
  /// include timestamps in the output file.
612
  time_t getTimestampForOutput(const FileEntry *E) const;
613
614
  /// Write a precompiled header for the given semantic analysis.
615
  ///
616
  /// \param SemaRef a reference to the semantic analysis object that processed
617
  /// the AST to be written into the precompiled header.
618
  ///
619
  /// \param WritingModule The module that we are writing. If null, we are
620
  /// writing a precompiled header.
621
  ///
622
  /// \param isysroot if non-empty, write a relocatable file whose headers
623
  /// are relative to the given system root. If we're writing a module, its
624
  /// build directory will be used in preference to this if both are available.
625
  ///
626
  /// \return the module signature, which eventually will be a hash of
627
  /// the module but currently is merely a random 32-bit number.
628
  ASTFileSignature WriteAST(Sema &SemaRef, StringRef OutputFile,
629
                            Module *WritingModule, StringRef isysroot,
630
                            bool ShouldCacheASTInMemory = false);
631
632
  /// Emit a token.
633
  void AddToken(const Token &Tok, RecordDataImpl &Record);
634
635
  /// Emit an AlignPackInfo.
636
  void AddAlignPackInfo(const Sema::AlignPackInfo &Info,
637
                        RecordDataImpl &Record);
638
639
  /// Emit a FileID.
640
  void AddFileID(FileID FID, RecordDataImpl &Record);
641
642
  /// Emit a source location.
643
  void AddSourceLocation(SourceLocation Loc, RecordDataImpl &Record,
644
                         LocSeq *Seq = nullptr);
645
646
  /// Emit a source range.
647
  void AddSourceRange(SourceRange Range, RecordDataImpl &Record,
648
                      LocSeq *Seq = nullptr);
649
650
  /// Emit a reference to an identifier.
651
  void AddIdentifierRef(const IdentifierInfo *II, RecordDataImpl &Record);
652
653
  /// Get the unique number used to refer to the given selector.
654
  serialization::SelectorID getSelectorRef(Selector Sel);
655
656
  /// Get the unique number used to refer to the given identifier.
657
  serialization::IdentID getIdentifierRef(const IdentifierInfo *II);
658
659
  /// Get the unique number used to refer to the given macro.
660
  serialization::MacroID getMacroRef(MacroInfo *MI, const IdentifierInfo *Name);
661
662
  /// Determine the ID of an already-emitted macro.
663
  serialization::MacroID getMacroID(MacroInfo *MI);
664
665
  uint32_t getMacroDirectivesOffset(const IdentifierInfo *Name);
666
667
  /// Emit a reference to a type.
668
  void AddTypeRef(QualType T, RecordDataImpl &Record);
669
670
  /// Force a type to be emitted and get its ID.
671
  serialization::TypeID GetOrCreateTypeID(QualType T);
672
673
  /// Determine the type ID of an already-emitted type.
674
  serialization::TypeID getTypeID(QualType T) const;
675
676
  /// Find the first local declaration of a given local redeclarable
677
  /// decl.
678
  const Decl *getFirstLocalDecl(const Decl *D);
679
680
  /// Is this a local declaration (that is, one that will be written to
681
  /// our AST file)? This is the case for declarations that are neither imported
682
  /// from another AST file nor predefined.
683
0
  bool IsLocalDecl(const Decl *D) {
684
0
    if (D->isFromASTFile())
685
0
      return false;
686
0
    auto I = DeclIDs.find(D);
687
0
    return (I == DeclIDs.end() ||
688
0
            I->second >= serialization::NUM_PREDEF_DECL_IDS);
689
0
  };
690
691
  /// Emit a reference to a declaration.
692
  void AddDeclRef(const Decl *D, RecordDataImpl &Record);
693
694
  /// Force a declaration to be emitted and get its ID.
695
  serialization::DeclID GetDeclRef(const Decl *D);
696
697
  /// Determine the declaration ID of an already-emitted
698
  /// declaration.
699
  serialization::DeclID getDeclID(const Decl *D);
700
701
  unsigned getAnonymousDeclarationNumber(const NamedDecl *D);
702
703
  /// Add a string to the given record.
704
  void AddString(StringRef Str, RecordDataImpl &Record);
705
706
  /// Convert a path from this build process into one that is appropriate
707
  /// for emission in the module file.
708
  bool PreparePathForOutput(SmallVectorImpl<char> &Path);
709
710
  /// Add a path to the given record.
711
  void AddPath(StringRef Path, RecordDataImpl &Record);
712
713
  /// Emit the current record with the given path as a blob.
714
  void EmitRecordWithPath(unsigned Abbrev, RecordDataRef Record,
715
                          StringRef Path);
716
717
  /// Add a version tuple to the given record
718
  void AddVersionTuple(const VersionTuple &Version, RecordDataImpl &Record);
719
720
  /// Retrieve or create a submodule ID for this module, or return 0 if
721
  /// the submodule is neither local (a submodule of the currently-written module)
722
  /// nor from an imported module.
723
  unsigned getLocalOrImportedSubmoduleID(const Module *Mod);
724
725
  /// Note that the identifier II occurs at the given offset
726
  /// within the identifier table.
727
  void SetIdentifierOffset(const IdentifierInfo *II, uint32_t Offset);
728
729
  /// Note that the selector Sel occurs at the given offset
730
  /// within the method pool/selector table.
731
  void SetSelectorOffset(Selector Sel, uint32_t Offset);
732
733
  /// Record an ID for the given switch-case statement.
734
  unsigned RecordSwitchCaseID(SwitchCase *S);
735
736
  /// Retrieve the ID for the given switch-case statement.
737
  unsigned getSwitchCaseID(SwitchCase *S);
738
739
  void ClearSwitchCaseIDs();
740
741
0
  unsigned getTypeExtQualAbbrev() const {
742
0
    return TypeExtQualAbbrev;
743
0
  }
744
745
0
  unsigned getDeclParmVarAbbrev() const { return DeclParmVarAbbrev; }
746
0
  unsigned getDeclRecordAbbrev() const { return DeclRecordAbbrev; }
747
0
  unsigned getDeclTypedefAbbrev() const { return DeclTypedefAbbrev; }
748
0
  unsigned getDeclVarAbbrev() const { return DeclVarAbbrev; }
749
0
  unsigned getDeclFieldAbbrev() const { return DeclFieldAbbrev; }
750
0
  unsigned getDeclEnumAbbrev() const { return DeclEnumAbbrev; }
751
0
  unsigned getDeclObjCIvarAbbrev() const { return DeclObjCIvarAbbrev; }
752
0
  unsigned getDeclCXXMethodAbbrev(FunctionDecl::TemplatedKind Kind) const { // Selects the stored CXX-method abbrev member matching Kind.
753
0
    switch (Kind) {
754
0
    case FunctionDecl::TK_NonTemplate:
755
0
      return DeclCXXMethodAbbrev;
756
0
    case FunctionDecl::TK_FunctionTemplate:
757
0
      return DeclTemplateCXXMethodAbbrev;
758
0
    case FunctionDecl::TK_MemberSpecialization:
759
0
      return DeclMemberSpecializedCXXMethodAbbrev;
760
0
    case FunctionDecl::TK_FunctionTemplateSpecialization:
761
0
      return DeclTemplateSpecializedCXXMethodAbbrev;
762
0
    case FunctionDecl::TK_DependentNonTemplate:
763
0
      return DeclDependentNonTemplateCXXMethodAbbrev;
764
0
    case FunctionDecl::TK_DependentFunctionTemplateSpecialization:
765
0
      return DeclDependentSpecializationCXXMethodAbbrev;
766
0
    }
767
0
    llvm_unreachable("Unknown Template Kind!"); // Reached only if Kind matches none of the cases above.
768
0
  }
769
0
  unsigned getDeclTemplateTypeParmAbbrev() const {
770
0
    return DeclTemplateTypeParmAbbrev;
771
0
  }
772
0
  /// Returns the current value of the DeclUsingShadowAbbrev member.
  unsigned getDeclUsingShadowAbbrev() const {
    return DeclUsingShadowAbbrev;
  }
773
774
0
  /// Returns the current value of the DeclRefExprAbbrev member.
  unsigned getDeclRefExprAbbrev() const {
    return DeclRefExprAbbrev;
  }
775
0
  /// Returns the current value of the CharacterLiteralAbbrev member.
  unsigned getCharacterLiteralAbbrev() const {
    return CharacterLiteralAbbrev;
  }
776
0
  /// Returns the current value of the IntegerLiteralAbbrev member.
  unsigned getIntegerLiteralAbbrev() const {
    return IntegerLiteralAbbrev;
  }
777
0
  /// Returns the current value of the ExprImplicitCastAbbrev member.
  unsigned getExprImplicitCastAbbrev() const {
    return ExprImplicitCastAbbrev;
  }
778
0
  /// Returns the current value of the BinaryOperatorAbbrev member.
  unsigned getBinaryOperatorAbbrev() const {
    return BinaryOperatorAbbrev;
  }
779
0
  unsigned getCompoundAssignOperatorAbbrev() const {
780
0
    return CompoundAssignOperatorAbbrev;
781
0
  }
782
0
  /// Returns the current value of the CallExprAbbrev member.
  unsigned getCallExprAbbrev() const {
    return CallExprAbbrev;
  }
783
0
  unsigned getCXXOperatorCallExprAbbrev() { return CXXOperatorCallExprAbbrev; }
784
0
  unsigned getCXXMemberCallExprAbbrev() { return CXXMemberCallExprAbbrev; }
785
786
0
  /// Returns the current value of the CompoundStmtAbbrev member.
  unsigned getCompoundStmtAbbrev() const {
    return CompoundStmtAbbrev;
  }
787
788
0
  /// Returns true when the Chain member is non-null.
  bool hasChain() const {
    return Chain != nullptr;
  }
789
0
  /// Returns the Chain member as an ASTReader pointer (possibly null; see
  /// hasChain).
  ASTReader *getChain() const {
    return Chain;
  }
790
791
0
  bool isWritingStdCXXNamedModules() const {
792
0
    return WritingModule && WritingModule->isNamedModule();
793
0
  }
794
795
private:
796
  // ASTDeserializationListener implementation
  //
  // The overrides below are private and are declared without inline bodies;
  // their definitions are not part of this header.
  // NOTE(review): presumably each one is invoked when the corresponding kind
  // of entity has been read from an AST file; confirm against the
  // ASTDeserializationListener interface.
797
  void ReaderInitialized(ASTReader *Reader) override;
798
  void IdentifierRead(serialization::IdentID ID, IdentifierInfo *II) override;
799
  void MacroRead(serialization::MacroID ID, MacroInfo *MI) override;
800
  void TypeRead(serialization::TypeIdx Idx, QualType T) override;
801
  void SelectorRead(serialization::SelectorID ID, Selector Sel) override;
802
  void MacroDefinitionRead(serialization::PreprocessedEntityID ID,
803
                           MacroDefinitionRecord *MD) override;
804
  void ModuleRead(serialization::SubmoduleID ID, Module *Mod) override;
805
806
  // ASTMutationListener implementation.
  //
  // The overrides below are private and are declared without inline bodies;
  // their definitions are not part of this header.
  // AddedCXXTemplateSpecialization is overloaded three times, once each for
  // class templates, variable templates and function templates.
  // NOTE(review): presumably each callback reports one kind of change made to
  // an already-existing declaration; confirm against the ASTMutationListener
  // interface.
807
  void CompletedTagDefinition(const TagDecl *D) override;
808
  void AddedVisibleDecl(const DeclContext *DC, const Decl *D) override;
809
  void AddedCXXImplicitMember(const CXXRecordDecl *RD, const Decl *D) override;
810
  void AddedCXXTemplateSpecialization(
811
      const ClassTemplateDecl *TD,
812
      const ClassTemplateSpecializationDecl *D) override;
813
  void AddedCXXTemplateSpecialization(
814
      const VarTemplateDecl *TD,
815
      const VarTemplateSpecializationDecl *D) override;
816
  void AddedCXXTemplateSpecialization(const FunctionTemplateDecl *TD,
817
                                      const FunctionDecl *D) override;
818
  void ResolvedExceptionSpec(const FunctionDecl *FD) override;
819
  void DeducedReturnType(const FunctionDecl *FD, QualType ReturnType) override;
820
  void ResolvedOperatorDelete(const CXXDestructorDecl *DD,
821
                              const FunctionDecl *Delete,
822
                              Expr *ThisArg) override;
823
  void CompletedImplicitDefinition(const FunctionDecl *D) override;
824
  void InstantiationRequested(const ValueDecl *D) override;
825
  void VariableDefinitionInstantiated(const VarDecl *D) override;
826
  void FunctionDefinitionInstantiated(const FunctionDecl *D) override;
827
  void DefaultArgumentInstantiated(const ParmVarDecl *D) override;
828
  void DefaultMemberInitializerInstantiated(const FieldDecl *D) override;
829
  void AddedObjCCategoryToInterface(const ObjCCategoryDecl *CatD,
830
                                    const ObjCInterfaceDecl *IFD) override;
831
  void DeclarationMarkedUsed(const Decl *D) override;
832
  void DeclarationMarkedOpenMPThreadPrivate(const Decl *D) override;
833
  void DeclarationMarkedOpenMPDeclareTarget(const Decl *D,
834
                                            const Attr *Attr) override;
835
  void DeclarationMarkedOpenMPAllocate(const Decl *D, const Attr *A) override;
836
  void RedefinedHiddenDefinition(const NamedDecl *D, Module *M) override;
837
  void AddedAttributeToRecord(const Attr *Attr,
838
                              const RecordDecl *Record) override;
839
};
840
841
/// AST and semantic-analysis consumer that generates a
842
/// precompiled header from the parsed source code.
843
class PCHGenerator : public SemaConsumer {
844
  const Preprocessor &PP;
845
  std::string OutputFile;
846
  std::string isysroot;
847
  Sema *SemaPtr;
848
  std::shared_ptr<PCHBuffer> Buffer;
849
  llvm::BitstreamWriter Stream;
850
  ASTWriter Writer;
851
  bool AllowASTWithErrors;
852
  bool ShouldCacheASTInMemory;
853
854
protected:
855
0
  ASTWriter &getWriter() { return Writer; }
856
0
  const ASTWriter &getWriter() const { return Writer; }
857
0
  SmallVectorImpl<char> &getPCH() const { return Buffer->Data; }
858
859
public:
860
  PCHGenerator(const Preprocessor &PP, InMemoryModuleCache &ModuleCache,
861
               StringRef OutputFile, StringRef isysroot,
862
               std::shared_ptr<PCHBuffer> Buffer,
863
               ArrayRef<std::shared_ptr<ModuleFileExtension>> Extensions,
864
               bool AllowASTWithErrors = false, bool IncludeTimestamps = true,
865
               bool BuildingImplicitModule = false,
866
               bool ShouldCacheASTInMemory = false);
867
  ~PCHGenerator() override;
868
869
0
  void InitializeSema(Sema &S) override { SemaPtr = &S; }
870
  void HandleTranslationUnit(ASTContext &Ctx) override;
871
  ASTMutationListener *GetASTMutationListener() override;
872
  ASTDeserializationListener *GetASTDeserializationListener() override;
873
0
  bool hasEmittedPCH() const { return Buffer->IsComplete; }
874
};
875
876
/// A simple helper class to pack several bit fields, in order, into one
/// 32-bit integer.
///
/// Fields are appended starting at the least significant bit: each call to
/// addBits() ORs the value in at the current bit index and then advances the
/// index by the field width. The accumulated value is read back through the
/// implicit conversion to uint32_t.
///
/// Instances can be neither copied nor moved.
class BitsPacker {
  /// Exclusive upper bound for the bit index. Note that the capacity check in
  /// canWriteNextNBits() is strict, so at most 31 bits are ever occupied.
  /// NOTE(review): the strict bound is kept unchanged on purpose; whatever
  /// unpacks these values presumably mirrors it, so confirm before relaxing.
  constexpr static uint32_t BitIndexUpbound = 32u;

public:
  BitsPacker() = default;
  BitsPacker(const BitsPacker &) = delete;
  BitsPacker(BitsPacker &&) = delete;
  // Deleted, but still spelled with the canonical reference return type.
  BitsPacker &operator=(const BitsPacker &) = delete;
  BitsPacker &operator=(BitsPacker &&) = delete;
  ~BitsPacker() = default;

  /// Returns true if a field of \p BitsWidth bits still fits, i.e. if
  /// CurrentBitIndex + BitsWidth is strictly below BitIndexUpbound.
  ///
  /// The comparison is written as a subtraction so that a very large
  /// \p BitsWidth cannot wrap around in uint32_t and be reported as fitting.
  bool canWriteNextNBits(uint32_t BitsWidth) const {
    return CurrentBitIndex < BitIndexUpbound &&
           BitsWidth < BitIndexUpbound - CurrentBitIndex;
  }

  /// Replaces the accumulated value with \p Value and rewinds the bit index
  /// to 0, so later fields are ORed into \p Value starting at bit 0.
  void reset(uint32_t Value) {
    UnderlyingValue = Value;
    CurrentBitIndex = 0;
  }

  /// Appends a single bit.
  void addBit(bool Value) { addBits(Value, 1); }

  /// Appends the low \p BitsWidth bits of \p Value.
  ///
  /// Asserts that \p BitsWidth is below BitIndexUpbound, that \p Value fits
  /// into \p BitsWidth bits, and that the field still fits into the word.
  void addBits(uint32_t Value, uint32_t BitsWidth) {
    assert(BitsWidth < BitIndexUpbound);
    assert((Value < (1u << BitsWidth)) && "Passing narrower bit width!");
    assert(canWriteNextNBits(BitsWidth) &&
           "Inserting too much bits into a value!");

    UnderlyingValue |= Value << CurrentBitIndex;
    CurrentBitIndex += BitsWidth;
  }

  /// Returns the value accumulated so far. Const-qualified because it only
  /// reads state; deliberately left implicit, as in the original interface.
  operator uint32_t() const { return UnderlyingValue; }

private:
  uint32_t UnderlyingValue = 0;
  uint32_t CurrentBitIndex = 0;
};
915
916
} // namespace clang
917
918
#endif // LLVM_CLANG_SERIALIZATION_ASTWRITER_H