xref: /freebsd/contrib/llvm-project/clang/include/clang/Lex/PreprocessingRecord.h (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
1 //===- PreprocessingRecord.h - Record of Preprocessing ----------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 //  This file defines the PreprocessingRecord class, which maintains a record
10 //  of what occurred during preprocessing.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #ifndef LLVM_CLANG_LEX_PREPROCESSINGRECORD_H
15 #define LLVM_CLANG_LEX_PREPROCESSINGRECORD_H
16 
17 #include "clang/Basic/IdentifierTable.h"
18 #include "clang/Basic/LLVM.h"
19 #include "clang/Basic/SourceLocation.h"
20 #include "clang/Lex/PPCallbacks.h"
21 #include "llvm/ADT/DenseMap.h"
22 #include "llvm/ADT/PointerUnion.h"
23 #include "llvm/ADT/StringRef.h"
24 #include "llvm/ADT/iterator.h"
25 #include "llvm/ADT/iterator_range.h"
26 #include "llvm/Support/Allocator.h"
27 #include "llvm/Support/Compiler.h"
28 #include <cassert>
29 #include <cstddef>
30 #include <iterator>
31 #include <optional>
32 #include <utility>
33 #include <vector>
34 
35 namespace clang {
36 
37 class PreprocessingRecord;
38 
39 } // namespace clang
40 
41 /// Allocates memory within a Clang preprocessing record.
42 void *operator new(size_t bytes, clang::PreprocessingRecord &PR,
43                    unsigned alignment = 8) noexcept;
44 
45 /// Frees memory allocated in a Clang preprocessing record.
46 void operator delete(void *ptr, clang::PreprocessingRecord &PR,
47                      unsigned) noexcept;
48 
49 namespace clang {
50 
51 class IdentifierInfo;
52 class MacroInfo;
53 class SourceManager;
54 class Token;
55 
56   /// Base class that describes a preprocessed entity, which may be a
57   /// preprocessor directive or macro expansion.
58   class PreprocessedEntity {
59   public:
60     /// The kind of preprocessed entity an object describes.
61     enum EntityKind {
62       /// Indicates a problem trying to load the preprocessed entity.
63       InvalidKind,
64 
65       /// A macro expansion.
66       MacroExpansionKind,
67 
68       /// \defgroup Preprocessing directives
69       /// @{
70 
71       /// A macro definition.
72       MacroDefinitionKind,
73 
74       /// An inclusion directive, such as \c \#include, \c
75       /// \#import, or \c \#include_next.
76       InclusionDirectiveKind,
77 
78       /// @}
79 
80       FirstPreprocessingDirective = MacroDefinitionKind,
81       LastPreprocessingDirective = InclusionDirectiveKind
82     };
83 
84   private:
85     /// The kind of preprocessed entity that this object describes.
86     EntityKind Kind;
87 
88     /// The source range that covers this preprocessed entity.
89     SourceRange Range;
90 
91   protected:
92     friend class PreprocessingRecord;
93 
PreprocessedEntity(EntityKind Kind,SourceRange Range)94     PreprocessedEntity(EntityKind Kind, SourceRange Range)
95         : Kind(Kind), Range(Range) {}
96 
97   public:
98     /// Retrieve the kind of preprocessed entity stored in this object.
getKind()99     EntityKind getKind() const { return Kind; }
100 
101     /// Retrieve the source range that covers this entire preprocessed
102     /// entity.
getSourceRange()103     SourceRange getSourceRange() const LLVM_READONLY { return Range; }
104 
105     /// Returns true if there was a problem loading the preprocessed
106     /// entity.
isInvalid()107     bool isInvalid() const { return Kind == InvalidKind; }
108 
109     // Only allow allocation of preprocessed entities using the allocator
110     // in PreprocessingRecord or by doing a placement new.
111     void *operator new(size_t bytes, PreprocessingRecord &PR,
112                        unsigned alignment = 8) noexcept {
113       return ::operator new(bytes, PR, alignment);
114     }
115 
new(size_t bytes,void * mem)116     void *operator new(size_t bytes, void *mem) noexcept { return mem; }
117 
delete(void * ptr,PreprocessingRecord & PR,unsigned alignment)118     void operator delete(void *ptr, PreprocessingRecord &PR,
119                          unsigned alignment) noexcept {
120       return ::operator delete(ptr, PR, alignment);
121     }
122 
delete(void *,std::size_t)123     void operator delete(void *, std::size_t) noexcept {}
delete(void *,void *)124     void operator delete(void *, void *) noexcept {}
125 
126   private:
127     // Make vanilla 'new' and 'delete' illegal for preprocessed entities.
128     void *operator new(size_t bytes) noexcept;
129     void operator delete(void *data) noexcept;
130   };
131 
132   /// Records the presence of a preprocessor directive.
133   class PreprocessingDirective : public PreprocessedEntity {
134   public:
PreprocessingDirective(EntityKind Kind,SourceRange Range)135     PreprocessingDirective(EntityKind Kind, SourceRange Range)
136         : PreprocessedEntity(Kind, Range) {}
137 
138     // Implement isa/cast/dyncast/etc.
classof(const PreprocessedEntity * PD)139     static bool classof(const PreprocessedEntity *PD) {
140       return PD->getKind() >= FirstPreprocessingDirective &&
141              PD->getKind() <= LastPreprocessingDirective;
142     }
143   };
144 
145   /// Record the location of a macro definition.
146   class MacroDefinitionRecord : public PreprocessingDirective {
147     /// The name of the macro being defined.
148     const IdentifierInfo *Name;
149 
150   public:
MacroDefinitionRecord(const IdentifierInfo * Name,SourceRange Range)151     explicit MacroDefinitionRecord(const IdentifierInfo *Name,
152                                    SourceRange Range)
153         : PreprocessingDirective(MacroDefinitionKind, Range), Name(Name) {}
154 
155     /// Retrieve the name of the macro being defined.
getName()156     const IdentifierInfo *getName() const { return Name; }
157 
158     /// Retrieve the location of the macro name in the definition.
getLocation()159     SourceLocation getLocation() const { return getSourceRange().getBegin(); }
160 
161     // Implement isa/cast/dyncast/etc.
classof(const PreprocessedEntity * PE)162     static bool classof(const PreprocessedEntity *PE) {
163       return PE->getKind() == MacroDefinitionKind;
164     }
165   };
166 
167   /// Records the location of a macro expansion.
168   class MacroExpansion : public PreprocessedEntity {
169     /// The definition of this macro or the name of the macro if it is
170     /// a builtin macro.
171     llvm::PointerUnion<IdentifierInfo *, MacroDefinitionRecord *> NameOrDef;
172 
173   public:
MacroExpansion(IdentifierInfo * BuiltinName,SourceRange Range)174     MacroExpansion(IdentifierInfo *BuiltinName, SourceRange Range)
175         : PreprocessedEntity(MacroExpansionKind, Range),
176           NameOrDef(BuiltinName) {}
177 
MacroExpansion(MacroDefinitionRecord * Definition,SourceRange Range)178     MacroExpansion(MacroDefinitionRecord *Definition, SourceRange Range)
179         : PreprocessedEntity(MacroExpansionKind, Range), NameOrDef(Definition) {
180     }
181 
182     /// True if it is a builtin macro.
isBuiltinMacro()183     bool isBuiltinMacro() const { return NameOrDef.is<IdentifierInfo *>(); }
184 
185     /// The name of the macro being expanded.
getName()186     const IdentifierInfo *getName() const {
187       if (MacroDefinitionRecord *Def = getDefinition())
188         return Def->getName();
189       return NameOrDef.get<IdentifierInfo *>();
190     }
191 
192     /// The definition of the macro being expanded. May return null if
193     /// this is a builtin macro.
getDefinition()194     MacroDefinitionRecord *getDefinition() const {
195       return NameOrDef.dyn_cast<MacroDefinitionRecord *>();
196     }
197 
198     // Implement isa/cast/dyncast/etc.
classof(const PreprocessedEntity * PE)199     static bool classof(const PreprocessedEntity *PE) {
200       return PE->getKind() == MacroExpansionKind;
201     }
202   };
203 
204   /// Record the location of an inclusion directive, such as an
205   /// \c \#include or \c \#import statement.
206   class InclusionDirective : public PreprocessingDirective {
207   public:
208     /// The kind of inclusion directives known to the
209     /// preprocessor.
210     enum InclusionKind {
211       /// An \c \#include directive.
212       Include,
213 
214       /// An Objective-C \c \#import directive.
215       Import,
216 
217       /// A GNU \c \#include_next directive.
218       IncludeNext,
219 
220       /// A Clang \c \#__include_macros directive.
221       IncludeMacros
222     };
223 
224   private:
225     /// The name of the file that was included, as written in
226     /// the source.
227     StringRef FileName;
228 
229     /// Whether the file name was in quotation marks; otherwise, it was
230     /// in angle brackets.
231     LLVM_PREFERRED_TYPE(bool)
232     unsigned InQuotes : 1;
233 
234     /// The kind of inclusion directive we have.
235     ///
236     /// This is a value of type InclusionKind.
237     LLVM_PREFERRED_TYPE(InclusionKind)
238     unsigned Kind : 2;
239 
240     /// Whether the inclusion directive was automatically turned into
241     /// a module import.
242     LLVM_PREFERRED_TYPE(bool)
243     unsigned ImportedModule : 1;
244 
245     /// The file that was included.
246     OptionalFileEntryRef File;
247 
248   public:
249     InclusionDirective(PreprocessingRecord &PPRec, InclusionKind Kind,
250                        StringRef FileName, bool InQuotes, bool ImportedModule,
251                        OptionalFileEntryRef File, SourceRange Range);
252 
253     /// Determine what kind of inclusion directive this is.
getKind()254     InclusionKind getKind() const { return static_cast<InclusionKind>(Kind); }
255 
256     /// Retrieve the included file name as it was written in the source.
getFileName()257     StringRef getFileName() const { return FileName; }
258 
259     /// Determine whether the included file name was written in quotes;
260     /// otherwise, it was written in angle brackets.
wasInQuotes()261     bool wasInQuotes() const { return InQuotes; }
262 
263     /// Determine whether the inclusion directive was automatically
264     /// turned into a module import.
importedModule()265     bool importedModule() const { return ImportedModule; }
266 
267     /// Retrieve the file entry for the actual file that was included
268     /// by this directive.
getFile()269     OptionalFileEntryRef getFile() const { return File; }
270 
271     // Implement isa/cast/dyncast/etc.
classof(const PreprocessedEntity * PE)272     static bool classof(const PreprocessedEntity *PE) {
273       return PE->getKind() == InclusionDirectiveKind;
274     }
275   };
276 
277   /// An abstract class that should be subclassed by any external source
278   /// of preprocessing record entries.
279   class ExternalPreprocessingRecordSource {
280   public:
281     virtual ~ExternalPreprocessingRecordSource();
282 
283     /// Read a preallocated preprocessed entity from the external source.
284     ///
285     /// \returns null if an error occurred that prevented the preprocessed
286     /// entity from being loaded.
287     virtual PreprocessedEntity *ReadPreprocessedEntity(unsigned Index) = 0;
288 
289     /// Returns a pair of [Begin, End) indices of preallocated
290     /// preprocessed entities that \p Range encompasses.
291     virtual std::pair<unsigned, unsigned>
292         findPreprocessedEntitiesInRange(SourceRange Range) = 0;
293 
294     /// Optionally returns true or false if the preallocated preprocessed
295     /// entity with index \p Index came from file \p FID.
isPreprocessedEntityInFileID(unsigned Index,FileID FID)296     virtual std::optional<bool> isPreprocessedEntityInFileID(unsigned Index,
297                                                              FileID FID) {
298       return std::nullopt;
299     }
300 
301     /// Read a preallocated skipped range from the external source.
302     virtual SourceRange ReadSkippedRange(unsigned Index) = 0;
303   };
304 
305   /// A record of the steps taken while preprocessing a source file,
306   /// including the various preprocessing directives processed, macros
307   /// expanded, etc.
308   class PreprocessingRecord : public PPCallbacks {
309     SourceManager &SourceMgr;
310 
311     /// Allocator used to store preprocessing objects.
312     llvm::BumpPtrAllocator BumpAlloc;
313 
314     /// The set of preprocessed entities in this record, in order they
315     /// were seen.
316     std::vector<PreprocessedEntity *> PreprocessedEntities;
317 
318     /// The set of preprocessed entities in this record that have been
319     /// loaded from external sources.
320     ///
321     /// The entries in this vector are loaded lazily from the external source,
322     /// and are referenced by the iterator using negative indices.
323     std::vector<PreprocessedEntity *> LoadedPreprocessedEntities;
324 
325     /// The set of ranges that were skipped by the preprocessor,
326     std::vector<SourceRange> SkippedRanges;
327 
328     bool SkippedRangesAllLoaded = true;
329 
330     /// Global (loaded or local) ID for a preprocessed entity.
331     /// Negative values are used to indicate preprocessed entities
332     /// loaded from the external source while non-negative values are used to
333     /// indicate preprocessed entities introduced by the current preprocessor.
334     /// Value -1 corresponds to element 0 in the loaded entities vector,
335     /// value -2 corresponds to element 1 in the loaded entities vector, etc.
336     /// Value 0 is an invalid value, the index to local entities is 1-based,
337     /// value 1 corresponds to element 0 in the local entities vector,
338     /// value 2 corresponds to element 1 in the local entities vector, etc.
339     class PPEntityID {
340       friend class PreprocessingRecord;
341 
342       int ID = 0;
343 
PPEntityID(int ID)344       explicit PPEntityID(int ID) : ID(ID) {}
345 
346     public:
347       PPEntityID() = default;
348     };
349 
getPPEntityID(unsigned Index,bool isLoaded)350     static PPEntityID getPPEntityID(unsigned Index, bool isLoaded) {
351       return isLoaded ? PPEntityID(-int(Index)-1) : PPEntityID(Index+1);
352     }
353 
354     /// Mapping from MacroInfo structures to their definitions.
355     llvm::DenseMap<const MacroInfo *, MacroDefinitionRecord *> MacroDefinitions;
356 
357     /// External source of preprocessed entities.
358     ExternalPreprocessingRecordSource *ExternalSource = nullptr;
359 
360     /// Retrieve the preprocessed entity at the given ID.
361     PreprocessedEntity *getPreprocessedEntity(PPEntityID PPID);
362 
363     /// Retrieve the loaded preprocessed entity at the given index.
364     PreprocessedEntity *getLoadedPreprocessedEntity(unsigned Index);
365 
366     /// Determine the number of preprocessed entities that were
367     /// loaded (or can be loaded) from an external source.
getNumLoadedPreprocessedEntities()368     unsigned getNumLoadedPreprocessedEntities() const {
369       return LoadedPreprocessedEntities.size();
370     }
371 
372     /// Returns a pair of [Begin, End) indices of local preprocessed
373     /// entities that \p Range encompasses.
374     std::pair<unsigned, unsigned>
375       findLocalPreprocessedEntitiesInRange(SourceRange Range) const;
376     unsigned findBeginLocalPreprocessedEntity(SourceLocation Loc) const;
377     unsigned findEndLocalPreprocessedEntity(SourceLocation Loc) const;
378 
379     /// Allocate space for a new set of loaded preprocessed entities.
380     ///
381     /// \returns The index into the set of loaded preprocessed entities, which
382     /// corresponds to the first newly-allocated entity.
383     unsigned allocateLoadedEntities(unsigned NumEntities);
384 
385     /// Allocate space for a new set of loaded preprocessed skipped
386     /// ranges.
387     ///
388     /// \returns The index into the set of loaded preprocessed ranges, which
389     /// corresponds to the first newly-allocated range.
390     unsigned allocateSkippedRanges(unsigned NumRanges);
391 
392     /// Ensures that all external skipped ranges have been loaded.
393     void ensureSkippedRangesLoaded();
394 
395     /// Register a new macro definition.
396     void RegisterMacroDefinition(MacroInfo *Macro, MacroDefinitionRecord *Def);
397 
398   public:
399     /// Construct a new preprocessing record.
400     explicit PreprocessingRecord(SourceManager &SM);
401 
402     /// Allocate memory in the preprocessing record.
403     void *Allocate(unsigned Size, unsigned Align = 8) {
404       return BumpAlloc.Allocate(Size, Align);
405     }
406 
407     /// Deallocate memory in the preprocessing record.
Deallocate(void * Ptr)408     void Deallocate(void *Ptr) {}
409 
410     size_t getTotalMemory() const;
411 
getSourceManager()412     SourceManager &getSourceManager() const { return SourceMgr; }
413 
414     /// Iteration over the preprocessed entities.
415     ///
416     /// In a complete iteration, the iterator walks the range [-M, N),
417     /// where negative values are used to indicate preprocessed entities
418     /// loaded from the external source while non-negative values are used to
419     /// indicate preprocessed entities introduced by the current preprocessor.
420     /// However, to provide iteration in source order (for, e.g., chained
421     /// precompiled headers), dereferencing the iterator flips the negative
422     /// values (corresponding to loaded entities), so that position -M
423     /// corresponds to element 0 in the loaded entities vector, position -M+1
424     /// corresponds to element 1 in the loaded entities vector, etc. This
425     /// gives us a reasonably efficient, source-order walk.
426     ///
427     /// We define this as a wrapping iterator around an int. The
428     /// iterator_adaptor_base class forwards the iterator methods to basic
429     /// integer arithmetic.
430     class iterator : public llvm::iterator_adaptor_base<
431                          iterator, int, std::random_access_iterator_tag,
432                          PreprocessedEntity *, int, PreprocessedEntity *,
433                          PreprocessedEntity *> {
434       friend class PreprocessingRecord;
435 
436       PreprocessingRecord *Self;
437 
iterator(PreprocessingRecord * Self,int Position)438       iterator(PreprocessingRecord *Self, int Position)
439           : iterator::iterator_adaptor_base(Position), Self(Self) {}
440 
441     public:
iterator()442       iterator() : iterator(nullptr, 0) {}
443 
444       PreprocessedEntity *operator*() const {
445         bool isLoaded = this->I < 0;
446         unsigned Index = isLoaded ?
447             Self->LoadedPreprocessedEntities.size() + this->I : this->I;
448         PPEntityID ID = Self->getPPEntityID(Index, isLoaded);
449         return Self->getPreprocessedEntity(ID);
450       }
451       PreprocessedEntity *operator->() const { return **this; }
452     };
453 
454     /// Begin iterator for all preprocessed entities.
begin()455     iterator begin() {
456       return iterator(this, -(int)LoadedPreprocessedEntities.size());
457     }
458 
459     /// End iterator for all preprocessed entities.
end()460     iterator end() {
461       return iterator(this, PreprocessedEntities.size());
462     }
463 
464     /// Begin iterator for local, non-loaded, preprocessed entities.
local_begin()465     iterator local_begin() {
466       return iterator(this, 0);
467     }
468 
469     /// End iterator for local, non-loaded, preprocessed entities.
local_end()470     iterator local_end() {
471       return iterator(this, PreprocessedEntities.size());
472     }
473 
474     /// iterator range for the given range of loaded
475     /// preprocessed entities.
getIteratorsForLoadedRange(unsigned start,unsigned count)476     llvm::iterator_range<iterator> getIteratorsForLoadedRange(unsigned start,
477                                                               unsigned count) {
478       unsigned end = start + count;
479       assert(end <= LoadedPreprocessedEntities.size());
480       return llvm::make_range(
481           iterator(this, int(start) - LoadedPreprocessedEntities.size()),
482           iterator(this, int(end) - LoadedPreprocessedEntities.size()));
483     }
484 
485     /// Returns a range of preprocessed entities that source range \p R
486     /// encompasses.
487     ///
488     /// \param R the range to look for preprocessed entities.
489     llvm::iterator_range<iterator>
490     getPreprocessedEntitiesInRange(SourceRange R);
491 
492     /// Returns true if the preprocessed entity that \p PPEI iterator
493     /// points to is coming from the file \p FID.
494     ///
495     /// Can be used to avoid implicit deserializations of preallocated
496     /// preprocessed entities if we only care about entities of a specific file
497     /// and not from files \#included in the range given at
498     /// \see getPreprocessedEntitiesInRange.
499     bool isEntityInFileID(iterator PPEI, FileID FID);
500 
501     /// Add a new preprocessed entity to this record.
502     PPEntityID addPreprocessedEntity(PreprocessedEntity *Entity);
503 
504     /// Set the external source for preprocessed entities.
505     void SetExternalSource(ExternalPreprocessingRecordSource &Source);
506 
507     /// Retrieve the external source for preprocessed entities.
getExternalSource()508     ExternalPreprocessingRecordSource *getExternalSource() const {
509       return ExternalSource;
510     }
511 
512     /// Retrieve the macro definition that corresponds to the given
513     /// \c MacroInfo.
514     MacroDefinitionRecord *findMacroDefinition(const MacroInfo *MI);
515 
516     /// Retrieve all ranges that got skipped while preprocessing.
getSkippedRanges()517     const std::vector<SourceRange> &getSkippedRanges() {
518       ensureSkippedRangesLoaded();
519       return SkippedRanges;
520     }
521 
522   private:
523     friend class ASTReader;
524     friend class ASTWriter;
525 
526     void MacroExpands(const Token &Id, const MacroDefinition &MD,
527                       SourceRange Range, const MacroArgs *Args) override;
528     void MacroDefined(const Token &Id, const MacroDirective *MD) override;
529     void MacroUndefined(const Token &Id, const MacroDefinition &MD,
530                         const MacroDirective *Undef) override;
531     void InclusionDirective(SourceLocation HashLoc, const Token &IncludeTok,
532                             StringRef FileName, bool IsAngled,
533                             CharSourceRange FilenameRange,
534                             OptionalFileEntryRef File, StringRef SearchPath,
535                             StringRef RelativePath,
536                             const Module *SuggestedModule, bool ModuleImported,
537                             SrcMgr::CharacteristicKind FileType) override;
538     void Ifdef(SourceLocation Loc, const Token &MacroNameTok,
539                const MacroDefinition &MD) override;
540     void Ifndef(SourceLocation Loc, const Token &MacroNameTok,
541                 const MacroDefinition &MD) override;
542 
543     using PPCallbacks::Elifdef;
544     using PPCallbacks::Elifndef;
545     void Elifdef(SourceLocation Loc, const Token &MacroNameTok,
546                  const MacroDefinition &MD) override;
547     void Elifndef(SourceLocation Loc, const Token &MacroNameTok,
548                   const MacroDefinition &MD) override;
549 
550     /// Hook called whenever the 'defined' operator is seen.
551     void Defined(const Token &MacroNameTok, const MacroDefinition &MD,
552                  SourceRange Range) override;
553 
554     void SourceRangeSkipped(SourceRange Range,
555                             SourceLocation EndifLoc) override;
556 
557     void addMacroExpansion(const Token &Id, const MacroInfo *MI,
558                            SourceRange Range);
559 
560     /// Cached result of the last \see getPreprocessedEntitiesInRange
561     /// query.
562     struct {
563       SourceRange Range;
564       std::pair<int, int> Result;
565     } CachedRangeQuery;
566 
567     std::pair<int, int> getPreprocessedEntitiesInRangeSlow(SourceRange R);
568   };
569 
570 } // namespace clang
571 
new(size_t bytes,clang::PreprocessingRecord & PR,unsigned alignment)572 inline void *operator new(size_t bytes, clang::PreprocessingRecord &PR,
573                           unsigned alignment) noexcept {
574   return PR.Allocate(bytes, alignment);
575 }
576 
delete(void * ptr,clang::PreprocessingRecord & PR,unsigned)577 inline void operator delete(void *ptr, clang::PreprocessingRecord &PR,
578                             unsigned) noexcept {
579   PR.Deallocate(ptr);
580 }
581 
582 #endif // LLVM_CLANG_LEX_PREPROCESSINGRECORD_H
583