1//===--- ExternalASTSource.h - Abstract External AST Interface --*- C++ -*-===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10//  This file defines the ExternalASTSource interface, which enables
11//  construction of AST nodes from some external source.
12//
13//===----------------------------------------------------------------------===//
14#ifndef LLVM_CLANG_AST_EXTERNALASTSOURCE_H
15#define LLVM_CLANG_AST_EXTERNALASTSOURCE_H
16
17#include "clang/AST/CharUnits.h"
18#include "clang/AST/DeclBase.h"
19#include "llvm/ADT/DenseMap.h"
20
21namespace clang {
22
// Forward declarations. Within this header these types are only named in
// declarations (as pointer, reference, parameter, return, or template
// argument types), so their complete definitions are not required here.
class ASTConsumer;
class CXXBaseSpecifier;
class CXXCtorInitializer;
class DeclarationName;
class ExternalSemaSource; // layering violation required for downcasting
class FieldDecl;
class Module;
class NamedDecl;
class RecordDecl;
class Selector;
class Stmt;
class TagDecl;
35
36/// \brief Abstract interface for external sources of AST nodes.
37///
38/// External AST sources provide AST nodes constructed from some
39/// external source, such as a precompiled header. External AST
40/// sources can resolve types and declarations from abstract IDs into
41/// actual type and declaration nodes, and read parts of declaration
42/// contexts.
43class ExternalASTSource : public RefCountedBase<ExternalASTSource> {
44  /// Generation number for this external AST source. Must be increased
45  /// whenever we might have added new redeclarations for existing decls.
46  uint32_t CurrentGeneration;
47
48  /// \brief Whether this AST source also provides information for
49  /// semantic analysis.
50  bool SemaSource;
51
52  friend class ExternalSemaSource;
53
54public:
55  ExternalASTSource() : CurrentGeneration(0), SemaSource(false) { }
56
57  virtual ~ExternalASTSource();
58
59  /// \brief RAII class for safely pairing a StartedDeserializing call
60  /// with FinishedDeserializing.
61  class Deserializing {
62    ExternalASTSource *Source;
63  public:
64    explicit Deserializing(ExternalASTSource *source) : Source(source) {
65      assert(Source);
66      Source->StartedDeserializing();
67    }
68    ~Deserializing() {
69      Source->FinishedDeserializing();
70    }
71  };
72
73  /// \brief Get the current generation of this AST source. This number
74  /// is incremented each time the AST source lazily extends an existing
75  /// entity.
76  uint32_t getGeneration() const { return CurrentGeneration; }
77
78  /// \brief Resolve a declaration ID into a declaration, potentially
79  /// building a new declaration.
80  ///
81  /// This method only needs to be implemented if the AST source ever
82  /// passes back decl sets as VisibleDeclaration objects.
83  ///
84  /// The default implementation of this method is a no-op.
85  virtual Decl *GetExternalDecl(uint32_t ID);
86
87  /// \brief Resolve a selector ID into a selector.
88  ///
89  /// This operation only needs to be implemented if the AST source
90  /// returns non-zero for GetNumKnownSelectors().
91  ///
92  /// The default implementation of this method is a no-op.
93  virtual Selector GetExternalSelector(uint32_t ID);
94
95  /// \brief Returns the number of selectors known to the external AST
96  /// source.
97  ///
98  /// The default implementation of this method is a no-op.
99  virtual uint32_t GetNumExternalSelectors();
100
101  /// \brief Resolve the offset of a statement in the decl stream into
102  /// a statement.
103  ///
104  /// This operation is meant to be used via a LazyOffsetPtr.  It only
105  /// needs to be implemented if the AST source uses methods like
106  /// FunctionDecl::setLazyBody when building decls.
107  ///
108  /// The default implementation of this method is a no-op.
109  virtual Stmt *GetExternalDeclStmt(uint64_t Offset);
110
111  /// \brief Resolve the offset of a set of C++ constructor initializers in
112  /// the decl stream into an array of initializers.
113  ///
114  /// The default implementation of this method is a no-op.
115  virtual CXXCtorInitializer **GetExternalCXXCtorInitializers(uint64_t Offset);
116
117  /// \brief Resolve the offset of a set of C++ base specifiers in the decl
118  /// stream into an array of specifiers.
119  ///
120  /// The default implementation of this method is a no-op.
121  virtual CXXBaseSpecifier *GetExternalCXXBaseSpecifiers(uint64_t Offset);
122
123  /// \brief Update an out-of-date identifier.
124  virtual void updateOutOfDateIdentifier(IdentifierInfo &II) { }
125
126  /// \brief Find all declarations with the given name in the given context,
127  /// and add them to the context by calling SetExternalVisibleDeclsForName
128  /// or SetNoExternalVisibleDeclsForName.
129  /// \return \c true if any declarations might have been found, \c false if
130  /// we definitely have no declarations with tbis name.
131  ///
132  /// The default implementation of this method is a no-op returning \c false.
133  virtual bool
134  FindExternalVisibleDeclsByName(const DeclContext *DC, DeclarationName Name);
135
136  /// \brief Ensures that the table of all visible declarations inside this
137  /// context is up to date.
138  ///
139  /// The default implementation of this function is a no-op.
140  virtual void completeVisibleDeclsMap(const DeclContext *DC);
141
142  /// \brief Retrieve the module that corresponds to the given module ID.
143  virtual Module *getModule(unsigned ID) { return nullptr; }
144
145  /// Abstracts clang modules and precompiled header files and holds
146  /// everything needed to generate debug info for an imported module
147  /// or PCH.
148  class ASTSourceDescriptor {
149    StringRef PCHModuleName;
150    StringRef Path;
151    StringRef ASTFile;
152    uint64_t Signature = 0;
153    const Module *ClangModule = nullptr;
154
155  public:
156    ASTSourceDescriptor(){};
157    ASTSourceDescriptor(StringRef Name, StringRef Path, StringRef ASTFile,
158                        uint64_t Signature)
159        : PCHModuleName(std::move(Name)), Path(std::move(Path)),
160          ASTFile(std::move(ASTFile)), Signature(Signature){};
161    ASTSourceDescriptor(const Module &M);
162    std::string getModuleName() const;
163    StringRef getPath() const { return Path; }
164    StringRef getASTFile() const { return ASTFile; }
165    uint64_t getSignature() const { return Signature; }
166    const Module *getModuleOrNull() const { return ClangModule; }
167  };
168
169  /// Return a descriptor for the corresponding module, if one exists.
170  virtual llvm::Optional<ASTSourceDescriptor> getSourceDescriptor(unsigned ID);
171
172  /// \brief Finds all declarations lexically contained within the given
173  /// DeclContext, after applying an optional filter predicate.
174  ///
175  /// \param IsKindWeWant a predicate function that returns true if the passed
176  /// declaration kind is one we are looking for.
177  ///
178  /// The default implementation of this method is a no-op.
179  virtual void
180  FindExternalLexicalDecls(const DeclContext *DC,
181                           llvm::function_ref<bool(Decl::Kind)> IsKindWeWant,
182                           SmallVectorImpl<Decl *> &Result);
183
184  /// \brief Finds all declarations lexically contained within the given
185  /// DeclContext.
186  void FindExternalLexicalDecls(const DeclContext *DC,
187                                SmallVectorImpl<Decl *> &Result) {
188    FindExternalLexicalDecls(DC, [](Decl::Kind) { return true; }, Result);
189  }
190
191  /// \brief Get the decls that are contained in a file in the Offset/Length
192  /// range. \p Length can be 0 to indicate a point at \p Offset instead of
193  /// a range.
194  virtual void FindFileRegionDecls(FileID File, unsigned Offset,
195                                   unsigned Length,
196                                   SmallVectorImpl<Decl *> &Decls);
197
198  /// \brief Gives the external AST source an opportunity to complete
199  /// the redeclaration chain for a declaration. Called each time we
200  /// need the most recent declaration of a declaration after the
201  /// generation count is incremented.
202  virtual void CompleteRedeclChain(const Decl *D);
203
204  /// \brief Gives the external AST source an opportunity to complete
205  /// an incomplete type.
206  virtual void CompleteType(TagDecl *Tag);
207
208  /// \brief Gives the external AST source an opportunity to complete an
209  /// incomplete Objective-C class.
210  ///
211  /// This routine will only be invoked if the "externally completed" bit is
212  /// set on the ObjCInterfaceDecl via the function
213  /// \c ObjCInterfaceDecl::setExternallyCompleted().
214  virtual void CompleteType(ObjCInterfaceDecl *Class);
215
216  /// \brief Loads comment ranges.
217  virtual void ReadComments();
218
219  /// \brief Notify ExternalASTSource that we started deserialization of
220  /// a decl or type so until FinishedDeserializing is called there may be
221  /// decls that are initializing. Must be paired with FinishedDeserializing.
222  ///
223  /// The default implementation of this method is a no-op.
224  virtual void StartedDeserializing();
225
226  /// \brief Notify ExternalASTSource that we finished the deserialization of
227  /// a decl or type. Must be paired with StartedDeserializing.
228  ///
229  /// The default implementation of this method is a no-op.
230  virtual void FinishedDeserializing();
231
232  /// \brief Function that will be invoked when we begin parsing a new
233  /// translation unit involving this external AST source.
234  ///
235  /// The default implementation of this method is a no-op.
236  virtual void StartTranslationUnit(ASTConsumer *Consumer);
237
238  /// \brief Print any statistics that have been gathered regarding
239  /// the external AST source.
240  ///
241  /// The default implementation of this method is a no-op.
242  virtual void PrintStats();
243
244
245  /// \brief Perform layout on the given record.
246  ///
247  /// This routine allows the external AST source to provide an specific
248  /// layout for a record, overriding the layout that would normally be
249  /// constructed. It is intended for clients who receive specific layout
250  /// details rather than source code (such as LLDB). The client is expected
251  /// to fill in the field offsets, base offsets, virtual base offsets, and
252  /// complete object size.
253  ///
254  /// \param Record The record whose layout is being requested.
255  ///
256  /// \param Size The final size of the record, in bits.
257  ///
258  /// \param Alignment The final alignment of the record, in bits.
259  ///
260  /// \param FieldOffsets The offset of each of the fields within the record,
261  /// expressed in bits. All of the fields must be provided with offsets.
262  ///
263  /// \param BaseOffsets The offset of each of the direct, non-virtual base
264  /// classes. If any bases are not given offsets, the bases will be laid
265  /// out according to the ABI.
266  ///
267  /// \param VirtualBaseOffsets The offset of each of the virtual base classes
268  /// (either direct or not). If any bases are not given offsets, the bases will be laid
269  /// out according to the ABI.
270  ///
271  /// \returns true if the record layout was provided, false otherwise.
272  virtual bool layoutRecordType(
273      const RecordDecl *Record, uint64_t &Size, uint64_t &Alignment,
274      llvm::DenseMap<const FieldDecl *, uint64_t> &FieldOffsets,
275      llvm::DenseMap<const CXXRecordDecl *, CharUnits> &BaseOffsets,
276      llvm::DenseMap<const CXXRecordDecl *, CharUnits> &VirtualBaseOffsets);
277
278  //===--------------------------------------------------------------------===//
279  // Queries for performance analysis.
280  //===--------------------------------------------------------------------===//
281
282  struct MemoryBufferSizes {
283    size_t malloc_bytes;
284    size_t mmap_bytes;
285
286    MemoryBufferSizes(size_t malloc_bytes, size_t mmap_bytes)
287    : malloc_bytes(malloc_bytes), mmap_bytes(mmap_bytes) {}
288  };
289
290  /// Return the amount of memory used by memory buffers, breaking down
291  /// by heap-backed versus mmap'ed memory.
292  MemoryBufferSizes getMemoryBufferSizes() const {
293    MemoryBufferSizes sizes(0, 0);
294    getMemoryBufferSizes(sizes);
295    return sizes;
296  }
297
298  virtual void getMemoryBufferSizes(MemoryBufferSizes &sizes) const;
299
300protected:
301  static DeclContextLookupResult
302  SetExternalVisibleDeclsForName(const DeclContext *DC,
303                                 DeclarationName Name,
304                                 ArrayRef<NamedDecl*> Decls);
305
306  static DeclContextLookupResult
307  SetNoExternalVisibleDeclsForName(const DeclContext *DC,
308                                   DeclarationName Name);
309
310  /// \brief Increment the current generation.
311  uint32_t incrementGeneration(ASTContext &C);
312};
313
314/// \brief A lazy pointer to an AST node (of base type T) that resides
315/// within an external AST source.
316///
317/// The AST node is identified within the external AST source by a
318/// 63-bit offset, and can be retrieved via an operation on the
319/// external AST source itself.
320template<typename T, typename OffsT, T* (ExternalASTSource::*Get)(OffsT Offset)>
321struct LazyOffsetPtr {
322  /// \brief Either a pointer to an AST node or the offset within the
323  /// external AST source where the AST node can be found.
324  ///
325  /// If the low bit is clear, a pointer to the AST node. If the low
326  /// bit is set, the upper 63 bits are the offset.
327  mutable uint64_t Ptr;
328
329public:
330  LazyOffsetPtr() : Ptr(0) { }
331
332  explicit LazyOffsetPtr(T *Ptr) : Ptr(reinterpret_cast<uint64_t>(Ptr)) { }
333  explicit LazyOffsetPtr(uint64_t Offset) : Ptr((Offset << 1) | 0x01) {
334    assert((Offset << 1 >> 1) == Offset && "Offsets must require < 63 bits");
335    if (Offset == 0)
336      Ptr = 0;
337  }
338
339  LazyOffsetPtr &operator=(T *Ptr) {
340    this->Ptr = reinterpret_cast<uint64_t>(Ptr);
341    return *this;
342  }
343
344  LazyOffsetPtr &operator=(uint64_t Offset) {
345    assert((Offset << 1 >> 1) == Offset && "Offsets must require < 63 bits");
346    if (Offset == 0)
347      Ptr = 0;
348    else
349      Ptr = (Offset << 1) | 0x01;
350
351    return *this;
352  }
353
354  /// \brief Whether this pointer is non-NULL.
355  ///
356  /// This operation does not require the AST node to be deserialized.
357  explicit operator bool() const { return Ptr != 0; }
358
359  /// \brief Whether this pointer is non-NULL.
360  ///
361  /// This operation does not require the AST node to be deserialized.
362  bool isValid() const { return Ptr != 0; }
363
364  /// \brief Whether this pointer is currently stored as an offset.
365  bool isOffset() const { return Ptr & 0x01; }
366
367  /// \brief Retrieve the pointer to the AST node that this lazy pointer
368  ///
369  /// \param Source the external AST source.
370  ///
371  /// \returns a pointer to the AST node.
372  T* get(ExternalASTSource *Source) const {
373    if (isOffset()) {
374      assert(Source &&
375             "Cannot deserialize a lazy pointer without an AST source");
376      Ptr = reinterpret_cast<uint64_t>((Source->*Get)(Ptr >> 1));
377    }
378    return reinterpret_cast<T*>(Ptr);
379  }
380};
381
382/// \brief A lazy value (of type T) that is within an AST node of type Owner,
383/// where the value might change in later generations of the external AST
384/// source.
385template<typename Owner, typename T, void (ExternalASTSource::*Update)(Owner)>
386struct LazyGenerationalUpdatePtr {
387  /// A cache of the value of this pointer, in the most recent generation in
388  /// which we queried it.
389  struct LazyData {
390    LazyData(ExternalASTSource *Source, T Value)
391        : ExternalSource(Source), LastGeneration(0), LastValue(Value) {}
392    ExternalASTSource *ExternalSource;
393    uint32_t LastGeneration;
394    T LastValue;
395  };
396
397  // Our value is represented as simply T if there is no external AST source.
398  typedef llvm::PointerUnion<T, LazyData*> ValueType;
399  ValueType Value;
400
401  LazyGenerationalUpdatePtr(ValueType V) : Value(V) {}
402
403  // Defined in ASTContext.h
404  static ValueType makeValue(const ASTContext &Ctx, T Value);
405
406public:
407  explicit LazyGenerationalUpdatePtr(const ASTContext &Ctx, T Value = T())
408      : Value(makeValue(Ctx, Value)) {}
409
410  /// Create a pointer that is not potentially updated by later generations of
411  /// the external AST source.
412  enum NotUpdatedTag { NotUpdated };
413  LazyGenerationalUpdatePtr(NotUpdatedTag, T Value = T())
414      : Value(Value) {}
415
416  /// Forcibly set this pointer (which must be lazy) as needing updates.
417  void markIncomplete() {
418    Value.template get<LazyData *>()->LastGeneration = 0;
419  }
420
421  /// Set the value of this pointer, in the current generation.
422  void set(T NewValue) {
423    if (LazyData *LazyVal = Value.template dyn_cast<LazyData*>()) {
424      LazyVal->LastValue = NewValue;
425      return;
426    }
427    Value = NewValue;
428  }
429
430  /// Set the value of this pointer, for this and all future generations.
431  void setNotUpdated(T NewValue) { Value = NewValue; }
432
433  /// Get the value of this pointer, updating its owner if necessary.
434  T get(Owner O) {
435    if (LazyData *LazyVal = Value.template dyn_cast<LazyData*>()) {
436      if (LazyVal->LastGeneration != LazyVal->ExternalSource->getGeneration()) {
437        LazyVal->LastGeneration = LazyVal->ExternalSource->getGeneration();
438        (LazyVal->ExternalSource->*Update)(O);
439      }
440      return LazyVal->LastValue;
441    }
442    return Value.template get<T>();
443  }
444
445  /// Get the most recently computed value of this pointer without updating it.
446  T getNotUpdated() const {
447    if (LazyData *LazyVal = Value.template dyn_cast<LazyData*>())
448      return LazyVal->LastValue;
449    return Value.template get<T>();
450  }
451
452  void *getOpaqueValue() { return Value.getOpaqueValue(); }
453  static LazyGenerationalUpdatePtr getFromOpaqueValue(void *Ptr) {
454    return LazyGenerationalUpdatePtr(ValueType::getFromOpaqueValue(Ptr));
455  }
456};
457} // end namespace clang
458
459/// Specialize PointerLikeTypeTraits to allow LazyGenerationalUpdatePtr to be
460/// placed into a PointerUnion.
461namespace llvm {
462template<typename Owner, typename T,
463         void (clang::ExternalASTSource::*Update)(Owner)>
464struct PointerLikeTypeTraits<
465    clang::LazyGenerationalUpdatePtr<Owner, T, Update>> {
466  typedef clang::LazyGenerationalUpdatePtr<Owner, T, Update> Ptr;
467  static void *getAsVoidPointer(Ptr P) { return P.getOpaqueValue(); }
468  static Ptr getFromVoidPointer(void *P) { return Ptr::getFromOpaqueValue(P); }
469  enum {
470    NumLowBitsAvailable = PointerLikeTypeTraits<T>::NumLowBitsAvailable - 1
471  };
472};
473}
474
475namespace clang {
476/// \brief Represents a lazily-loaded vector of data.
477///
478/// The lazily-loaded vector of data contains data that is partially loaded
479/// from an external source and partially added by local translation. The
480/// items loaded from the external source are loaded lazily, when needed for
481/// iteration over the complete vector.
482template<typename T, typename Source,
483         void (Source::*Loader)(SmallVectorImpl<T>&),
484         unsigned LoadedStorage = 2, unsigned LocalStorage = 4>
485class LazyVector {
486  SmallVector<T, LoadedStorage> Loaded;
487  SmallVector<T, LocalStorage> Local;
488
489public:
490  /// Iteration over the elements in the vector.
491  ///
492  /// In a complete iteration, the iterator walks the range [-M, N),
493  /// where negative values are used to indicate elements
494  /// loaded from the external source while non-negative values are used to
495  /// indicate elements added via \c push_back().
496  /// However, to provide iteration in source order (for, e.g., chained
497  /// precompiled headers), dereferencing the iterator flips the negative
498  /// values (corresponding to loaded entities), so that position -M
499  /// corresponds to element 0 in the loaded entities vector, position -M+1
500  /// corresponds to element 1 in the loaded entities vector, etc. This
501  /// gives us a reasonably efficient, source-order walk.
502  ///
503  /// We define this as a wrapping iterator around an int. The
504  /// iterator_adaptor_base class forwards the iterator methods to basic integer
505  /// arithmetic.
506  class iterator : public llvm::iterator_adaptor_base<
507                       iterator, int, std::random_access_iterator_tag, T, int> {
508    LazyVector *Self;
509
510    iterator(LazyVector *Self, int Position)
511        : iterator::iterator_adaptor_base(Position), Self(Self) {}
512
513    bool isLoaded() const { return this->I < 0; }
514    friend class LazyVector;
515
516  public:
517    iterator() : iterator(nullptr, 0) {}
518
519    typename iterator::reference operator*() const {
520      if (isLoaded())
521        return Self->Loaded.end()[this->I];
522      return Self->Local.begin()[this->I];
523    }
524  };
525
526  iterator begin(Source *source, bool LocalOnly = false) {
527    if (LocalOnly)
528      return iterator(this, 0);
529
530    if (source)
531      (source->*Loader)(Loaded);
532    return iterator(this, -(int)Loaded.size());
533  }
534
535  iterator end() {
536    return iterator(this, Local.size());
537  }
538
539  void push_back(const T& LocalValue) {
540    Local.push_back(LocalValue);
541  }
542
543  void erase(iterator From, iterator To) {
544    if (From.isLoaded() && To.isLoaded()) {
545      Loaded.erase(&*From, &*To);
546      return;
547    }
548
549    if (From.isLoaded()) {
550      Loaded.erase(&*From, Loaded.end());
551      From = begin(nullptr, true);
552    }
553
554    Local.erase(&*From, &*To);
555  }
556};
557
558/// \brief A lazy pointer to a statement.
559typedef LazyOffsetPtr<Stmt, uint64_t, &ExternalASTSource::GetExternalDeclStmt>
560  LazyDeclStmtPtr;
561
562/// \brief A lazy pointer to a declaration.
563typedef LazyOffsetPtr<Decl, uint32_t, &ExternalASTSource::GetExternalDecl>
564  LazyDeclPtr;
565
566/// \brief A lazy pointer to a set of CXXCtorInitializers.
567typedef LazyOffsetPtr<CXXCtorInitializer *, uint64_t,
568                      &ExternalASTSource::GetExternalCXXCtorInitializers>
569  LazyCXXCtorInitializersPtr;
570
571/// \brief A lazy pointer to a set of CXXBaseSpecifiers.
572typedef LazyOffsetPtr<CXXBaseSpecifier, uint64_t,
573                      &ExternalASTSource::GetExternalCXXBaseSpecifiers>
574  LazyCXXBaseSpecifiersPtr;
575
576} // end namespace clang
577
578#endif
579