HeaderSearch.h revision fba18aa8f2cd1994dc65e8cb9f4be201c560dc0b
1//===--- HeaderSearch.h - Resolve Header File Locations ---------*- C++ -*-===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file defines the HeaderSearch interface.
11//
12//===----------------------------------------------------------------------===//
13
14#ifndef LLVM_CLANG_LEX_HEADERSEARCH_H
15#define LLVM_CLANG_LEX_HEADERSEARCH_H
16
17#include "clang/Lex/DirectoryLookup.h"
18#include "llvm/ADT/StringMap.h"
19#include "llvm/ADT/StringSet.h"
20#include "llvm/Support/Allocator.h"
21#include <vector>
22
23namespace clang {
24
25class ExternalIdentifierLookup;
26class FileEntry;
27class FileManager;
28class IdentifierInfo;
29
30/// HeaderFileInfo - The preprocessor keeps track of this information for each
31/// file that is #included.
32struct HeaderFileInfo {
33  /// isImport - True if this is a #import'd or #pragma once file.
34  unsigned isImport : 1;
35
36  /// isPragmaOnce - True if this is  #pragma once file.
37  unsigned isPragmaOnce : 1;
38
39  /// DirInfo - Keep track of whether this is a system header, and if so,
40  /// whether it is C++ clean or not.  This can be set by the include paths or
41  /// by #pragma gcc system_header.  This is an instance of
42  /// SrcMgr::CharacteristicKind.
43  unsigned DirInfo : 2;
44
45  /// \brief Whether this header file info was supplied by an external source.
46  unsigned External : 1;
47
48  /// \brief Whether this structure is considered to already have been
49  /// "resolved", meaning that it was loaded from the external source.
50  unsigned Resolved : 1;
51
52  /// \brief Whether this is a header inside a framework that is currently
53  /// being built.
54  ///
55  /// When a framework is being built, the headers have not yet been placed
56  /// into the appropriate framework subdirectories, and therefore are
57  /// provided via a header map. This bit indicates when this is one of
58  /// those framework headers.
59  unsigned IndexHeaderMapHeader : 1;
60
61  /// NumIncludes - This is the number of times the file has been included
62  /// already.
63  unsigned short NumIncludes;
64
65  /// \brief The ID number of the controlling macro.
66  ///
67  /// This ID number will be non-zero when there is a controlling
68  /// macro whose IdentifierInfo may not yet have been loaded from
69  /// external storage.
70  unsigned ControllingMacroID;
71
72  /// ControllingMacro - If this file has a #ifndef XXX (or equivalent) guard
73  /// that protects the entire contents of the file, this is the identifier
74  /// for the macro that controls whether or not it has any effect.
75  ///
76  /// Note: Most clients should use getControllingMacro() to access
77  /// the controlling macro of this header, since
78  /// getControllingMacro() is able to load a controlling macro from
79  /// external storage.
80  const IdentifierInfo *ControllingMacro;
81
82  /// \brief If this header came from a framework include, this is the name
83  /// of the framework.
84  StringRef Framework;
85
86  HeaderFileInfo()
87    : isImport(false), isPragmaOnce(false), DirInfo(SrcMgr::C_User),
88      External(false), Resolved(false), IndexHeaderMapHeader(false),
89      NumIncludes(0), ControllingMacroID(0), ControllingMacro(0)  {}
90
91  /// \brief Retrieve the controlling macro for this header file, if
92  /// any.
93  const IdentifierInfo *getControllingMacro(ExternalIdentifierLookup *External);
94
95  /// \brief Determine whether this is a non-default header file info, e.g.,
96  /// it corresponds to an actual header we've included or tried to include.
97  bool isNonDefault() const {
98    return isImport || isPragmaOnce || NumIncludes || ControllingMacro ||
99      ControllingMacroID;
100  }
101};
102
103/// \brief An external source of header file information, which may supply
104/// information about header files already included.
105class ExternalHeaderFileInfoSource {
106public:
107  virtual ~ExternalHeaderFileInfoSource();
108
109  /// \brief Retrieve the header file information for the given file entry.
110  ///
111  /// \returns Header file information for the given file entry, with the
112  /// \c External bit set. If the file entry is not known, return a
113  /// default-constructed \c HeaderFileInfo.
114  virtual HeaderFileInfo GetHeaderFileInfo(const FileEntry *FE) = 0;
115};
116
117/// HeaderSearch - This class encapsulates the information needed to find the
118/// file referenced by a #include or #include_next, (sub-)framework lookup, etc.
119class HeaderSearch {
120  FileManager &FileMgr;
121  /// #include search path information.  Requests for #include "x" search the
122  /// directory of the #including file first, then each directory in SearchDirs
123  /// consecutively. Requests for <x> search the current dir first, then each
124  /// directory in SearchDirs, starting at AngledDirIdx, consecutively.  If
125  /// NoCurDirSearch is true, then the check for the file in the current
126  /// directory is suppressed.
127  std::vector<DirectoryLookup> SearchDirs;
128  unsigned AngledDirIdx;
129  unsigned SystemDirIdx;
130  bool NoCurDirSearch;
131
132  /// \brief The path to the module cache.
133  std::string ModuleCachePath;
134
135  /// \brief The name of the module we're building.
136  std::string BuildingModule;
137
138  /// FileInfo - This contains all of the preprocessor-specific data about files
139  /// that are included.  The vector is indexed by the FileEntry's UID.
140  ///
141  std::vector<HeaderFileInfo> FileInfo;
142
143  /// LookupFileCache - This is keeps track of each lookup performed by
144  /// LookupFile.  The first part of the value is the starting index in
145  /// SearchDirs that the cached search was performed from.  If there is a hit
146  /// and this value doesn't match the current query, the cache has to be
147  /// ignored.  The second value is the entry in SearchDirs that satisfied the
148  /// query.
149  llvm::StringMap<std::pair<unsigned, unsigned>, llvm::BumpPtrAllocator>
150    LookupFileCache;
151
152
153  /// FrameworkMap - This is a collection mapping a framework or subframework
154  /// name like "Carbon" to the Carbon.framework directory.
155  llvm::StringMap<const DirectoryEntry *, llvm::BumpPtrAllocator>
156    FrameworkMap;
157
158  /// HeaderMaps - This is a mapping from FileEntry -> HeaderMap, uniquing
159  /// headermaps.  This vector owns the headermap.
160  std::vector<std::pair<const FileEntry*, const HeaderMap*> > HeaderMaps;
161
162  /// \brief Uniqued set of framework names, which is used to track which
163  /// headers were included as framework headers.
164  llvm::StringSet<llvm::BumpPtrAllocator> FrameworkNames;
165
166  /// \brief Entity used to resolve the identifier IDs of controlling
167  /// macros into IdentifierInfo pointers, as needed.
168  ExternalIdentifierLookup *ExternalLookup;
169
170  /// \brief Entity used to look up stored header file information.
171  ExternalHeaderFileInfoSource *ExternalSource;
172
173  // Various statistics we track for performance analysis.
174  unsigned NumIncluded;
175  unsigned NumMultiIncludeFileOptzn;
176  unsigned NumFrameworkLookups, NumSubFrameworkLookups;
177
178  // HeaderSearch doesn't support default or copy construction.
179  explicit HeaderSearch();
180  explicit HeaderSearch(const HeaderSearch&);
181  void operator=(const HeaderSearch&);
182public:
183  HeaderSearch(FileManager &FM);
184  ~HeaderSearch();
185
186  FileManager &getFileMgr() const { return FileMgr; }
187
188  /// SetSearchPaths - Interface for setting the file search paths.
189  ///
190  void SetSearchPaths(const std::vector<DirectoryLookup> &dirs,
191                      unsigned angledDirIdx, unsigned systemDirIdx,
192                      bool noCurDirSearch) {
193    assert(angledDirIdx <= systemDirIdx && systemDirIdx <= dirs.size() &&
194        "Directory indicies are unordered");
195    SearchDirs = dirs;
196    AngledDirIdx = angledDirIdx;
197    SystemDirIdx = systemDirIdx;
198    NoCurDirSearch = noCurDirSearch;
199    //LookupFileCache.clear();
200  }
201
202  /// \brief Set the path to the module cache and the name of the module
203  /// we're building
204  void configureModules(StringRef CachePath, StringRef BuildingModule) {
205    ModuleCachePath = CachePath;
206    this->BuildingModule = BuildingModule;
207  }
208
209  /// ClearFileInfo - Forget everything we know about headers so far.
210  void ClearFileInfo() {
211    FileInfo.clear();
212  }
213
214  void SetExternalLookup(ExternalIdentifierLookup *EIL) {
215    ExternalLookup = EIL;
216  }
217
218  ExternalIdentifierLookup *getExternalLookup() const {
219    return ExternalLookup;
220  }
221
222  /// \brief Set the external source of header information.
223  void SetExternalSource(ExternalHeaderFileInfoSource *ES) {
224    ExternalSource = ES;
225  }
226
227  /// LookupFile - Given a "foo" or <foo> reference, look up the indicated file,
228  /// return null on failure.
229  ///
230  /// \returns If successful, this returns 'UsedDir', the DirectoryLookup member
231  /// the file was found in, or null if not applicable.
232  ///
233  /// \param isAngled indicates whether the file reference is a <> reference.
234  ///
235  /// \param CurDir If non-null, the file was found in the specified directory
236  /// search location.  This is used to implement #include_next.
237  ///
238  /// \param CurFileEnt If non-null, indicates where the #including file is, in
239  /// case a relative search is needed.
240  ///
241  /// \param SearchPath If non-null, will be set to the search path relative
242  /// to which the file was found. If the include path is absolute, SearchPath
243  /// will be set to an empty string.
244  ///
245  /// \param RelativePath If non-null, will be set to the path relative to
246  /// SearchPath at which the file was found. This only differs from the
247  /// Filename for framework includes.
248  ///
249  /// \param SuggestedModule If non-null, and the file found is semantically
250  /// part of a known module, this will be set to the name of the module that
251  /// could be imported instead of preprocessing/parsing the file found.
252  const FileEntry *LookupFile(StringRef Filename, bool isAngled,
253                              const DirectoryLookup *FromDir,
254                              const DirectoryLookup *&CurDir,
255                              const FileEntry *CurFileEnt,
256                              SmallVectorImpl<char> *SearchPath,
257                              SmallVectorImpl<char> *RelativePath,
258                              StringRef *SuggestedModule);
259
260  /// LookupSubframeworkHeader - Look up a subframework for the specified
261  /// #include file.  For example, if #include'ing <HIToolbox/HIToolbox.h> from
262  /// within ".../Carbon.framework/Headers/Carbon.h", check to see if HIToolbox
263  /// is a subframework within Carbon.framework.  If so, return the FileEntry
264  /// for the designated file, otherwise return null.
265  const FileEntry *LookupSubframeworkHeader(
266      StringRef Filename,
267      const FileEntry *RelativeFileEnt,
268      SmallVectorImpl<char> *SearchPath,
269      SmallVectorImpl<char> *RelativePath);
270
271  /// LookupFrameworkCache - Look up the specified framework name in our
272  /// framework cache, returning the DirectoryEntry it is in if we know,
273  /// otherwise, return null.
274  const DirectoryEntry *&LookupFrameworkCache(StringRef FWName) {
275    return FrameworkMap.GetOrCreateValue(FWName).getValue();
276  }
277
278  /// ShouldEnterIncludeFile - Mark the specified file as a target of of a
279  /// #include, #include_next, or #import directive.  Return false if #including
280  /// the file will have no effect or true if we should include it.
281  bool ShouldEnterIncludeFile(const FileEntry *File, bool isImport);
282
283
284  /// getFileDirFlavor - Return whether the specified file is a normal header,
285  /// a system header, or a C++ friendly system header.
286  SrcMgr::CharacteristicKind getFileDirFlavor(const FileEntry *File) {
287    return (SrcMgr::CharacteristicKind)getFileInfo(File).DirInfo;
288  }
289
290  /// MarkFileIncludeOnce - Mark the specified file as a "once only" file, e.g.
291  /// due to #pragma once.
292  void MarkFileIncludeOnce(const FileEntry *File) {
293    HeaderFileInfo &FI = getFileInfo(File);
294    FI.isImport = true;
295    FI.isPragmaOnce = true;
296  }
297
298  /// MarkFileSystemHeader - Mark the specified file as a system header, e.g.
299  /// due to #pragma GCC system_header.
300  void MarkFileSystemHeader(const FileEntry *File) {
301    getFileInfo(File).DirInfo = SrcMgr::C_System;
302  }
303
304  /// IncrementIncludeCount - Increment the count for the number of times the
305  /// specified FileEntry has been entered.
306  void IncrementIncludeCount(const FileEntry *File) {
307    ++getFileInfo(File).NumIncludes;
308  }
309
310  /// SetFileControllingMacro - Mark the specified file as having a controlling
311  /// macro.  This is used by the multiple-include optimization to eliminate
312  /// no-op #includes.
313  void SetFileControllingMacro(const FileEntry *File,
314                               const IdentifierInfo *ControllingMacro) {
315    getFileInfo(File).ControllingMacro = ControllingMacro;
316  }
317
318  /// \brief Determine whether this file is intended to be safe from
319  /// multiple inclusions, e.g., it has #pragma once or a controlling
320  /// macro.
321  ///
322  /// This routine does not consider the effect of #import
323  bool isFileMultipleIncludeGuarded(const FileEntry *File);
324
325  /// CreateHeaderMap - This method returns a HeaderMap for the specified
326  /// FileEntry, uniquing them through the the 'HeaderMaps' datastructure.
327  const HeaderMap *CreateHeaderMap(const FileEntry *FE);
328
329  /// \brief Search in the module cache path for a module with the given
330  /// name.
331  ///
332  /// \param If non-NULL, will be set to the module file name we expected to
333  /// find (regardless of whether it was actually found or not).
334  ///
335  /// \param UmbrellaHeader If non-NULL, and no module was found in the module
336  /// cache, this routine will search in the framework paths to determine
337  /// whether a module can be built from an umbrella header. If so, the pointee
338  /// will be set to the path of the umbrella header.
339  ///
340  /// \returns A file describing the named module, if available, or NULL to
341  /// indicate that the module could not be found.
342  const FileEntry *lookupModule(StringRef ModuleName,
343                                std::string *ModuleFileName = 0,
344                                std::string *UmbrellaHeader = 0);
345
346  void IncrementFrameworkLookupCount() { ++NumFrameworkLookups; }
347
348  typedef std::vector<HeaderFileInfo>::const_iterator header_file_iterator;
349  header_file_iterator header_file_begin() const { return FileInfo.begin(); }
350  header_file_iterator header_file_end() const { return FileInfo.end(); }
351  unsigned header_file_size() const { return FileInfo.size(); }
352
353  // Used by ASTReader.
354  void setHeaderFileInfoForUID(HeaderFileInfo HFI, unsigned UID);
355
356  // Used by external tools
357  typedef std::vector<DirectoryLookup>::const_iterator search_dir_iterator;
358  search_dir_iterator search_dir_begin() const { return SearchDirs.begin(); }
359  search_dir_iterator search_dir_end() const { return SearchDirs.end(); }
360  unsigned search_dir_size() const { return SearchDirs.size(); }
361
362  search_dir_iterator quoted_dir_begin() const {
363    return SearchDirs.begin();
364  }
365  search_dir_iterator quoted_dir_end() const {
366    return SearchDirs.begin() + AngledDirIdx;
367  }
368
369  search_dir_iterator angled_dir_begin() const {
370    return SearchDirs.begin() + AngledDirIdx;
371  }
372  search_dir_iterator angled_dir_end() const {
373    return SearchDirs.begin() + SystemDirIdx;
374  }
375
376  search_dir_iterator system_dir_begin() const {
377    return SearchDirs.begin() + SystemDirIdx;
378  }
379  search_dir_iterator system_dir_end() const { return SearchDirs.end(); }
380
381  /// \brief Retrieve a uniqued framework name.
382  StringRef getUniqueFrameworkName(StringRef Framework);
383
384  void PrintStats();
385
386  size_t getTotalMemory() const;
387
388private:
389
390  /// getFileInfo - Return the HeaderFileInfo structure for the specified
391  /// FileEntry.
392  HeaderFileInfo &getFileInfo(const FileEntry *FE);
393};
394
395}  // end namespace clang
396
397#endif
398