HeaderSearch.h revision 10285d9113c14d1e523f86a55b193eb752638ea5
1//===--- HeaderSearch.h - Resolve Header File Locations ---------*- C++ -*-===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9// 10// This file defines the HeaderSearch interface. 11// 12//===----------------------------------------------------------------------===// 13 14#ifndef LLVM_CLANG_LEX_HEADERSEARCH_H 15#define LLVM_CLANG_LEX_HEADERSEARCH_H 16 17#include "clang/Lex/DirectoryLookup.h" 18#include "clang/Lex/ModuleMap.h" 19#include "llvm/ADT/StringMap.h" 20#include "llvm/ADT/StringSet.h" 21#include "llvm/Support/Allocator.h" 22#include <vector> 23 24namespace clang { 25 26class DiagnosticsEngine; 27class ExternalIdentifierLookup; 28class FileEntry; 29class FileManager; 30class IdentifierInfo; 31 32/// HeaderFileInfo - The preprocessor keeps track of this information for each 33/// file that is #included. 34struct HeaderFileInfo { 35 /// isImport - True if this is a #import'd or #pragma once file. 36 unsigned isImport : 1; 37 38 /// isPragmaOnce - True if this is #pragma once file. 39 unsigned isPragmaOnce : 1; 40 41 /// DirInfo - Keep track of whether this is a system header, and if so, 42 /// whether it is C++ clean or not. This can be set by the include paths or 43 /// by #pragma gcc system_header. This is an instance of 44 /// SrcMgr::CharacteristicKind. 45 unsigned DirInfo : 2; 46 47 /// \brief Whether this header file info was supplied by an external source. 48 unsigned External : 1; 49 50 /// \brief Whether this structure is considered to already have been 51 /// "resolved", meaning that it was loaded from the external source. 52 unsigned Resolved : 1; 53 54 /// \brief Whether this is a header inside a framework that is currently 55 /// being built. 56 /// 57 /// When a framework is being built, the headers have not yet been placed 58 /// into the appropriate framework subdirectories, and therefore are 59 /// provided via a header map. This bit indicates when this is one of 60 /// those framework headers. 61 unsigned IndexHeaderMapHeader : 1; 62 63 /// NumIncludes - This is the number of times the file has been included 64 /// already. 65 unsigned short NumIncludes; 66 67 /// \brief The ID number of the controlling macro. 68 /// 69 /// This ID number will be non-zero when there is a controlling 70 /// macro whose IdentifierInfo may not yet have been loaded from 71 /// external storage. 72 unsigned ControllingMacroID; 73 74 /// ControllingMacro - If this file has a #ifndef XXX (or equivalent) guard 75 /// that protects the entire contents of the file, this is the identifier 76 /// for the macro that controls whether or not it has any effect. 77 /// 78 /// Note: Most clients should use getControllingMacro() to access 79 /// the controlling macro of this header, since 80 /// getControllingMacro() is able to load a controlling macro from 81 /// external storage. 82 const IdentifierInfo *ControllingMacro; 83 84 /// \brief If this header came from a framework include, this is the name 85 /// of the framework. 86 StringRef Framework; 87 88 HeaderFileInfo() 89 : isImport(false), isPragmaOnce(false), DirInfo(SrcMgr::C_User), 90 External(false), Resolved(false), IndexHeaderMapHeader(false), 91 NumIncludes(0), ControllingMacroID(0), ControllingMacro(0) {} 92 93 /// \brief Retrieve the controlling macro for this header file, if 94 /// any. 95 const IdentifierInfo *getControllingMacro(ExternalIdentifierLookup *External); 96 97 /// \brief Determine whether this is a non-default header file info, e.g., 98 /// it corresponds to an actual header we've included or tried to include. 99 bool isNonDefault() const { 100 return isImport || isPragmaOnce || NumIncludes || ControllingMacro || 101 ControllingMacroID; 102 } 103}; 104 105/// \brief An external source of header file information, which may supply 106/// information about header files already included. 107class ExternalHeaderFileInfoSource { 108public: 109 virtual ~ExternalHeaderFileInfoSource(); 110 111 /// \brief Retrieve the header file information for the given file entry. 112 /// 113 /// \returns Header file information for the given file entry, with the 114 /// \c External bit set. If the file entry is not known, return a 115 /// default-constructed \c HeaderFileInfo. 116 virtual HeaderFileInfo GetHeaderFileInfo(const FileEntry *FE) = 0; 117}; 118 119/// HeaderSearch - This class encapsulates the information needed to find the 120/// file referenced by a #include or #include_next, (sub-)framework lookup, etc. 121class HeaderSearch { 122 FileManager &FileMgr; 123 DiagnosticsEngine &Diags; 124 /// #include search path information. Requests for #include "x" search the 125 /// directory of the #including file first, then each directory in SearchDirs 126 /// consecutively. Requests for <x> search the current dir first, then each 127 /// directory in SearchDirs, starting at AngledDirIdx, consecutively. If 128 /// NoCurDirSearch is true, then the check for the file in the current 129 /// directory is suppressed. 130 std::vector<DirectoryLookup> SearchDirs; 131 unsigned AngledDirIdx; 132 unsigned SystemDirIdx; 133 bool NoCurDirSearch; 134 135 /// \brief The path to the module cache. 136 std::string ModuleCachePath; 137 138 /// FileInfo - This contains all of the preprocessor-specific data about files 139 /// that are included. The vector is indexed by the FileEntry's UID. 140 /// 141 std::vector<HeaderFileInfo> FileInfo; 142 143 /// LookupFileCache - This is keeps track of each lookup performed by 144 /// LookupFile. The first part of the value is the starting index in 145 /// SearchDirs that the cached search was performed from. If there is a hit 146 /// and this value doesn't match the current query, the cache has to be 147 /// ignored. The second value is the entry in SearchDirs that satisfied the 148 /// query. 149 llvm::StringMap<std::pair<unsigned, unsigned>, llvm::BumpPtrAllocator> 150 LookupFileCache; 151 152 /// FrameworkMap - This is a collection mapping a framework or subframework 153 /// name like "Carbon" to the Carbon.framework directory. 154 llvm::StringMap<const DirectoryEntry *, llvm::BumpPtrAllocator> 155 FrameworkMap; 156 157 /// HeaderMaps - This is a mapping from FileEntry -> HeaderMap, uniquing 158 /// headermaps. This vector owns the headermap. 159 std::vector<std::pair<const FileEntry*, const HeaderMap*> > HeaderMaps; 160 161 /// \brief The mapping between modules and headers. 162 ModuleMap ModMap; 163 164 /// \brief Describes whether a given directory has a module map in it. 165 llvm::DenseMap<const DirectoryEntry *, bool> DirectoryHasModuleMap; 166 167 /// \brief Uniqued set of framework names, which is used to track which 168 /// headers were included as framework headers. 169 llvm::StringSet<llvm::BumpPtrAllocator> FrameworkNames; 170 171 /// \brief Entity used to resolve the identifier IDs of controlling 172 /// macros into IdentifierInfo pointers, as needed. 173 ExternalIdentifierLookup *ExternalLookup; 174 175 /// \brief Entity used to look up stored header file information. 176 ExternalHeaderFileInfoSource *ExternalSource; 177 178 // Various statistics we track for performance analysis. 179 unsigned NumIncluded; 180 unsigned NumMultiIncludeFileOptzn; 181 unsigned NumFrameworkLookups, NumSubFrameworkLookups; 182 183 // HeaderSearch doesn't support default or copy construction. 184 explicit HeaderSearch(); 185 explicit HeaderSearch(const HeaderSearch&); 186 void operator=(const HeaderSearch&); 187 188 friend class DirectoryLookup; 189 190public: 191 HeaderSearch(FileManager &FM, DiagnosticsEngine &Diags, 192 const LangOptions &LangOpts, const TargetInfo *Target); 193 ~HeaderSearch(); 194 195 FileManager &getFileMgr() const { return FileMgr; } 196 197 /// SetSearchPaths - Interface for setting the file search paths. 198 /// 199 void SetSearchPaths(const std::vector<DirectoryLookup> &dirs, 200 unsigned angledDirIdx, unsigned systemDirIdx, 201 bool noCurDirSearch) { 202 assert(angledDirIdx <= systemDirIdx && systemDirIdx <= dirs.size() && 203 "Directory indicies are unordered"); 204 SearchDirs = dirs; 205 AngledDirIdx = angledDirIdx; 206 SystemDirIdx = systemDirIdx; 207 NoCurDirSearch = noCurDirSearch; 208 //LookupFileCache.clear(); 209 } 210 211 /// AddSearchPath - Add an additional search path. 212 void AddSearchPath(const DirectoryLookup &dir, bool isAngled) { 213 unsigned idx = isAngled ? SystemDirIdx : AngledDirIdx; 214 SearchDirs.insert(SearchDirs.begin() + idx, dir); 215 if (!isAngled) 216 AngledDirIdx++; 217 SystemDirIdx++; 218 } 219 220 /// \brief Set the path to the module cache. 221 void setModuleCachePath(StringRef CachePath) { 222 ModuleCachePath = CachePath; 223 } 224 225 /// \brief Retrieve the path to the module cache. 226 StringRef getModuleCachePath() const { return ModuleCachePath; } 227 228 /// ClearFileInfo - Forget everything we know about headers so far. 229 void ClearFileInfo() { 230 FileInfo.clear(); 231 } 232 233 void SetExternalLookup(ExternalIdentifierLookup *EIL) { 234 ExternalLookup = EIL; 235 } 236 237 ExternalIdentifierLookup *getExternalLookup() const { 238 return ExternalLookup; 239 } 240 241 /// \brief Set the external source of header information. 242 void SetExternalSource(ExternalHeaderFileInfoSource *ES) { 243 ExternalSource = ES; 244 } 245 246 /// \brief Set the target information for the header search, if not 247 /// already known. 248 void setTarget(const TargetInfo &Target); 249 250 /// LookupFile - Given a "foo" or <foo> reference, look up the indicated file, 251 /// return null on failure. 252 /// 253 /// \returns If successful, this returns 'UsedDir', the DirectoryLookup member 254 /// the file was found in, or null if not applicable. 255 /// 256 /// \param isAngled indicates whether the file reference is a <> reference. 257 /// 258 /// \param CurDir If non-null, the file was found in the specified directory 259 /// search location. This is used to implement #include_next. 260 /// 261 /// \param CurFileEnt If non-null, indicates where the #including file is, in 262 /// case a relative search is needed. 263 /// 264 /// \param SearchPath If non-null, will be set to the search path relative 265 /// to which the file was found. If the include path is absolute, SearchPath 266 /// will be set to an empty string. 267 /// 268 /// \param RelativePath If non-null, will be set to the path relative to 269 /// SearchPath at which the file was found. This only differs from the 270 /// Filename for framework includes. 271 /// 272 /// \param SuggestedModule If non-null, and the file found is semantically 273 /// part of a known module, this will be set to the module that should 274 /// be imported instead of preprocessing/parsing the file found. 275 const FileEntry *LookupFile(StringRef Filename, bool isAngled, 276 const DirectoryLookup *FromDir, 277 const DirectoryLookup *&CurDir, 278 const FileEntry *CurFileEnt, 279 SmallVectorImpl<char> *SearchPath, 280 SmallVectorImpl<char> *RelativePath, 281 Module **SuggestedModule, 282 bool SkipCache = false); 283 284 /// LookupSubframeworkHeader - Look up a subframework for the specified 285 /// #include file. For example, if #include'ing <HIToolbox/HIToolbox.h> from 286 /// within ".../Carbon.framework/Headers/Carbon.h", check to see if HIToolbox 287 /// is a subframework within Carbon.framework. If so, return the FileEntry 288 /// for the designated file, otherwise return null. 289 const FileEntry *LookupSubframeworkHeader( 290 StringRef Filename, 291 const FileEntry *RelativeFileEnt, 292 SmallVectorImpl<char> *SearchPath, 293 SmallVectorImpl<char> *RelativePath); 294 295 /// LookupFrameworkCache - Look up the specified framework name in our 296 /// framework cache, returning the DirectoryEntry it is in if we know, 297 /// otherwise, return null. 298 const DirectoryEntry *&LookupFrameworkCache(StringRef FWName) { 299 return FrameworkMap.GetOrCreateValue(FWName).getValue(); 300 } 301 302 /// ShouldEnterIncludeFile - Mark the specified file as a target of of a 303 /// #include, #include_next, or #import directive. Return false if #including 304 /// the file will have no effect or true if we should include it. 305 bool ShouldEnterIncludeFile(const FileEntry *File, bool isImport); 306 307 308 /// getFileDirFlavor - Return whether the specified file is a normal header, 309 /// a system header, or a C++ friendly system header. 310 SrcMgr::CharacteristicKind getFileDirFlavor(const FileEntry *File) { 311 return (SrcMgr::CharacteristicKind)getFileInfo(File).DirInfo; 312 } 313 314 /// MarkFileIncludeOnce - Mark the specified file as a "once only" file, e.g. 315 /// due to #pragma once. 316 void MarkFileIncludeOnce(const FileEntry *File) { 317 HeaderFileInfo &FI = getFileInfo(File); 318 FI.isImport = true; 319 FI.isPragmaOnce = true; 320 } 321 322 /// MarkFileSystemHeader - Mark the specified file as a system header, e.g. 323 /// due to #pragma GCC system_header. 324 void MarkFileSystemHeader(const FileEntry *File) { 325 getFileInfo(File).DirInfo = SrcMgr::C_System; 326 } 327 328 /// IncrementIncludeCount - Increment the count for the number of times the 329 /// specified FileEntry has been entered. 330 void IncrementIncludeCount(const FileEntry *File) { 331 ++getFileInfo(File).NumIncludes; 332 } 333 334 /// SetFileControllingMacro - Mark the specified file as having a controlling 335 /// macro. This is used by the multiple-include optimization to eliminate 336 /// no-op #includes. 337 void SetFileControllingMacro(const FileEntry *File, 338 const IdentifierInfo *ControllingMacro) { 339 getFileInfo(File).ControllingMacro = ControllingMacro; 340 } 341 342 /// \brief Determine whether this file is intended to be safe from 343 /// multiple inclusions, e.g., it has #pragma once or a controlling 344 /// macro. 345 /// 346 /// This routine does not consider the effect of #import 347 bool isFileMultipleIncludeGuarded(const FileEntry *File); 348 349 /// CreateHeaderMap - This method returns a HeaderMap for the specified 350 /// FileEntry, uniquing them through the the 'HeaderMaps' datastructure. 351 const HeaderMap *CreateHeaderMap(const FileEntry *FE); 352 353 /// \brief Retrieve the name of the module file that should be used to 354 /// load the given module. 355 /// 356 /// \param Module The module whose module file name will be returned. 357 /// 358 /// \returns The name of the module file that corresponds to this module, 359 /// or an empty string if this module does not correspond to any module file. 360 std::string getModuleFileName(Module *Module); 361 362 /// \brief Retrieve the name of the module file that should be used to 363 /// load a module with the given name. 364 /// 365 /// \param Module The module whose module file name will be returned. 366 /// 367 /// \returns The name of the module file that corresponds to this module, 368 /// or an empty string if this module does not correspond to any module file. 369 std::string getModuleFileName(StringRef ModuleName); 370 371 /// \brief Lookup a module Search for a module with the given name. 372 /// 373 /// \param ModuleName The name of the module we're looking for. 374 /// 375 /// \param AllowSearch Whether we are allowed to search in the various 376 /// search directories to produce a module definition. If not, this lookup 377 /// will only return an already-known module. 378 /// 379 /// \returns The module with the given name. 380 Module *lookupModule(StringRef ModuleName, bool AllowSearch = true); 381 382 void IncrementFrameworkLookupCount() { ++NumFrameworkLookups; } 383 384 /// \brief Determine whether there is a module map that may map the header 385 /// with the given file name to a (sub)module. 386 /// 387 /// \param Filename The name of the file. 388 /// 389 /// \param Root The "root" directory, at which we should stop looking for 390 /// module maps. 391 bool hasModuleMap(StringRef Filename, const DirectoryEntry *Root); 392 393 /// \brief Retrieve the module that corresponds to the given file, if any. 394 /// 395 /// \param File The header that we wish to map to a module. 396 Module *findModuleForHeader(const FileEntry *File); 397 398 /// \brief Read the contents of the given module map file. 399 /// 400 /// \param File The module map file. 401 /// 402 /// \param OnlyModule If non-NULL, this will receive the 403 /// 404 /// \returns true if an error occurred, false otherwise. 405 bool loadModuleMapFile(const FileEntry *File); 406 407 /// \brief Collect the set of all known, top-level modules. 408 /// 409 /// \param Modules Will be filled with the set of known, top-level modules. 410 void collectAllModules(llvm::SmallVectorImpl<Module *> &Modules); 411 412private: 413 /// \brief Retrieve a module with the given name, which may be part of the 414 /// given framework. 415 /// 416 /// \param Name The name of the module to retrieve. 417 /// 418 /// \param Dir The framework directory (e.g., ModuleName.framework). 419 /// 420 /// \param IsSystem Whether the framework directory is part of the system 421 /// frameworks. 422 /// 423 /// \returns The module, if found; otherwise, null. 424 Module *loadFrameworkModule(StringRef Name, 425 const DirectoryEntry *Dir, 426 bool IsSystem); 427 428public: 429 /// \brief Retrieve the module map. 430 ModuleMap &getModuleMap() { return ModMap; } 431 432 unsigned header_file_size() const { return FileInfo.size(); } 433 434 // Used by ASTReader. 435 void setHeaderFileInfoForUID(HeaderFileInfo HFI, unsigned UID); 436 437 /// getFileInfo - Return the HeaderFileInfo structure for the specified 438 /// FileEntry. 439 const HeaderFileInfo &getFileInfo(const FileEntry *FE) const { 440 return const_cast<HeaderSearch*>(this)->getFileInfo(FE); 441 } 442 443 // Used by external tools 444 typedef std::vector<DirectoryLookup>::const_iterator search_dir_iterator; 445 search_dir_iterator search_dir_begin() const { return SearchDirs.begin(); } 446 search_dir_iterator search_dir_end() const { return SearchDirs.end(); } 447 unsigned search_dir_size() const { return SearchDirs.size(); } 448 449 search_dir_iterator quoted_dir_begin() const { 450 return SearchDirs.begin(); 451 } 452 search_dir_iterator quoted_dir_end() const { 453 return SearchDirs.begin() + AngledDirIdx; 454 } 455 456 search_dir_iterator angled_dir_begin() const { 457 return SearchDirs.begin() + AngledDirIdx; 458 } 459 search_dir_iterator angled_dir_end() const { 460 return SearchDirs.begin() + SystemDirIdx; 461 } 462 463 search_dir_iterator system_dir_begin() const { 464 return SearchDirs.begin() + SystemDirIdx; 465 } 466 search_dir_iterator system_dir_end() const { return SearchDirs.end(); } 467 468 /// \brief Retrieve a uniqued framework name. 469 StringRef getUniqueFrameworkName(StringRef Framework); 470 471 void PrintStats(); 472 473 size_t getTotalMemory() const; 474 475 static std::string NormalizeDashIncludePath(StringRef File, 476 FileManager &FileMgr); 477 478private: 479 /// \brief Describes what happened when we tried to load a module map file. 480 enum LoadModuleMapResult { 481 /// \brief The module map file had already been loaded. 482 LMM_AlreadyLoaded, 483 /// \brief The module map file was loaded by this invocation. 484 LMM_NewlyLoaded, 485 /// \brief There is was directory with the given name. 486 LMM_NoDirectory, 487 /// \brief There was either no module map file or the module map file was 488 /// invalid. 489 LMM_InvalidModuleMap 490 }; 491 492 /// \brief Try to load the module map file in the given directory. 493 /// 494 /// \param DirName The name of the directory where we will look for a module 495 /// map file. 496 /// 497 /// \returns The result of attempting to load the module map file from the 498 /// named directory. 499 LoadModuleMapResult loadModuleMapFile(StringRef DirName); 500 501 /// \brief Try to load the module map file in the given directory. 502 /// 503 /// \param Dir The directory where we will look for a module map file. 504 /// 505 /// \returns The result of attempting to load the module map file from the 506 /// named directory. 507 LoadModuleMapResult loadModuleMapFile(const DirectoryEntry *Dir); 508 509 /// getFileInfo - Return the HeaderFileInfo structure for the specified 510 /// FileEntry. 511 HeaderFileInfo &getFileInfo(const FileEntry *FE); 512}; 513 514} // end namespace clang 515 516#endif 517