1 //===--- HeaderSearch.h - Resolve Header File Locations ---------*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file defines the HeaderSearch interface. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #ifndef LLVM_CLANG_LEX_HEADERSEARCH_H 15 #define LLVM_CLANG_LEX_HEADERSEARCH_H 16 17 #include "clang/Lex/DirectoryLookup.h" 18 #include "clang/Lex/ModuleMap.h" 19 #include "llvm/ADT/ArrayRef.h" 20 #include "llvm/ADT/StringMap.h" 21 #include "llvm/ADT/StringSet.h" 22 #include "llvm/Support/Allocator.h" 23 #include "llvm/ADT/OwningPtr.h" 24 #include <vector> 25 26 namespace clang { 27 28 class DiagnosticsEngine; 29 class ExternalIdentifierLookup; 30 class FileEntry; 31 class FileManager; 32 class IdentifierInfo; 33 34 /// \brief The preprocessor keeps track of this information for each 35 /// file that is \#included. 36 struct HeaderFileInfo { 37 /// \brief True if this is a \#import'd or \#pragma once file. 38 unsigned isImport : 1; 39 40 /// \brief True if this is a \#pragma once file. 41 unsigned isPragmaOnce : 1; 42 43 /// DirInfo - Keep track of whether this is a system header, and if so, 44 /// whether it is C++ clean or not. This can be set by the include paths or 45 /// by \#pragma gcc system_header. This is an instance of 46 /// SrcMgr::CharacteristicKind. 47 unsigned DirInfo : 2; 48 49 /// \brief Whether this header file info was supplied by an external source. 50 unsigned External : 1; 51 52 /// \brief Whether this structure is considered to already have been 53 /// "resolved", meaning that it was loaded from the external source. 54 unsigned Resolved : 1; 55 56 /// \brief Whether this is a header inside a framework that is currently 57 /// being built. 58 /// 59 /// When a framework is being built, the headers have not yet been placed 60 /// into the appropriate framework subdirectories, and therefore are 61 /// provided via a header map. This bit indicates when this is one of 62 /// those framework headers. 63 unsigned IndexHeaderMapHeader : 1; 64 65 /// \brief The number of times the file has been included already. 66 unsigned short NumIncludes; 67 68 /// \brief The ID number of the controlling macro. 69 /// 70 /// This ID number will be non-zero when there is a controlling 71 /// macro whose IdentifierInfo may not yet have been loaded from 72 /// external storage. 73 unsigned ControllingMacroID; 74 75 /// If this file has a \#ifndef XXX (or equivalent) guard that 76 /// protects the entire contents of the file, this is the identifier 77 /// for the macro that controls whether or not it has any effect. 78 /// 79 /// Note: Most clients should use getControllingMacro() to access 80 /// the controlling macro of this header, since 81 /// getControllingMacro() is able to load a controlling macro from 82 /// external storage. 83 const IdentifierInfo *ControllingMacro; 84 85 /// \brief If this header came from a framework include, this is the name 86 /// of the framework. 87 StringRef Framework; 88 HeaderFileInfoHeaderFileInfo89 HeaderFileInfo() 90 : isImport(false), isPragmaOnce(false), DirInfo(SrcMgr::C_User), 91 External(false), Resolved(false), IndexHeaderMapHeader(false), 92 NumIncludes(0), ControllingMacroID(0), ControllingMacro(0) {} 93 94 /// \brief Retrieve the controlling macro for this header file, if 95 /// any. 96 const IdentifierInfo *getControllingMacro(ExternalIdentifierLookup *External); 97 98 /// \brief Determine whether this is a non-default header file info, e.g., 99 /// it corresponds to an actual header we've included or tried to include. isNonDefaultHeaderFileInfo100 bool isNonDefault() const { 101 return isImport || isPragmaOnce || NumIncludes || ControllingMacro || 102 ControllingMacroID; 103 } 104 }; 105 106 /// \brief An external source of header file information, which may supply 107 /// information about header files already included. 108 class ExternalHeaderFileInfoSource { 109 public: 110 virtual ~ExternalHeaderFileInfoSource(); 111 112 /// \brief Retrieve the header file information for the given file entry. 113 /// 114 /// \returns Header file information for the given file entry, with the 115 /// \c External bit set. If the file entry is not known, return a 116 /// default-constructed \c HeaderFileInfo. 117 virtual HeaderFileInfo GetHeaderFileInfo(const FileEntry *FE) = 0; 118 }; 119 120 /// \brief Encapsulates the information needed to find the file referenced 121 /// by a \#include or \#include_next, (sub-)framework lookup, etc. 122 class HeaderSearch { 123 /// This structure is used to record entries in our framework cache. 124 struct FrameworkCacheEntry { 125 /// The directory entry which should be used for the cached framework. 126 const DirectoryEntry *Directory; 127 128 /// Whether this framework has been "user-specified" to be treated as if it 129 /// were a system framework (even if it was found outside a system framework 130 /// directory). 131 bool IsUserSpecifiedSystemFramework; 132 }; 133 134 FileManager &FileMgr; 135 DiagnosticsEngine &Diags; 136 /// \#include search path information. Requests for \#include "x" search the 137 /// directory of the \#including file first, then each directory in SearchDirs 138 /// consecutively. Requests for <x> search the current dir first, then each 139 /// directory in SearchDirs, starting at AngledDirIdx, consecutively. If 140 /// NoCurDirSearch is true, then the check for the file in the current 141 /// directory is suppressed. 142 std::vector<DirectoryLookup> SearchDirs; 143 unsigned AngledDirIdx; 144 unsigned SystemDirIdx; 145 bool NoCurDirSearch; 146 147 /// \brief \#include prefixes for which the 'system header' property is 148 /// overridden. 149 /// 150 /// For a \#include "x" or \#include \<x> directive, the last string in this 151 /// list which is a prefix of 'x' determines whether the file is treated as 152 /// a system header. 153 std::vector<std::pair<std::string, bool> > SystemHeaderPrefixes; 154 155 /// \brief The path to the module cache. 156 std::string ModuleCachePath; 157 158 /// \brief All of the preprocessor-specific data about files that are 159 /// included, indexed by the FileEntry's UID. 160 std::vector<HeaderFileInfo> FileInfo; 161 162 /// \brief Keeps track of each lookup performed by LookupFile. 163 /// 164 /// The first part of the value is the starting index in SearchDirs 165 /// that the cached search was performed from. If there is a hit and 166 /// this value doesn't match the current query, the cache has to be 167 /// ignored. The second value is the entry in SearchDirs that satisfied 168 /// the query. 169 llvm::StringMap<std::pair<unsigned, unsigned>, llvm::BumpPtrAllocator> 170 LookupFileCache; 171 172 /// \brief Collection mapping a framework or subframework 173 /// name like "Carbon" to the Carbon.framework directory. 174 llvm::StringMap<FrameworkCacheEntry, llvm::BumpPtrAllocator> FrameworkMap; 175 176 /// IncludeAliases - maps include file names (including the quotes or 177 /// angle brackets) to other include file names. This is used to support the 178 /// include_alias pragma for Microsoft compatibility. 179 typedef llvm::StringMap<std::string, llvm::BumpPtrAllocator> 180 IncludeAliasMap; 181 OwningPtr<IncludeAliasMap> IncludeAliases; 182 183 /// HeaderMaps - This is a mapping from FileEntry -> HeaderMap, uniquing 184 /// headermaps. This vector owns the headermap. 185 std::vector<std::pair<const FileEntry*, const HeaderMap*> > HeaderMaps; 186 187 /// \brief The mapping between modules and headers. 188 ModuleMap ModMap; 189 190 /// \brief Describes whether a given directory has a module map in it. 191 llvm::DenseMap<const DirectoryEntry *, bool> DirectoryHasModuleMap; 192 193 /// \brief Uniqued set of framework names, which is used to track which 194 /// headers were included as framework headers. 195 llvm::StringSet<llvm::BumpPtrAllocator> FrameworkNames; 196 197 /// \brief Entity used to resolve the identifier IDs of controlling 198 /// macros into IdentifierInfo pointers, as needed. 199 ExternalIdentifierLookup *ExternalLookup; 200 201 /// \brief Entity used to look up stored header file information. 202 ExternalHeaderFileInfoSource *ExternalSource; 203 204 // Various statistics we track for performance analysis. 205 unsigned NumIncluded; 206 unsigned NumMultiIncludeFileOptzn; 207 unsigned NumFrameworkLookups, NumSubFrameworkLookups; 208 209 // HeaderSearch doesn't support default or copy construction. 210 explicit HeaderSearch(); 211 explicit HeaderSearch(const HeaderSearch&); 212 void operator=(const HeaderSearch&); 213 214 friend class DirectoryLookup; 215 216 public: 217 HeaderSearch(FileManager &FM, DiagnosticsEngine &Diags, 218 const LangOptions &LangOpts, const TargetInfo *Target); 219 ~HeaderSearch(); 220 getFileMgr()221 FileManager &getFileMgr() const { return FileMgr; } 222 223 /// \brief Interface for setting the file search paths. SetSearchPaths(const std::vector<DirectoryLookup> & dirs,unsigned angledDirIdx,unsigned systemDirIdx,bool noCurDirSearch)224 void SetSearchPaths(const std::vector<DirectoryLookup> &dirs, 225 unsigned angledDirIdx, unsigned systemDirIdx, 226 bool noCurDirSearch) { 227 assert(angledDirIdx <= systemDirIdx && systemDirIdx <= dirs.size() && 228 "Directory indicies are unordered"); 229 SearchDirs = dirs; 230 AngledDirIdx = angledDirIdx; 231 SystemDirIdx = systemDirIdx; 232 NoCurDirSearch = noCurDirSearch; 233 //LookupFileCache.clear(); 234 } 235 236 /// \brief Add an additional search path. AddSearchPath(const DirectoryLookup & dir,bool isAngled)237 void AddSearchPath(const DirectoryLookup &dir, bool isAngled) { 238 unsigned idx = isAngled ? SystemDirIdx : AngledDirIdx; 239 SearchDirs.insert(SearchDirs.begin() + idx, dir); 240 if (!isAngled) 241 AngledDirIdx++; 242 SystemDirIdx++; 243 } 244 245 /// \brief Set the list of system header prefixes. SetSystemHeaderPrefixes(ArrayRef<std::pair<std::string,bool>> P)246 void SetSystemHeaderPrefixes(ArrayRef<std::pair<std::string, bool> > P) { 247 SystemHeaderPrefixes.assign(P.begin(), P.end()); 248 } 249 250 /// \brief Checks whether the map exists or not. HasIncludeAliasMap()251 bool HasIncludeAliasMap() const { 252 return IncludeAliases; 253 } 254 255 /// \brief Map the source include name to the dest include name. 256 /// 257 /// The Source should include the angle brackets or quotes, the dest 258 /// should not. This allows for distinction between <> and "" headers. AddIncludeAlias(StringRef Source,StringRef Dest)259 void AddIncludeAlias(StringRef Source, StringRef Dest) { 260 if (!IncludeAliases) 261 IncludeAliases.reset(new IncludeAliasMap); 262 (*IncludeAliases)[Source] = Dest; 263 } 264 265 /// MapHeaderToIncludeAlias - Maps one header file name to a different header 266 /// file name, for use with the include_alias pragma. Note that the source 267 /// file name should include the angle brackets or quotes. Returns StringRef 268 /// as null if the header cannot be mapped. MapHeaderToIncludeAlias(StringRef Source)269 StringRef MapHeaderToIncludeAlias(StringRef Source) { 270 assert(IncludeAliases && "Trying to map headers when there's no map"); 271 272 // Do any filename replacements before anything else 273 IncludeAliasMap::const_iterator Iter = IncludeAliases->find(Source); 274 if (Iter != IncludeAliases->end()) 275 return Iter->second; 276 return StringRef(); 277 } 278 279 /// \brief Set the path to the module cache. setModuleCachePath(StringRef CachePath)280 void setModuleCachePath(StringRef CachePath) { 281 ModuleCachePath = CachePath; 282 } 283 284 /// \brief Retrieve the path to the module cache. getModuleCachePath()285 StringRef getModuleCachePath() const { return ModuleCachePath; } 286 287 /// \brief Forget everything we know about headers so far. ClearFileInfo()288 void ClearFileInfo() { 289 FileInfo.clear(); 290 } 291 SetExternalLookup(ExternalIdentifierLookup * EIL)292 void SetExternalLookup(ExternalIdentifierLookup *EIL) { 293 ExternalLookup = EIL; 294 } 295 getExternalLookup()296 ExternalIdentifierLookup *getExternalLookup() const { 297 return ExternalLookup; 298 } 299 300 /// \brief Set the external source of header information. SetExternalSource(ExternalHeaderFileInfoSource * ES)301 void SetExternalSource(ExternalHeaderFileInfoSource *ES) { 302 ExternalSource = ES; 303 } 304 305 /// \brief Set the target information for the header search, if not 306 /// already known. 307 void setTarget(const TargetInfo &Target); 308 309 /// \brief Given a "foo" or \<foo> reference, look up the indicated file, 310 /// return null on failure. 311 /// 312 /// \returns If successful, this returns 'UsedDir', the DirectoryLookup member 313 /// the file was found in, or null if not applicable. 314 /// 315 /// \param isAngled indicates whether the file reference is a <> reference. 316 /// 317 /// \param CurDir If non-null, the file was found in the specified directory 318 /// search location. This is used to implement \#include_next. 319 /// 320 /// \param CurFileEnt If non-null, indicates where the \#including file is, in 321 /// case a relative search is needed. 322 /// 323 /// \param SearchPath If non-null, will be set to the search path relative 324 /// to which the file was found. If the include path is absolute, SearchPath 325 /// will be set to an empty string. 326 /// 327 /// \param RelativePath If non-null, will be set to the path relative to 328 /// SearchPath at which the file was found. This only differs from the 329 /// Filename for framework includes. 330 /// 331 /// \param SuggestedModule If non-null, and the file found is semantically 332 /// part of a known module, this will be set to the module that should 333 /// be imported instead of preprocessing/parsing the file found. 334 const FileEntry *LookupFile(StringRef Filename, bool isAngled, 335 const DirectoryLookup *FromDir, 336 const DirectoryLookup *&CurDir, 337 const FileEntry *CurFileEnt, 338 SmallVectorImpl<char> *SearchPath, 339 SmallVectorImpl<char> *RelativePath, 340 Module **SuggestedModule, 341 bool SkipCache = false); 342 343 /// \brief Look up a subframework for the specified \#include file. 344 /// 345 /// For example, if \#include'ing <HIToolbox/HIToolbox.h> from 346 /// within ".../Carbon.framework/Headers/Carbon.h", check to see if 347 /// HIToolbox is a subframework within Carbon.framework. If so, return 348 /// the FileEntry for the designated file, otherwise return null. 349 const FileEntry *LookupSubframeworkHeader( 350 StringRef Filename, 351 const FileEntry *RelativeFileEnt, 352 SmallVectorImpl<char> *SearchPath, 353 SmallVectorImpl<char> *RelativePath); 354 355 /// \brief Look up the specified framework name in our framework cache. 356 /// \returns The DirectoryEntry it is in if we know, null otherwise. LookupFrameworkCache(StringRef FWName)357 FrameworkCacheEntry &LookupFrameworkCache(StringRef FWName) { 358 return FrameworkMap.GetOrCreateValue(FWName).getValue(); 359 } 360 361 /// \brief Mark the specified file as a target of of a \#include, 362 /// \#include_next, or \#import directive. 363 /// 364 /// \return false if \#including the file will have no effect or true 365 /// if we should include it. 366 bool ShouldEnterIncludeFile(const FileEntry *File, bool isImport); 367 368 369 /// \brief Return whether the specified file is a normal header, 370 /// a system header, or a C++ friendly system header. getFileDirFlavor(const FileEntry * File)371 SrcMgr::CharacteristicKind getFileDirFlavor(const FileEntry *File) { 372 return (SrcMgr::CharacteristicKind)getFileInfo(File).DirInfo; 373 } 374 375 /// \brief Mark the specified file as a "once only" file, e.g. due to 376 /// \#pragma once. MarkFileIncludeOnce(const FileEntry * File)377 void MarkFileIncludeOnce(const FileEntry *File) { 378 HeaderFileInfo &FI = getFileInfo(File); 379 FI.isImport = true; 380 FI.isPragmaOnce = true; 381 } 382 383 /// \brief Mark the specified file as a system header, e.g. due to 384 /// \#pragma GCC system_header. MarkFileSystemHeader(const FileEntry * File)385 void MarkFileSystemHeader(const FileEntry *File) { 386 getFileInfo(File).DirInfo = SrcMgr::C_System; 387 } 388 389 /// \brief Increment the count for the number of times the specified 390 /// FileEntry has been entered. IncrementIncludeCount(const FileEntry * File)391 void IncrementIncludeCount(const FileEntry *File) { 392 ++getFileInfo(File).NumIncludes; 393 } 394 395 /// \brief Mark the specified file as having a controlling macro. 396 /// 397 /// This is used by the multiple-include optimization to eliminate 398 /// no-op \#includes. SetFileControllingMacro(const FileEntry * File,const IdentifierInfo * ControllingMacro)399 void SetFileControllingMacro(const FileEntry *File, 400 const IdentifierInfo *ControllingMacro) { 401 getFileInfo(File).ControllingMacro = ControllingMacro; 402 } 403 404 /// \brief Determine whether this file is intended to be safe from 405 /// multiple inclusions, e.g., it has \#pragma once or a controlling 406 /// macro. 407 /// 408 /// This routine does not consider the effect of \#import 409 bool isFileMultipleIncludeGuarded(const FileEntry *File); 410 411 /// CreateHeaderMap - This method returns a HeaderMap for the specified 412 /// FileEntry, uniquing them through the 'HeaderMaps' datastructure. 413 const HeaderMap *CreateHeaderMap(const FileEntry *FE); 414 415 /// \brief Retrieve the name of the module file that should be used to 416 /// load the given module. 417 /// 418 /// \param Module The module whose module file name will be returned. 419 /// 420 /// \returns The name of the module file that corresponds to this module, 421 /// or an empty string if this module does not correspond to any module file. 422 std::string getModuleFileName(Module *Module); 423 424 /// \brief Retrieve the name of the module file that should be used to 425 /// load a module with the given name. 426 /// 427 /// \param ModuleName The module whose module file name will be returned. 428 /// 429 /// \returns The name of the module file that corresponds to this module, 430 /// or an empty string if this module does not correspond to any module file. 431 std::string getModuleFileName(StringRef ModuleName); 432 433 /// \brief Lookup a module Search for a module with the given name. 434 /// 435 /// \param ModuleName The name of the module we're looking for. 436 /// 437 /// \param AllowSearch Whether we are allowed to search in the various 438 /// search directories to produce a module definition. If not, this lookup 439 /// will only return an already-known module. 440 /// 441 /// \returns The module with the given name. 442 Module *lookupModule(StringRef ModuleName, bool AllowSearch = true); 443 IncrementFrameworkLookupCount()444 void IncrementFrameworkLookupCount() { ++NumFrameworkLookups; } 445 446 /// \brief Determine whether there is a module map that may map the header 447 /// with the given file name to a (sub)module. 448 /// 449 /// \param Filename The name of the file. 450 /// 451 /// \param Root The "root" directory, at which we should stop looking for 452 /// module maps. 453 bool hasModuleMap(StringRef Filename, const DirectoryEntry *Root); 454 455 /// \brief Retrieve the module that corresponds to the given file, if any. 456 /// 457 /// \param File The header that we wish to map to a module. 458 Module *findModuleForHeader(const FileEntry *File); 459 460 /// \brief Read the contents of the given module map file. 461 /// 462 /// \param File The module map file. 463 /// 464 /// \returns true if an error occurred, false otherwise. 465 bool loadModuleMapFile(const FileEntry *File); 466 467 /// \brief Collect the set of all known, top-level modules. 468 /// 469 /// \param Modules Will be filled with the set of known, top-level modules. 470 void collectAllModules(llvm::SmallVectorImpl<Module *> &Modules); 471 472 private: 473 /// \brief Retrieve a module with the given name, which may be part of the 474 /// given framework. 475 /// 476 /// \param Name The name of the module to retrieve. 477 /// 478 /// \param Dir The framework directory (e.g., ModuleName.framework). 479 /// 480 /// \param IsSystem Whether the framework directory is part of the system 481 /// frameworks. 482 /// 483 /// \returns The module, if found; otherwise, null. 484 Module *loadFrameworkModule(StringRef Name, 485 const DirectoryEntry *Dir, 486 bool IsSystem); 487 488 public: 489 /// \brief Retrieve the module map. getModuleMap()490 ModuleMap &getModuleMap() { return ModMap; } 491 header_file_size()492 unsigned header_file_size() const { return FileInfo.size(); } 493 494 // Used by ASTReader. 495 void setHeaderFileInfoForUID(HeaderFileInfo HFI, unsigned UID); 496 497 /// \brief Return the HeaderFileInfo structure for the specified FileEntry. getFileInfo(const FileEntry * FE)498 const HeaderFileInfo &getFileInfo(const FileEntry *FE) const { 499 return const_cast<HeaderSearch*>(this)->getFileInfo(FE); 500 } 501 502 // Used by external tools 503 typedef std::vector<DirectoryLookup>::const_iterator search_dir_iterator; search_dir_begin()504 search_dir_iterator search_dir_begin() const { return SearchDirs.begin(); } search_dir_end()505 search_dir_iterator search_dir_end() const { return SearchDirs.end(); } search_dir_size()506 unsigned search_dir_size() const { return SearchDirs.size(); } 507 quoted_dir_begin()508 search_dir_iterator quoted_dir_begin() const { 509 return SearchDirs.begin(); 510 } quoted_dir_end()511 search_dir_iterator quoted_dir_end() const { 512 return SearchDirs.begin() + AngledDirIdx; 513 } 514 angled_dir_begin()515 search_dir_iterator angled_dir_begin() const { 516 return SearchDirs.begin() + AngledDirIdx; 517 } angled_dir_end()518 search_dir_iterator angled_dir_end() const { 519 return SearchDirs.begin() + SystemDirIdx; 520 } 521 system_dir_begin()522 search_dir_iterator system_dir_begin() const { 523 return SearchDirs.begin() + SystemDirIdx; 524 } system_dir_end()525 search_dir_iterator system_dir_end() const { return SearchDirs.end(); } 526 527 /// \brief Retrieve a uniqued framework name. 528 StringRef getUniqueFrameworkName(StringRef Framework); 529 530 void PrintStats(); 531 532 size_t getTotalMemory() const; 533 534 static std::string NormalizeDashIncludePath(StringRef File, 535 FileManager &FileMgr); 536 537 private: 538 /// \brief Describes what happened when we tried to load a module map file. 539 enum LoadModuleMapResult { 540 /// \brief The module map file had already been loaded. 541 LMM_AlreadyLoaded, 542 /// \brief The module map file was loaded by this invocation. 543 LMM_NewlyLoaded, 544 /// \brief There is was directory with the given name. 545 LMM_NoDirectory, 546 /// \brief There was either no module map file or the module map file was 547 /// invalid. 548 LMM_InvalidModuleMap 549 }; 550 551 /// \brief Try to load the module map file in the given directory. 552 /// 553 /// \param DirName The name of the directory where we will look for a module 554 /// map file. 555 /// 556 /// \returns The result of attempting to load the module map file from the 557 /// named directory. 558 LoadModuleMapResult loadModuleMapFile(StringRef DirName); 559 560 /// \brief Try to load the module map file in the given directory. 561 /// 562 /// \param Dir The directory where we will look for a module map file. 563 /// 564 /// \returns The result of attempting to load the module map file from the 565 /// named directory. 566 LoadModuleMapResult loadModuleMapFile(const DirectoryEntry *Dir); 567 568 /// \brief Return the HeaderFileInfo structure for the specified FileEntry. 569 HeaderFileInfo &getFileInfo(const FileEntry *FE); 570 }; 571 572 } // end namespace clang 573 574 #endif 575