PTHLexer.cpp revision 7ad629ebefa87269cc1887debc83cfa58c285a80
11cb2d742eb6635aeab6132ee5f0b5781d39487d7Nico Weber//===--- PTHLexer.cpp - Lex from a token stream ---------------------------===// 2cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// 3cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// The LLVM Compiler Infrastructure 4cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// 5cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// This file is distributed under the University of Illinois Open Source 6cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// License. See LICENSE.TXT for details. 7cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// 8cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain//===----------------------------------------------------------------------===// 9cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// 10cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// This file implements the PTHLexer interface. 11cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain// 12cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain//===----------------------------------------------------------------------===// 13cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain 14cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Basic/TokenKinds.h" 15cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Basic/FileManager.h" 16cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Basic/IdentifierTable.h" 17cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Basic/OnDiskHashTable.h" 18cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Lex/LexDiagnostic.h" 19cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Lex/PTHLexer.h" 20cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Lex/Preprocessor.h" 21cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Lex/PTHManager.h" 22cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Lex/Token.h" 23cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "clang/Lex/Preprocessor.h" 24cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "llvm/ADT/OwningPtr.h" 25cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "llvm/ADT/StringExtras.h" 26cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "llvm/ADT/StringMap.h" 27cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include "llvm/Support/MemoryBuffer.h" 28cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#include <sys/stat.h> 29cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrainusing namespace clang; 30cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrainusing namespace clang::io; 31cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain 32cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain#define DISK_TOKEN_SIZE (1+1+2+4+4) 33cd9ae488ede3e26e65fe173ae90b489ce45c8b6aKaelyn Uhrain 34//===----------------------------------------------------------------------===// 35// PTHLexer methods. 36//===----------------------------------------------------------------------===// 37 38PTHLexer::PTHLexer(Preprocessor &PP, FileID FID, const unsigned char *D, 39 const unsigned char *ppcond, PTHManager &PM) 40 : PreprocessorLexer(&PP, FID), TokBuf(D), CurPtr(D), LastHashTokPtr(0), 41 PPCond(ppcond), CurPPCondPtr(ppcond), PTHMgr(PM) { 42 43 FileStartLoc = PP.getSourceManager().getLocForStartOfFile(FID); 44} 45 46void PTHLexer::Lex(Token& Tok) { 47LexNextToken: 48 49 //===--------------------------------------==// 50 // Read the raw token data. 51 //===--------------------------------------==// 52 53 // Shadow CurPtr into an automatic variable. 54 const unsigned char *CurPtrShadow = CurPtr; 55 56 // Read in the data for the token. 57 unsigned Word0 = ReadLE32(CurPtrShadow); 58 uint32_t IdentifierID = ReadLE32(CurPtrShadow); 59 uint32_t FileOffset = ReadLE32(CurPtrShadow); 60 61 tok::TokenKind TKind = (tok::TokenKind) (Word0 & 0xFF); 62 Token::TokenFlags TFlags = (Token::TokenFlags) ((Word0 >> 8) & 0xFF); 63 uint32_t Len = Word0 >> 16; 64 65 CurPtr = CurPtrShadow; 66 67 //===--------------------------------------==// 68 // Construct the token itself. 69 //===--------------------------------------==// 70 71 Tok.startToken(); 72 Tok.setKind(TKind); 73 Tok.setFlag(TFlags); 74 assert(!LexingRawMode); 75 Tok.setLocation(FileStartLoc.getFileLocWithOffset(FileOffset)); 76 Tok.setLength(Len); 77 78 // Handle identifiers. 79 if (Tok.isLiteral()) { 80 Tok.setLiteralData((const char*) (PTHMgr.SpellingBase + IdentifierID)); 81 } 82 else if (IdentifierID) { 83 MIOpt.ReadToken(); 84 IdentifierInfo *II = PTHMgr.GetIdentifierInfo(IdentifierID-1); 85 86 Tok.setIdentifierInfo(II); 87 88 // Change the kind of this identifier to the appropriate token kind, e.g. 89 // turning "for" into a keyword. 90 Tok.setKind(II->getTokenID()); 91 92 if (II->isHandleIdentifierCase()) 93 PP->HandleIdentifier(Tok); 94 return; 95 } 96 97 //===--------------------------------------==// 98 // Process the token. 99 //===--------------------------------------==// 100 if (TKind == tok::eof) { 101 // Save the end-of-file token. 102 EofToken = Tok; 103 104 // Save 'PP' to 'PPCache' as LexEndOfFile can delete 'this'. 105 Preprocessor *PPCache = PP; 106 107 assert(!ParsingPreprocessorDirective); 108 assert(!LexingRawMode); 109 110 if (LexEndOfFile(Tok)) 111 return; 112 113 return PPCache->Lex(Tok); 114 } 115 116 if (TKind == tok::hash && Tok.isAtStartOfLine()) { 117 LastHashTokPtr = CurPtr - DISK_TOKEN_SIZE; 118 assert(!LexingRawMode); 119 PP->HandleDirective(Tok); 120 121 if (PP->isCurrentLexer(this)) 122 goto LexNextToken; 123 124 return PP->Lex(Tok); 125 } 126 127 if (TKind == tok::eom) { 128 assert(ParsingPreprocessorDirective); 129 ParsingPreprocessorDirective = false; 130 return; 131 } 132 133 MIOpt.ReadToken(); 134} 135 136bool PTHLexer::LexEndOfFile(Token &Result) { 137 // If we hit the end of the file while parsing a preprocessor directive, 138 // end the preprocessor directive first. The next token returned will 139 // then be the end of file. 140 if (ParsingPreprocessorDirective) { 141 ParsingPreprocessorDirective = false; // Done parsing the "line". 142 return true; // Have a token. 143 } 144 145 assert(!LexingRawMode); 146 147 // If we are in a #if directive, emit an error. 148 while (!ConditionalStack.empty()) { 149 if (!PP->isCodeCompletionFile(FileStartLoc)) 150 PP->Diag(ConditionalStack.back().IfLoc, 151 diag::err_pp_unterminated_conditional); 152 ConditionalStack.pop_back(); 153 } 154 155 // Finally, let the preprocessor handle this. 156 return PP->HandleEndOfFile(Result); 157} 158 159// FIXME: We can just grab the last token instead of storing a copy 160// into EofToken. 161void PTHLexer::getEOF(Token& Tok) { 162 assert(EofToken.is(tok::eof)); 163 Tok = EofToken; 164} 165 166void PTHLexer::DiscardToEndOfLine() { 167 assert(ParsingPreprocessorDirective && ParsingFilename == false && 168 "Must be in a preprocessing directive!"); 169 170 // We assume that if the preprocessor wishes to discard to the end of 171 // the line that it also means to end the current preprocessor directive. 172 ParsingPreprocessorDirective = false; 173 174 // Skip tokens by only peeking at their token kind and the flags. 175 // We don't need to actually reconstruct full tokens from the token buffer. 176 // This saves some copies and it also reduces IdentifierInfo* lookup. 177 const unsigned char* p = CurPtr; 178 while (1) { 179 // Read the token kind. Are we at the end of the file? 180 tok::TokenKind x = (tok::TokenKind) (uint8_t) *p; 181 if (x == tok::eof) break; 182 183 // Read the token flags. Are we at the start of the next line? 184 Token::TokenFlags y = (Token::TokenFlags) (uint8_t) p[1]; 185 if (y & Token::StartOfLine) break; 186 187 // Skip to the next token. 188 p += DISK_TOKEN_SIZE; 189 } 190 191 CurPtr = p; 192} 193 194/// SkipBlock - Used by Preprocessor to skip the current conditional block. 195bool PTHLexer::SkipBlock() { 196 assert(CurPPCondPtr && "No cached PP conditional information."); 197 assert(LastHashTokPtr && "No known '#' token."); 198 199 const unsigned char* HashEntryI = 0; 200 uint32_t Offset; 201 uint32_t TableIdx; 202 203 do { 204 // Read the token offset from the side-table. 205 Offset = ReadLE32(CurPPCondPtr); 206 207 // Read the target table index from the side-table. 208 TableIdx = ReadLE32(CurPPCondPtr); 209 210 // Compute the actual memory address of the '#' token data for this entry. 211 HashEntryI = TokBuf + Offset; 212 213 // Optmization: "Sibling jumping". #if...#else...#endif blocks can 214 // contain nested blocks. In the side-table we can jump over these 215 // nested blocks instead of doing a linear search if the next "sibling" 216 // entry is not at a location greater than LastHashTokPtr. 217 if (HashEntryI < LastHashTokPtr && TableIdx) { 218 // In the side-table we are still at an entry for a '#' token that 219 // is earlier than the last one we saw. Check if the location we would 220 // stride gets us closer. 221 const unsigned char* NextPPCondPtr = 222 PPCond + TableIdx*(sizeof(uint32_t)*2); 223 assert(NextPPCondPtr >= CurPPCondPtr); 224 // Read where we should jump to. 225 uint32_t TmpOffset = ReadLE32(NextPPCondPtr); 226 const unsigned char* HashEntryJ = TokBuf + TmpOffset; 227 228 if (HashEntryJ <= LastHashTokPtr) { 229 // Jump directly to the next entry in the side table. 230 HashEntryI = HashEntryJ; 231 Offset = TmpOffset; 232 TableIdx = ReadLE32(NextPPCondPtr); 233 CurPPCondPtr = NextPPCondPtr; 234 } 235 } 236 } 237 while (HashEntryI < LastHashTokPtr); 238 assert(HashEntryI == LastHashTokPtr && "No PP-cond entry found for '#'"); 239 assert(TableIdx && "No jumping from #endifs."); 240 241 // Update our side-table iterator. 242 const unsigned char* NextPPCondPtr = PPCond + TableIdx*(sizeof(uint32_t)*2); 243 assert(NextPPCondPtr >= CurPPCondPtr); 244 CurPPCondPtr = NextPPCondPtr; 245 246 // Read where we should jump to. 247 HashEntryI = TokBuf + ReadLE32(NextPPCondPtr); 248 uint32_t NextIdx = ReadLE32(NextPPCondPtr); 249 250 // By construction NextIdx will be zero if this is a #endif. This is useful 251 // to know to obviate lexing another token. 252 bool isEndif = NextIdx == 0; 253 254 // This case can occur when we see something like this: 255 // 256 // #if ... 257 // /* a comment or nothing */ 258 // #elif 259 // 260 // If we are skipping the first #if block it will be the case that CurPtr 261 // already points 'elif'. Just return. 262 263 if (CurPtr > HashEntryI) { 264 assert(CurPtr == HashEntryI + DISK_TOKEN_SIZE); 265 // Did we reach a #endif? If so, go ahead and consume that token as well. 266 if (isEndif) 267 CurPtr += DISK_TOKEN_SIZE*2; 268 else 269 LastHashTokPtr = HashEntryI; 270 271 return isEndif; 272 } 273 274 // Otherwise, we need to advance. Update CurPtr to point to the '#' token. 275 CurPtr = HashEntryI; 276 277 // Update the location of the last observed '#'. This is useful if we 278 // are skipping multiple blocks. 279 LastHashTokPtr = CurPtr; 280 281 // Skip the '#' token. 282 assert(((tok::TokenKind)*CurPtr) == tok::hash); 283 CurPtr += DISK_TOKEN_SIZE; 284 285 // Did we reach a #endif? If so, go ahead and consume that token as well. 286 if (isEndif) { CurPtr += DISK_TOKEN_SIZE*2; } 287 288 return isEndif; 289} 290 291SourceLocation PTHLexer::getSourceLocation() { 292 // getSourceLocation is not on the hot path. It is used to get the location 293 // of the next token when transitioning back to this lexer when done 294 // handling a #included file. Just read the necessary data from the token 295 // data buffer to construct the SourceLocation object. 296 // NOTE: This is a virtual function; hence it is defined out-of-line. 297 const unsigned char *OffsetPtr = CurPtr + (DISK_TOKEN_SIZE - 4); 298 uint32_t Offset = ReadLE32(OffsetPtr); 299 return FileStartLoc.getFileLocWithOffset(Offset); 300} 301 302//===----------------------------------------------------------------------===// 303// PTH file lookup: map from strings to file data. 304//===----------------------------------------------------------------------===// 305 306/// PTHFileLookup - This internal data structure is used by the PTHManager 307/// to map from FileEntry objects managed by FileManager to offsets within 308/// the PTH file. 309namespace { 310class PTHFileData { 311 const uint32_t TokenOff; 312 const uint32_t PPCondOff; 313public: 314 PTHFileData(uint32_t tokenOff, uint32_t ppCondOff) 315 : TokenOff(tokenOff), PPCondOff(ppCondOff) {} 316 317 uint32_t getTokenOffset() const { return TokenOff; } 318 uint32_t getPPCondOffset() const { return PPCondOff; } 319}; 320 321 322class PTHFileLookupCommonTrait { 323public: 324 typedef std::pair<unsigned char, const char*> internal_key_type; 325 326 static unsigned ComputeHash(internal_key_type x) { 327 return llvm::HashString(x.second); 328 } 329 330 static std::pair<unsigned, unsigned> 331 ReadKeyDataLength(const unsigned char*& d) { 332 unsigned keyLen = (unsigned) ReadUnalignedLE16(d); 333 unsigned dataLen = (unsigned) *(d++); 334 return std::make_pair(keyLen, dataLen); 335 } 336 337 static internal_key_type ReadKey(const unsigned char* d, unsigned) { 338 unsigned char k = *(d++); // Read the entry kind. 339 return std::make_pair(k, (const char*) d); 340 } 341}; 342 343class PTHFileLookupTrait : public PTHFileLookupCommonTrait { 344public: 345 typedef const FileEntry* external_key_type; 346 typedef PTHFileData data_type; 347 348 static internal_key_type GetInternalKey(const FileEntry* FE) { 349 return std::make_pair((unsigned char) 0x1, FE->getName()); 350 } 351 352 static bool EqualKey(internal_key_type a, internal_key_type b) { 353 return a.first == b.first && strcmp(a.second, b.second) == 0; 354 } 355 356 static PTHFileData ReadData(const internal_key_type& k, 357 const unsigned char* d, unsigned) { 358 assert(k.first == 0x1 && "Only file lookups can match!"); 359 uint32_t x = ::ReadUnalignedLE32(d); 360 uint32_t y = ::ReadUnalignedLE32(d); 361 return PTHFileData(x, y); 362 } 363}; 364 365class PTHStringLookupTrait { 366public: 367 typedef uint32_t 368 data_type; 369 370 typedef const std::pair<const char*, unsigned> 371 external_key_type; 372 373 typedef external_key_type internal_key_type; 374 375 static bool EqualKey(const internal_key_type& a, 376 const internal_key_type& b) { 377 return (a.second == b.second) ? memcmp(a.first, b.first, a.second) == 0 378 : false; 379 } 380 381 static unsigned ComputeHash(const internal_key_type& a) { 382 return llvm::HashString(llvm::StringRef(a.first, a.second)); 383 } 384 385 // This hopefully will just get inlined and removed by the optimizer. 386 static const internal_key_type& 387 GetInternalKey(const external_key_type& x) { return x; } 388 389 static std::pair<unsigned, unsigned> 390 ReadKeyDataLength(const unsigned char*& d) { 391 return std::make_pair((unsigned) ReadUnalignedLE16(d), sizeof(uint32_t)); 392 } 393 394 static std::pair<const char*, unsigned> 395 ReadKey(const unsigned char* d, unsigned n) { 396 assert(n >= 2 && d[n-1] == '\0'); 397 return std::make_pair((const char*) d, n-1); 398 } 399 400 static uint32_t ReadData(const internal_key_type& k, const unsigned char* d, 401 unsigned) { 402 return ::ReadUnalignedLE32(d); 403 } 404}; 405 406} // end anonymous namespace 407 408typedef OnDiskChainedHashTable<PTHFileLookupTrait> PTHFileLookup; 409typedef OnDiskChainedHashTable<PTHStringLookupTrait> PTHStringIdLookup; 410 411//===----------------------------------------------------------------------===// 412// PTHManager methods. 413//===----------------------------------------------------------------------===// 414 415PTHManager::PTHManager(const llvm::MemoryBuffer* buf, void* fileLookup, 416 const unsigned char* idDataTable, 417 IdentifierInfo** perIDCache, 418 void* stringIdLookup, unsigned numIds, 419 const unsigned char* spellingBase, 420 const char* originalSourceFile) 421: Buf(buf), PerIDCache(perIDCache), FileLookup(fileLookup), 422 IdDataTable(idDataTable), StringIdLookup(stringIdLookup), 423 NumIds(numIds), PP(0), SpellingBase(spellingBase), 424 OriginalSourceFile(originalSourceFile) {} 425 426PTHManager::~PTHManager() { 427 delete Buf; 428 delete (PTHFileLookup*) FileLookup; 429 delete (PTHStringIdLookup*) StringIdLookup; 430 free(PerIDCache); 431} 432 433static void InvalidPTH(Diagnostic &Diags, const char *Msg) { 434 Diags.Report(Diags.getCustomDiagID(Diagnostic::Error, Msg)); 435} 436 437PTHManager *PTHManager::Create(const std::string &file, FileManager &FileMgr, 438 const FileSystemOptions &FSOpts, 439 Diagnostic &Diags) { 440 // Memory map the PTH file. 441 llvm::OwningPtr<llvm::MemoryBuffer> 442 File(FileMgr.getBufferForFile(file, FSOpts)); 443 444 if (!File) { 445 Diags.Report(diag::err_invalid_pth_file) << file; 446 return 0; 447 } 448 449 // Get the buffer ranges and check if there are at least three 32-bit 450 // words at the end of the file. 451 const unsigned char *BufBeg = (unsigned char*)File->getBufferStart(); 452 const unsigned char *BufEnd = (unsigned char*)File->getBufferEnd(); 453 454 // Check the prologue of the file. 455 if ((BufEnd - BufBeg) < (signed)(sizeof("cfe-pth") + 3 + 4) || 456 memcmp(BufBeg, "cfe-pth", sizeof("cfe-pth") - 1) != 0) { 457 Diags.Report(diag::err_invalid_pth_file) << file; 458 return 0; 459 } 460 461 // Read the PTH version. 462 const unsigned char *p = BufBeg + (sizeof("cfe-pth") - 1); 463 unsigned Version = ReadLE32(p); 464 465 if (Version < PTHManager::Version) { 466 InvalidPTH(Diags, 467 Version < PTHManager::Version 468 ? "PTH file uses an older PTH format that is no longer supported" 469 : "PTH file uses a newer PTH format that cannot be read"); 470 return 0; 471 } 472 473 // Compute the address of the index table at the end of the PTH file. 474 const unsigned char *PrologueOffset = p; 475 476 if (PrologueOffset >= BufEnd) { 477 Diags.Report(diag::err_invalid_pth_file) << file; 478 return 0; 479 } 480 481 // Construct the file lookup table. This will be used for mapping from 482 // FileEntry*'s to cached tokens. 483 const unsigned char* FileTableOffset = PrologueOffset + sizeof(uint32_t)*2; 484 const unsigned char* FileTable = BufBeg + ReadLE32(FileTableOffset); 485 486 if (!(FileTable > BufBeg && FileTable < BufEnd)) { 487 Diags.Report(diag::err_invalid_pth_file) << file; 488 return 0; // FIXME: Proper error diagnostic? 489 } 490 491 llvm::OwningPtr<PTHFileLookup> FL(PTHFileLookup::Create(FileTable, BufBeg)); 492 493 // Warn if the PTH file is empty. We still want to create a PTHManager 494 // as the PTH could be used with -include-pth. 495 if (FL->isEmpty()) 496 InvalidPTH(Diags, "PTH file contains no cached source data"); 497 498 // Get the location of the table mapping from persistent ids to the 499 // data needed to reconstruct identifiers. 500 const unsigned char* IDTableOffset = PrologueOffset + sizeof(uint32_t)*0; 501 const unsigned char* IData = BufBeg + ReadLE32(IDTableOffset); 502 503 if (!(IData >= BufBeg && IData < BufEnd)) { 504 Diags.Report(diag::err_invalid_pth_file) << file; 505 return 0; 506 } 507 508 // Get the location of the hashtable mapping between strings and 509 // persistent IDs. 510 const unsigned char* StringIdTableOffset = PrologueOffset + sizeof(uint32_t)*1; 511 const unsigned char* StringIdTable = BufBeg + ReadLE32(StringIdTableOffset); 512 if (!(StringIdTable >= BufBeg && StringIdTable < BufEnd)) { 513 Diags.Report(diag::err_invalid_pth_file) << file; 514 return 0; 515 } 516 517 llvm::OwningPtr<PTHStringIdLookup> SL(PTHStringIdLookup::Create(StringIdTable, 518 BufBeg)); 519 520 // Get the location of the spelling cache. 521 const unsigned char* spellingBaseOffset = PrologueOffset + sizeof(uint32_t)*3; 522 const unsigned char* spellingBase = BufBeg + ReadLE32(spellingBaseOffset); 523 if (!(spellingBase >= BufBeg && spellingBase < BufEnd)) { 524 Diags.Report(diag::err_invalid_pth_file) << file; 525 return 0; 526 } 527 528 // Get the number of IdentifierInfos and pre-allocate the identifier cache. 529 uint32_t NumIds = ReadLE32(IData); 530 531 // Pre-allocate the peristent ID -> IdentifierInfo* cache. We use calloc() 532 // so that we in the best case only zero out memory once when the OS returns 533 // us new pages. 534 IdentifierInfo** PerIDCache = 0; 535 536 if (NumIds) { 537 PerIDCache = (IdentifierInfo**)calloc(NumIds, sizeof(*PerIDCache)); 538 if (!PerIDCache) { 539 InvalidPTH(Diags, "Could not allocate memory for processing PTH file"); 540 return 0; 541 } 542 } 543 544 // Compute the address of the original source file. 545 const unsigned char* originalSourceBase = PrologueOffset + sizeof(uint32_t)*4; 546 unsigned len = ReadUnalignedLE16(originalSourceBase); 547 if (!len) originalSourceBase = 0; 548 549 // Create the new PTHManager. 550 return new PTHManager(File.take(), FL.take(), IData, PerIDCache, 551 SL.take(), NumIds, spellingBase, 552 (const char*) originalSourceBase); 553} 554 555IdentifierInfo* PTHManager::LazilyCreateIdentifierInfo(unsigned PersistentID) { 556 // Look in the PTH file for the string data for the IdentifierInfo object. 557 const unsigned char* TableEntry = IdDataTable + sizeof(uint32_t)*PersistentID; 558 const unsigned char* IDData = 559 (const unsigned char*)Buf->getBufferStart() + ReadLE32(TableEntry); 560 assert(IDData < (const unsigned char*)Buf->getBufferEnd()); 561 562 // Allocate the object. 563 std::pair<IdentifierInfo,const unsigned char*> *Mem = 564 Alloc.Allocate<std::pair<IdentifierInfo,const unsigned char*> >(); 565 566 Mem->second = IDData; 567 assert(IDData[0] != '\0'); 568 IdentifierInfo *II = new ((void*) Mem) IdentifierInfo(); 569 570 // Store the new IdentifierInfo in the cache. 571 PerIDCache[PersistentID] = II; 572 assert(II->getNameStart() && II->getNameStart()[0] != '\0'); 573 return II; 574} 575 576IdentifierInfo* PTHManager::get(llvm::StringRef Name) { 577 PTHStringIdLookup& SL = *((PTHStringIdLookup*)StringIdLookup); 578 // Double check our assumption that the last character isn't '\0'. 579 assert(Name.empty() || Name.data()[Name.size()-1] != '\0'); 580 PTHStringIdLookup::iterator I = SL.find(std::make_pair(Name.data(), 581 Name.size())); 582 if (I == SL.end()) // No identifier found? 583 return 0; 584 585 // Match found. Return the identifier! 586 assert(*I > 0); 587 return GetIdentifierInfo(*I-1); 588} 589 590PTHLexer *PTHManager::CreateLexer(FileID FID) { 591 const FileEntry *FE = PP->getSourceManager().getFileEntryForID(FID); 592 if (!FE) 593 return 0; 594 595 // Lookup the FileEntry object in our file lookup data structure. It will 596 // return a variant that indicates whether or not there is an offset within 597 // the PTH file that contains cached tokens. 598 PTHFileLookup& PFL = *((PTHFileLookup*)FileLookup); 599 PTHFileLookup::iterator I = PFL.find(FE); 600 601 if (I == PFL.end()) // No tokens available? 602 return 0; 603 604 const PTHFileData& FileData = *I; 605 606 const unsigned char *BufStart = (const unsigned char *)Buf->getBufferStart(); 607 // Compute the offset of the token data within the buffer. 608 const unsigned char* data = BufStart + FileData.getTokenOffset(); 609 610 // Get the location of pp-conditional table. 611 const unsigned char* ppcond = BufStart + FileData.getPPCondOffset(); 612 uint32_t Len = ReadLE32(ppcond); 613 if (Len == 0) ppcond = 0; 614 615 assert(PP && "No preprocessor set yet!"); 616 return new PTHLexer(*PP, FID, data, ppcond, *this); 617} 618 619//===----------------------------------------------------------------------===// 620// 'stat' caching. 621//===----------------------------------------------------------------------===// 622 623namespace { 624class PTHStatData { 625public: 626 const bool hasStat; 627 const ino_t ino; 628 const dev_t dev; 629 const mode_t mode; 630 const time_t mtime; 631 const off_t size; 632 633 PTHStatData(ino_t i, dev_t d, mode_t mo, time_t m, off_t s) 634 : hasStat(true), ino(i), dev(d), mode(mo), mtime(m), size(s) {} 635 636 PTHStatData() 637 : hasStat(false), ino(0), dev(0), mode(0), mtime(0), size(0) {} 638}; 639 640class PTHStatLookupTrait : public PTHFileLookupCommonTrait { 641public: 642 typedef const char* external_key_type; // const char* 643 typedef PTHStatData data_type; 644 645 static internal_key_type GetInternalKey(const char *path) { 646 // The key 'kind' doesn't matter here because it is ignored in EqualKey. 647 return std::make_pair((unsigned char) 0x0, path); 648 } 649 650 static bool EqualKey(internal_key_type a, internal_key_type b) { 651 // When doing 'stat' lookups we don't care about the kind of 'a' and 'b', 652 // just the paths. 653 return strcmp(a.second, b.second) == 0; 654 } 655 656 static data_type ReadData(const internal_key_type& k, const unsigned char* d, 657 unsigned) { 658 659 if (k.first /* File or Directory */) { 660 if (k.first == 0x1 /* File */) d += 4 * 2; // Skip the first 2 words. 661 ino_t ino = (ino_t) ReadUnalignedLE32(d); 662 dev_t dev = (dev_t) ReadUnalignedLE32(d); 663 mode_t mode = (mode_t) ReadUnalignedLE16(d); 664 time_t mtime = (time_t) ReadUnalignedLE64(d); 665 return data_type(ino, dev, mode, mtime, (off_t) ReadUnalignedLE64(d)); 666 } 667 668 // Negative stat. Don't read anything. 669 return data_type(); 670 } 671}; 672 673class PTHStatCache : public StatSysCallCache { 674 typedef OnDiskChainedHashTable<PTHStatLookupTrait> CacheTy; 675 CacheTy Cache; 676 677public: 678 PTHStatCache(PTHFileLookup &FL) : 679 Cache(FL.getNumBuckets(), FL.getNumEntries(), FL.getBuckets(), 680 FL.getBase()) {} 681 682 ~PTHStatCache() {} 683 684 int stat(const char *path, struct stat *buf) { 685 // Do the lookup for the file's data in the PTH file. 686 CacheTy::iterator I = Cache.find(path); 687 688 // If we don't get a hit in the PTH file just forward to 'stat'. 689 if (I == Cache.end()) 690 return StatSysCallCache::stat(path, buf); 691 692 const PTHStatData& Data = *I; 693 694 if (!Data.hasStat) 695 return 1; 696 697 buf->st_ino = Data.ino; 698 buf->st_dev = Data.dev; 699 buf->st_mtime = Data.mtime; 700 buf->st_mode = Data.mode; 701 buf->st_size = Data.size; 702 return 0; 703 } 704}; 705} // end anonymous namespace 706 707StatSysCallCache *PTHManager::createStatCache() { 708 return new PTHStatCache(*((PTHFileLookup*) FileLookup)); 709} 710