PTHLexer.cpp revision 7ad629ebefa87269cc1887debc83cfa58c285a80
1274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//===--- PTHLexer.cpp - Lex from a token stream ---------------------------===//
2274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//
3274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//                     The LLVM Compiler Infrastructure
4274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//
5274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek// This file is distributed under the University of Illinois Open Source
6274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek// License. See LICENSE.TXT for details.
7274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//
8274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//===----------------------------------------------------------------------===//
9274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//
10274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek// This file implements the PTHLexer interface.
11274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//
12274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek//===----------------------------------------------------------------------===//
13274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek
140c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "clang/Basic/TokenKinds.h"
150c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "clang/Basic/FileManager.h"
160c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "clang/Basic/IdentifierTable.h"
179378ba44b3f46d697653003c784be87746e138d2Douglas Gregor#include "clang/Basic/OnDiskHashTable.h"
183574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar#include "clang/Lex/LexDiagnostic.h"
19274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek#include "clang/Lex/PTHLexer.h"
20274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek#include "clang/Lex/Preprocessor.h"
210c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "clang/Lex/PTHManager.h"
220c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "clang/Lex/Token.h"
230c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "clang/Lex/Preprocessor.h"
240c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek#include "llvm/ADT/OwningPtr.h"
252596e429a61602312bdd149786045b8a90cd2d10Daniel Dunbar#include "llvm/ADT/StringExtras.h"
262596e429a61602312bdd149786045b8a90cd2d10Daniel Dunbar#include "llvm/ADT/StringMap.h"
276f78c3b8b9343e7e9fbf2d457cccf00df6da5d47Chris Lattner#include "llvm/Support/MemoryBuffer.h"
28337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek#include <sys/stat.h>
29274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenekusing namespace clang;
309378ba44b3f46d697653003c784be87746e138d2Douglas Gregorusing namespace clang::io;
31274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek
/// DISK_TOKEN_SIZE - Number of bytes occupied by one serialized token in the
/// PTH token buffer: a 1-byte token kind, a 1-byte flags field and a 2-byte
/// length (decoded together as one little-endian 32-bit word), followed by a
/// 4-byte identifier ID / spelling offset and a 4-byte file offset.
#define DISK_TOKEN_SIZE (1 + 1 + 2 + 4 + 4)
33268ee7016a2811803989487c0ad3799486092c63Ted Kremenek
34e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek//===----------------------------------------------------------------------===//
35e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek// PTHLexer methods.
36e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek//===----------------------------------------------------------------------===//
37e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek
38da9d61c96c412f6babc7f824152609562f302388Chris LattnerPTHLexer::PTHLexer(Preprocessor &PP, FileID FID, const unsigned char *D,
39277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek                   const unsigned char *ppcond, PTHManager &PM)
402b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  : PreprocessorLexer(&PP, FID), TokBuf(D), CurPtr(D), LastHashTokPtr(0),
41277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek    PPCond(ppcond), CurPPCondPtr(ppcond), PTHMgr(PM) {
421eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
432b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  FileStartLoc = PP.getSourceManager().getLocForStartOfFile(FID);
445f074266cc59563036c40516c814d63825723e20Ted Kremenek}
45274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek
46e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenekvoid PTHLexer::Lex(Token& Tok) {
47e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted KremenekLexNextToken:
48866bdf74547efe32c320554837ffce00fcc084feTed Kremenek
49866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  //===--------------------------------------==//
50866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  // Read the raw token data.
51866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  //===--------------------------------------==//
521eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
53866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  // Shadow CurPtr into an automatic variable.
541eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  const unsigned char *CurPtrShadow = CurPtr;
55866bdf74547efe32c320554837ffce00fcc084feTed Kremenek
561b5285e1ba31975864da356b2ed927e87670e654Chris Lattner  // Read in the data for the token.
575ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  unsigned Word0 = ReadLE32(CurPtrShadow);
585ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  uint32_t IdentifierID = ReadLE32(CurPtrShadow);
595ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  uint32_t FileOffset = ReadLE32(CurPtrShadow);
601eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
617b78b7c6d96deb1e63f8d0655ee6fa53de0b65efTed Kremenek  tok::TokenKind TKind = (tok::TokenKind) (Word0 & 0xFF);
627b78b7c6d96deb1e63f8d0655ee6fa53de0b65efTed Kremenek  Token::TokenFlags TFlags = (Token::TokenFlags) ((Word0 >> 8) & 0xFF);
63aff6ef8e7bc3c3739f984c390e0af693e60be064Chris Lattner  uint32_t Len = Word0 >> 16;
647b78b7c6d96deb1e63f8d0655ee6fa53de0b65efTed Kremenek
65aff6ef8e7bc3c3739f984c390e0af693e60be064Chris Lattner  CurPtr = CurPtrShadow;
661eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
67866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  //===--------------------------------------==//
68866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  // Construct the token itself.
69866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  //===--------------------------------------==//
701eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
71866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  Tok.startToken();
72898a0bb1972efb6e03cb1151412ec7392cef07deChris Lattner  Tok.setKind(TKind);
73898a0bb1972efb6e03cb1151412ec7392cef07deChris Lattner  Tok.setFlag(TFlags);
7459d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek  assert(!LexingRawMode);
752b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  Tok.setLocation(FileStartLoc.getFileLocWithOffset(FileOffset));
76866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  Tok.setLength(Len);
7789d7ee9619d2dbdfa8d956a695c612a104a92cadTed Kremenek
78d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner  // Handle identifiers.
79277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  if (Tok.isLiteral()) {
80277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek    Tok.setLiteralData((const char*) (PTHMgr.SpellingBase + IdentifierID));
81277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  }
82277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  else if (IdentifierID) {
83d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner    MIOpt.ReadToken();
84d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner    IdentifierInfo *II = PTHMgr.GetIdentifierInfo(IdentifierID-1);
851eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
86d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner    Tok.setIdentifierInfo(II);
871eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
88863c486fcb6162495a94fddf7ac8409de2638995Chris Lattner    // Change the kind of this identifier to the appropriate token kind, e.g.
89863c486fcb6162495a94fddf7ac8409de2638995Chris Lattner    // turning "for" into a keyword.
90863c486fcb6162495a94fddf7ac8409de2638995Chris Lattner    Tok.setKind(II->getTokenID());
911eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
92d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner    if (II->isHandleIdentifierCase())
93d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner      PP->HandleIdentifier(Tok);
94d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner    return;
95d0a69696acca62798dfc8b98f97c92bfa7fa0490Chris Lattner  }
961eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
97866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  //===--------------------------------------==//
98866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  // Process the token.
99866bdf74547efe32c320554837ffce00fcc084feTed Kremenek  //===--------------------------------------==//
100898a0bb1972efb6e03cb1151412ec7392cef07deChris Lattner  if (TKind == tok::eof) {
101e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek    // Save the end-of-file token.
102e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek    EofToken = Tok;
1031eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
10494e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek    // Save 'PP' to 'PPCache' as LexEndOfFile can delete 'this'.
105cd4e2aecde5bb7810715d5d5a88ac63ce7946f34Ted Kremenek    Preprocessor *PPCache = PP;
1061eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
10759d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    assert(!ParsingPreprocessorDirective);
10859d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    assert(!LexingRawMode);
10994e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek
11094e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek    if (LexEndOfFile(Tok))
111d6f53dc4951aace69014619761760addac9e59ecTed Kremenek      return;
1121eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
113cd4e2aecde5bb7810715d5d5a88ac63ce7946f34Ted Kremenek    return PPCache->Lex(Tok);
114cd4e2aecde5bb7810715d5d5a88ac63ce7946f34Ted Kremenek  }
1151eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
116898a0bb1972efb6e03cb1151412ec7392cef07deChris Lattner  if (TKind == tok::hash && Tok.isAtStartOfLine()) {
11759d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    LastHashTokPtr = CurPtr - DISK_TOKEN_SIZE;
11859d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    assert(!LexingRawMode);
11959d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    PP->HandleDirective(Tok);
1201eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
12159d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    if (PP->isCurrentLexer(this))
12259d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek      goto LexNextToken;
1231eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
12459d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    return PP->Lex(Tok);
125e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  }
1261eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
127898a0bb1972efb6e03cb1151412ec7392cef07deChris Lattner  if (TKind == tok::eom) {
12859d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    assert(ParsingPreprocessorDirective);
12959d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    ParsingPreprocessorDirective = false;
13059d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek    return;
13159d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek  }
132274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek
13359d08cb672136322375e5400578ee1fbd0947de2Ted Kremenek  MIOpt.ReadToken();
134cd4e2aecde5bb7810715d5d5a88ac63ce7946f34Ted Kremenek}
135cd4e2aecde5bb7810715d5d5a88ac63ce7946f34Ted Kremenek
13694e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenekbool PTHLexer::LexEndOfFile(Token &Result) {
13794e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  // If we hit the end of the file while parsing a preprocessor directive,
13894e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  // end the preprocessor directive first.  The next token returned will
13994e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  // then be the end of file.
14094e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  if (ParsingPreprocessorDirective) {
14194e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek    ParsingPreprocessorDirective = false; // Done parsing the "line".
14294e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek    return true;  // Have a token.
14394e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  }
14494e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek
14594e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  assert(!LexingRawMode);
14694e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek
14794e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  // If we are in a #if directive, emit an error.
14894e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  while (!ConditionalStack.empty()) {
1492d474ba9e8ae43a1a5a9f72718c0d79092b9453fDouglas Gregor    if (!PP->isCodeCompletionFile(FileStartLoc))
1502d474ba9e8ae43a1a5a9f72718c0d79092b9453fDouglas Gregor      PP->Diag(ConditionalStack.back().IfLoc,
1512d474ba9e8ae43a1a5a9f72718c0d79092b9453fDouglas Gregor               diag::err_pp_unterminated_conditional);
15294e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek    ConditionalStack.pop_back();
15394e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  }
15494e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek
15594e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  // Finally, let the preprocessor handle this.
15694e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek  return PP->HandleEndOfFile(Result);
15794e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek}
15894e3d1f0349634235606be77c08b3a48a6d563d6Ted Kremenek
159e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek// FIXME: We can just grab the last token instead of storing a copy
160e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek// into EofToken.
16159d08cb672136322375e5400578ee1fbd0947de2Ted Kremenekvoid PTHLexer::getEOF(Token& Tok) {
162defb7094c835998bb821e894253287625ce8c74dTed Kremenek  assert(EofToken.is(tok::eof));
1630c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  Tok = EofToken;
164274b20863a728cc6a31ee75c670e3733600c1531Ted Kremenek}
16517ff58a63197b398ae52697b088dc0fb8b255519Ted Kremenek
16617ff58a63197b398ae52697b088dc0fb8b255519Ted Kremenekvoid PTHLexer::DiscardToEndOfLine() {
16717ff58a63197b398ae52697b088dc0fb8b255519Ted Kremenek  assert(ParsingPreprocessorDirective && ParsingFilename == false &&
16817ff58a63197b398ae52697b088dc0fb8b255519Ted Kremenek         "Must be in a preprocessing directive!");
1694d35da2e41941965bbee8ed7e8c30e7c21000d71Ted Kremenek
170e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  // We assume that if the preprocessor wishes to discard to the end of
171e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  // the line that it also means to end the current preprocessor directive.
172e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  ParsingPreprocessorDirective = false;
1731eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
17474c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek  // Skip tokens by only peeking at their token kind and the flags.
17574c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek  // We don't need to actually reconstruct full tokens from the token buffer.
17674c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek  // This saves some copies and it also reduces IdentifierInfo* lookup.
177da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char* p = CurPtr;
17874c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek  while (1) {
17974c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    // Read the token kind.  Are we at the end of the file?
18074c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    tok::TokenKind x = (tok::TokenKind) (uint8_t) *p;
18174c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    if (x == tok::eof) break;
1821eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
18374c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    // Read the token flags.  Are we at the start of the next line?
18474c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    Token::TokenFlags y = (Token::TokenFlags) (uint8_t) p[1];
18580d2f3059326f99ebf7c867db1c7f106ec9485f5Ted Kremenek    if (y & Token::StartOfLine) break;
18674c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek
18774c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    // Skip to the next token.
18874c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek    p += DISK_TOKEN_SIZE;
18974c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek  }
1901eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
19174c3e6e5e95af08096aab415d1ce15f15ffff02aTed Kremenek  CurPtr = p;
19217ff58a63197b398ae52697b088dc0fb8b255519Ted Kremenek}
1930c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
194268ee7016a2811803989487c0ad3799486092c63Ted Kremenek/// SkipBlock - Used by Preprocessor to skip the current conditional block.
195268ee7016a2811803989487c0ad3799486092c63Ted Kremenekbool PTHLexer::SkipBlock() {
196268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  assert(CurPPCondPtr && "No cached PP conditional information.");
197268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  assert(LastHashTokPtr && "No known '#' token.");
1981eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
199da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char* HashEntryI = 0;
2001eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  uint32_t Offset;
201268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  uint32_t TableIdx;
2021eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
203268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  do {
20441a2660377d215d004fe413c03874bd066b5384cTed Kremenek    // Read the token offset from the side-table.
2055ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner    Offset = ReadLE32(CurPPCondPtr);
2061eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
2071eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump    // Read the target table index from the side-table.
2085ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner    TableIdx = ReadLE32(CurPPCondPtr);
2091eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
21041a2660377d215d004fe413c03874bd066b5384cTed Kremenek    // Compute the actual memory address of the '#' token data for this entry.
21141a2660377d215d004fe413c03874bd066b5384cTed Kremenek    HashEntryI = TokBuf + Offset;
21241a2660377d215d004fe413c03874bd066b5384cTed Kremenek
21341a2660377d215d004fe413c03874bd066b5384cTed Kremenek    // Optmization: "Sibling jumping".  #if...#else...#endif blocks can
21441a2660377d215d004fe413c03874bd066b5384cTed Kremenek    //  contain nested blocks.  In the side-table we can jump over these
21541a2660377d215d004fe413c03874bd066b5384cTed Kremenek    //  nested blocks instead of doing a linear search if the next "sibling"
21641a2660377d215d004fe413c03874bd066b5384cTed Kremenek    //  entry is not at a location greater than LastHashTokPtr.
21741a2660377d215d004fe413c03874bd066b5384cTed Kremenek    if (HashEntryI < LastHashTokPtr && TableIdx) {
21841a2660377d215d004fe413c03874bd066b5384cTed Kremenek      // In the side-table we are still at an entry for a '#' token that
21941a2660377d215d004fe413c03874bd066b5384cTed Kremenek      // is earlier than the last one we saw.  Check if the location we would
22041a2660377d215d004fe413c03874bd066b5384cTed Kremenek      // stride gets us closer.
221da9d61c96c412f6babc7f824152609562f302388Chris Lattner      const unsigned char* NextPPCondPtr =
222da9d61c96c412f6babc7f824152609562f302388Chris Lattner        PPCond + TableIdx*(sizeof(uint32_t)*2);
22341a2660377d215d004fe413c03874bd066b5384cTed Kremenek      assert(NextPPCondPtr >= CurPPCondPtr);
22441a2660377d215d004fe413c03874bd066b5384cTed Kremenek      // Read where we should jump to.
2255ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner      uint32_t TmpOffset = ReadLE32(NextPPCondPtr);
226da9d61c96c412f6babc7f824152609562f302388Chris Lattner      const unsigned char* HashEntryJ = TokBuf + TmpOffset;
2271eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
22841a2660377d215d004fe413c03874bd066b5384cTed Kremenek      if (HashEntryJ <= LastHashTokPtr) {
22941a2660377d215d004fe413c03874bd066b5384cTed Kremenek        // Jump directly to the next entry in the side table.
23041a2660377d215d004fe413c03874bd066b5384cTed Kremenek        HashEntryI = HashEntryJ;
23141a2660377d215d004fe413c03874bd066b5384cTed Kremenek        Offset = TmpOffset;
2325ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner        TableIdx = ReadLE32(NextPPCondPtr);
23341a2660377d215d004fe413c03874bd066b5384cTed Kremenek        CurPPCondPtr = NextPPCondPtr;
23441a2660377d215d004fe413c03874bd066b5384cTed Kremenek      }
23541a2660377d215d004fe413c03874bd066b5384cTed Kremenek    }
236268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  }
2371eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  while (HashEntryI < LastHashTokPtr);
23841a2660377d215d004fe413c03874bd066b5384cTed Kremenek  assert(HashEntryI == LastHashTokPtr && "No PP-cond entry found for '#'");
239268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  assert(TableIdx && "No jumping from #endifs.");
2401eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
241268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // Update our side-table iterator.
242da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char* NextPPCondPtr = PPCond + TableIdx*(sizeof(uint32_t)*2);
243268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  assert(NextPPCondPtr >= CurPPCondPtr);
244268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  CurPPCondPtr = NextPPCondPtr;
2451eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
246268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // Read where we should jump to.
2475ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  HashEntryI = TokBuf + ReadLE32(NextPPCondPtr);
2485ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  uint32_t NextIdx = ReadLE32(NextPPCondPtr);
2491eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
250268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // By construction NextIdx will be zero if this is a #endif.  This is useful
251268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // to know to obviate lexing another token.
252268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  bool isEndif = NextIdx == 0;
2531eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
254268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // This case can occur when we see something like this:
255268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  //
256268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  //  #if ...
257268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  //   /* a comment or nothing */
258268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  //  #elif
259268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  //
260268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // If we are skipping the first #if block it will be the case that CurPtr
261268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // already points 'elif'.  Just return.
2621eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
26341a2660377d215d004fe413c03874bd066b5384cTed Kremenek  if (CurPtr > HashEntryI) {
26441a2660377d215d004fe413c03874bd066b5384cTed Kremenek    assert(CurPtr == HashEntryI + DISK_TOKEN_SIZE);
265268ee7016a2811803989487c0ad3799486092c63Ted Kremenek    // Did we reach a #endif?  If so, go ahead and consume that token as well.
266268ee7016a2811803989487c0ad3799486092c63Ted Kremenek    if (isEndif)
267e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek      CurPtr += DISK_TOKEN_SIZE*2;
268268ee7016a2811803989487c0ad3799486092c63Ted Kremenek    else
26941a2660377d215d004fe413c03874bd066b5384cTed Kremenek      LastHashTokPtr = HashEntryI;
2701eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
271268ee7016a2811803989487c0ad3799486092c63Ted Kremenek    return isEndif;
272268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  }
273268ee7016a2811803989487c0ad3799486092c63Ted Kremenek
274268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // Otherwise, we need to advance.  Update CurPtr to point to the '#' token.
27541a2660377d215d004fe413c03874bd066b5384cTed Kremenek  CurPtr = HashEntryI;
2761eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
277268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // Update the location of the last observed '#'.  This is useful if we
278268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // are skipping multiple blocks.
279268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  LastHashTokPtr = CurPtr;
280268ee7016a2811803989487c0ad3799486092c63Ted Kremenek
281e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  // Skip the '#' token.
282da9d61c96c412f6babc7f824152609562f302388Chris Lattner  assert(((tok::TokenKind)*CurPtr) == tok::hash);
283e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  CurPtr += DISK_TOKEN_SIZE;
2841eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
285268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // Did we reach a #endif?  If so, go ahead and consume that token as well.
286e5680f3cd678014cf0872d34726dc804b0cbbdd4Ted Kremenek  if (isEndif) { CurPtr += DISK_TOKEN_SIZE*2; }
287268ee7016a2811803989487c0ad3799486092c63Ted Kremenek
288268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  return isEndif;
289268ee7016a2811803989487c0ad3799486092c63Ted Kremenek}
290268ee7016a2811803989487c0ad3799486092c63Ted Kremenek
29130a12ec2a7f331d9e08acabe7cda853aaa7ba54bTed KremenekSourceLocation PTHLexer::getSourceLocation() {
2921b5285e1ba31975864da356b2ed927e87670e654Chris Lattner  // getSourceLocation is not on the hot path.  It is used to get the location
2931b5285e1ba31975864da356b2ed927e87670e654Chris Lattner  // of the next token when transitioning back to this lexer when done
29430a12ec2a7f331d9e08acabe7cda853aaa7ba54bTed Kremenek  // handling a #included file.  Just read the necessary data from the token
29530a12ec2a7f331d9e08acabe7cda853aaa7ba54bTed Kremenek  // data buffer to construct the SourceLocation object.
29630a12ec2a7f331d9e08acabe7cda853aaa7ba54bTed Kremenek  // NOTE: This is a virtual function; hence it is defined out-of-line.
297b248d53f2599d8e7b53b144b713e163ca521ffcaTed Kremenek  const unsigned char *OffsetPtr = CurPtr + (DISK_TOKEN_SIZE - 4);
2985ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  uint32_t Offset = ReadLE32(OffsetPtr);
2991b5285e1ba31975864da356b2ed927e87670e654Chris Lattner  return FileStartLoc.getFileLocWithOffset(Offset);
30030a12ec2a7f331d9e08acabe7cda853aaa7ba54bTed Kremenek}
30130a12ec2a7f331d9e08acabe7cda853aaa7ba54bTed Kremenek
3025f074266cc59563036c40516c814d63825723e20Ted Kremenek//===----------------------------------------------------------------------===//
303d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek// PTH file lookup: map from strings to file data.
304d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek//===----------------------------------------------------------------------===//
3050c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
3060c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek/// PTHFileLookup - This internal data structure is used by the PTHManager
3070c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek///  to map from FileEntry objects managed by FileManager to offsets within
3080c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek///  the PTH file.
3090c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremeneknamespace {
/// PTHFileData - Immutable pair of 32-bit offsets looked up for one file:
/// a token offset and a preprocessor-conditional offset.
class PTHFileData {
public:
  PTHFileData(uint32_t tokenOff, uint32_t ppCondOff)
    : TokenOff(tokenOff),
      PPCondOff(ppCondOff) {}

  /// getTokenOffset - The token offset supplied at construction.
  uint32_t getTokenOffset() const { return TokenOff; }

  /// getPPCondOffset - The PP-conditional offset supplied at construction.
  uint32_t getPPCondOffset() const { return PPCondOff; }

private:
  const uint32_t TokenOff;
  const uint32_t PPCondOff;
};
3201eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3211eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
32285b4521e34dcd4a0a4a1f0819e1123128e5a3125Benjamin Kramerclass PTHFileLookupCommonTrait {
3230c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenekpublic:
324a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  typedef std::pair<unsigned char, const char*> internal_key_type;
325a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek
326a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static unsigned ComputeHash(internal_key_type x) {
3272596e429a61602312bdd149786045b8a90cd2d10Daniel Dunbar    return llvm::HashString(x.second);
328d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  }
3291eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
330d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  static std::pair<unsigned, unsigned>
331d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  ReadKeyDataLength(const unsigned char*& d) {
332a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    unsigned keyLen = (unsigned) ReadUnalignedLE16(d);
333a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    unsigned dataLen = (unsigned) *(d++);
334a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return std::make_pair(keyLen, dataLen);
3350c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  }
3361eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
337a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static internal_key_type ReadKey(const unsigned char* d, unsigned) {
338a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    unsigned char k = *(d++); // Read the entry kind.
339a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return std::make_pair(k, (const char*) d);
340d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  }
341337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek};
3421eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
34385b4521e34dcd4a0a4a1f0819e1123128e5a3125Benjamin Kramerclass PTHFileLookupTrait : public PTHFileLookupCommonTrait {
344337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenekpublic:
345337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  typedef const FileEntry* external_key_type;
346337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  typedef PTHFileData      data_type;
3471eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
348a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static internal_key_type GetInternalKey(const FileEntry* FE) {
349a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return std::make_pair((unsigned char) 0x1, FE->getName());
350337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  }
351a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek
352a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static bool EqualKey(internal_key_type a, internal_key_type b) {
353a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return a.first == b.first && strcmp(a.second, b.second) == 0;
3541eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  }
3551eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3561eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  static PTHFileData ReadData(const internal_key_type& k,
3571eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump                              const unsigned char* d, unsigned) {
358a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    assert(k.first == 0x1 && "Only file lookups can match!");
359d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek    uint32_t x = ::ReadUnalignedLE32(d);
360d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek    uint32_t y = ::ReadUnalignedLE32(d);
3611eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump    return PTHFileData(x, y);
3620c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  }
3630c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek};
3647e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek
36585b4521e34dcd4a0a4a1f0819e1123128e5a3125Benjamin Kramerclass PTHStringLookupTrait {
3667e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenekpublic:
3671eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  typedef uint32_t
3687e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek          data_type;
3697e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek
3707e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  typedef const std::pair<const char*, unsigned>
3717e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek          external_key_type;
3727e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek
3737e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  typedef external_key_type internal_key_type;
3741eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3757e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  static bool EqualKey(const internal_key_type& a,
3767e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek                       const internal_key_type& b) {
3777e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek    return (a.second == b.second) ? memcmp(a.first, b.first, a.second) == 0
3787e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek                                  : false;
3797e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  }
3801eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3817e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  static unsigned ComputeHash(const internal_key_type& a) {
3822596e429a61602312bdd149786045b8a90cd2d10Daniel Dunbar    return llvm::HashString(llvm::StringRef(a.first, a.second));
3837e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  }
3841eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3857e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  // This hopefully will just get inlined and removed by the optimizer.
3867e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  static const internal_key_type&
3877e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  GetInternalKey(const external_key_type& x) { return x; }
3881eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3897e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  static std::pair<unsigned, unsigned>
3907e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  ReadKeyDataLength(const unsigned char*& d) {
3917e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek    return std::make_pair((unsigned) ReadUnalignedLE16(d), sizeof(uint32_t));
3927e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  }
3931eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
3947e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  static std::pair<const char*, unsigned>
3957e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  ReadKey(const unsigned char* d, unsigned n) {
3967e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek      assert(n >= 2 && d[n-1] == '\0');
3977e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek      return std::make_pair((const char*) d, n-1);
3987e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek    }
3991eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
400a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static uint32_t ReadData(const internal_key_type& k, const unsigned char* d,
401a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek                           unsigned) {
4027e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek    return ::ReadUnalignedLE32(d);
4037e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  }
4047e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek};
4051eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4061eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump} // end anonymous namespace
407d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek
4087e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenektypedef OnDiskChainedHashTable<PTHFileLookupTrait>   PTHFileLookup;
4097e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenektypedef OnDiskChainedHashTable<PTHStringLookupTrait> PTHStringIdLookup;
4100c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
4110c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek//===----------------------------------------------------------------------===//
4120c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek// PTHManager methods.
4130c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek//===----------------------------------------------------------------------===//
4140c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
4150c6a77bc1f52f282a969538f139ebde429076ed3Ted KremenekPTHManager::PTHManager(const llvm::MemoryBuffer* buf, void* fileLookup,
416da9d61c96c412f6babc7f824152609562f302388Chris Lattner                       const unsigned char* idDataTable,
4171eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump                       IdentifierInfo** perIDCache,
4187e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek                       void* stringIdLookup, unsigned numIds,
41968228634016f644a1164fa1f024a9ce2093656bfTed Kremenek                       const unsigned char* spellingBase,
42068228634016f644a1164fa1f024a9ce2093656bfTed Kremenek                       const char* originalSourceFile)
4216183e4815a4019e97ad01bd880f12355599b75fdTed Kremenek: Buf(buf), PerIDCache(perIDCache), FileLookup(fileLookup),
4227e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  IdDataTable(idDataTable), StringIdLookup(stringIdLookup),
42368228634016f644a1164fa1f024a9ce2093656bfTed Kremenek  NumIds(numIds), PP(0), SpellingBase(spellingBase),
42468228634016f644a1164fa1f024a9ce2093656bfTed Kremenek  OriginalSourceFile(originalSourceFile) {}
4250c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
4260c6a77bc1f52f282a969538f139ebde429076ed3Ted KremenekPTHManager::~PTHManager() {
4270c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  delete Buf;
4280c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  delete (PTHFileLookup*) FileLookup;
4297e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  delete (PTHStringIdLookup*) StringIdLookup;
4300e50b6e7c104d00614baa3d80df62f1630a94d9cTed Kremenek  free(PerIDCache);
4310c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek}
4320c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
4333574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbarstatic void InvalidPTH(Diagnostic &Diags, const char *Msg) {
4343574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar  Diags.Report(Diags.getCustomDiagID(Diagnostic::Error, Msg));
43526555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek}
43626555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek
4377ad629ebefa87269cc1887debc83cfa58c285a80Chris LattnerPTHManager *PTHManager::Create(const std::string &file, FileManager &FileMgr,
438389db16c63eec6ecfa9b235155252d8da766e94eArgyrios Kyrtzidis                               const FileSystemOptions &FSOpts,
439389db16c63eec6ecfa9b235155252d8da766e94eArgyrios Kyrtzidis                               Diagnostic &Diags) {
4400c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Memory map the PTH file.
4410c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  llvm::OwningPtr<llvm::MemoryBuffer>
442389db16c63eec6ecfa9b235155252d8da766e94eArgyrios Kyrtzidis  File(FileMgr.getBufferForFile(file, FSOpts));
4431eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4448a6aec620dbec1f292fe4116c0373ac81ab90234Ted Kremenek  if (!File) {
4453574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
4460c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek    return 0;
4478a6aec620dbec1f292fe4116c0373ac81ab90234Ted Kremenek  }
4481eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4490c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Get the buffer ranges and check if there are at least three 32-bit
4500c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // words at the end of the file.
4517ad629ebefa87269cc1887debc83cfa58c285a80Chris Lattner  const unsigned char *BufBeg = (unsigned char*)File->getBufferStart();
4527ad629ebefa87269cc1887debc83cfa58c285a80Chris Lattner  const unsigned char *BufEnd = (unsigned char*)File->getBufferEnd();
453e1b6498c41b94c3bc5cede17b0702282543385efTed Kremenek
454e1b6498c41b94c3bc5cede17b0702282543385efTed Kremenek  // Check the prologue of the file.
4557ad629ebefa87269cc1887debc83cfa58c285a80Chris Lattner  if ((BufEnd - BufBeg) < (signed)(sizeof("cfe-pth") + 3 + 4) ||
45626555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek      memcmp(BufBeg, "cfe-pth", sizeof("cfe-pth") - 1) != 0) {
4573574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
458e1b6498c41b94c3bc5cede17b0702282543385efTed Kremenek    return 0;
45926555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek  }
4601eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
46167d15050bbea16ae256e204ecd464f2e454c3c99Ted Kremenek  // Read the PTH version.
462e1b6498c41b94c3bc5cede17b0702282543385efTed Kremenek  const unsigned char *p = BufBeg + (sizeof("cfe-pth") - 1);
46367d15050bbea16ae256e204ecd464f2e454c3c99Ted Kremenek  unsigned Version = ReadLE32(p);
4641eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4653574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar  if (Version < PTHManager::Version) {
4663574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    InvalidPTH(Diags,
4671eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump        Version < PTHManager::Version
46826555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek        ? "PTH file uses an older PTH format that is no longer supported"
46926555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek        : "PTH file uses a newer PTH format that cannot be read");
47067d15050bbea16ae256e204ecd464f2e454c3c99Ted Kremenek    return 0;
47126555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek  }
47267d15050bbea16ae256e204ecd464f2e454c3c99Ted Kremenek
4731eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  // Compute the address of the index table at the end of the PTH file.
474a4bd8eb4d6d4b625f6bbb62fc180b02eab6433edTed Kremenek  const unsigned char *PrologueOffset = p;
4751eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
476a4bd8eb4d6d4b625f6bbb62fc180b02eab6433edTed Kremenek  if (PrologueOffset >= BufEnd) {
4773574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
478e1b6498c41b94c3bc5cede17b0702282543385efTed Kremenek    return 0;
47926555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek  }
4801eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4810c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Construct the file lookup table.  This will be used for mapping from
4820c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // FileEntry*'s to cached tokens.
483a4bd8eb4d6d4b625f6bbb62fc180b02eab6433edTed Kremenek  const unsigned char* FileTableOffset = PrologueOffset + sizeof(uint32_t)*2;
4845ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  const unsigned char* FileTable = BufBeg + ReadLE32(FileTableOffset);
4851eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4860c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  if (!(FileTable > BufBeg && FileTable < BufEnd)) {
4873574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
4880c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek    return 0; // FIXME: Proper error diagnostic?
4890c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  }
4901eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
491d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  llvm::OwningPtr<PTHFileLookup> FL(PTHFileLookup::Create(FileTable, BufBeg));
4921eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4931d20197cb9478f3db17cbcfc57a1f8182843fc6aTed Kremenek  // Warn if the PTH file is empty.  We still want to create a PTHManager
4941d20197cb9478f3db17cbcfc57a1f8182843fc6aTed Kremenek  // as the PTH could be used with -include-pth.
4951d20197cb9478f3db17cbcfc57a1f8182843fc6aTed Kremenek  if (FL->isEmpty())
4963574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    InvalidPTH(Diags, "PTH file contains no cached source data");
4971eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
4980c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Get the location of the table mapping from persistent ids to the
4990c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // data needed to reconstruct identifiers.
500a4bd8eb4d6d4b625f6bbb62fc180b02eab6433edTed Kremenek  const unsigned char* IDTableOffset = PrologueOffset + sizeof(uint32_t)*0;
5015ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  const unsigned char* IData = BufBeg + ReadLE32(IDTableOffset);
5021eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
503cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek  if (!(IData >= BufBeg && IData < BufEnd)) {
5043574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
50526555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek    return 0;
5060c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  }
5071eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
5087e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  // Get the location of the hashtable mapping between strings and
5097e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  // persistent IDs.
510a4bd8eb4d6d4b625f6bbb62fc180b02eab6433edTed Kremenek  const unsigned char* StringIdTableOffset = PrologueOffset + sizeof(uint32_t)*1;
5117e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  const unsigned char* StringIdTable = BufBeg + ReadLE32(StringIdTableOffset);
5127e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  if (!(StringIdTable >= BufBeg && StringIdTable < BufEnd)) {
5133574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
51426555b18aa2c3b78744e77927acd3faa53ae7369Ted Kremenek    return 0;
51572b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  }
5167e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek
5177e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  llvm::OwningPtr<PTHStringIdLookup> SL(PTHStringIdLookup::Create(StringIdTable,
5187e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek                                                                  BufBeg));
5191eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
520277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  // Get the location of the spelling cache.
521a4bd8eb4d6d4b625f6bbb62fc180b02eab6433edTed Kremenek  const unsigned char* spellingBaseOffset = PrologueOffset + sizeof(uint32_t)*3;
522277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  const unsigned char* spellingBase = BufBeg + ReadLE32(spellingBaseOffset);
523277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  if (!(spellingBase >= BufBeg && spellingBase < BufEnd)) {
5243574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar    Diags.Report(diag::err_invalid_pth_file) << file;
525277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek    return 0;
526277faca30c9f8f72b79f55695cbe3395ec246e7cTed Kremenek  }
5271eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
5286183e4815a4019e97ad01bd880f12355599b75fdTed Kremenek  // Get the number of IdentifierInfos and pre-allocate the identifier cache.
5295ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  uint32_t NumIds = ReadLE32(IData);
5301eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
5316183e4815a4019e97ad01bd880f12355599b75fdTed Kremenek  // Pre-allocate the peristent ID -> IdentifierInfo* cache.  We use calloc()
5326183e4815a4019e97ad01bd880f12355599b75fdTed Kremenek  // so that we in the best case only zero out memory once when the OS returns
5336183e4815a4019e97ad01bd880f12355599b75fdTed Kremenek  // us new pages.
534cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek  IdentifierInfo** PerIDCache = 0;
5351eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
536cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek  if (NumIds) {
5371eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump    PerIDCache = (IdentifierInfo**)calloc(NumIds, sizeof(*PerIDCache));
538cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek    if (!PerIDCache) {
5393574f46cf495ec61618fd6864b045c5b1d0d5068Daniel Dunbar      InvalidPTH(Diags, "Could not allocate memory for processing PTH file");
540cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek      return 0;
541cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek    }
5426183e4815a4019e97ad01bd880f12355599b75fdTed Kremenek  }
543cdd8f2153e18796e9e2a126ebcbd4f3e1bd7135bTed Kremenek
54468228634016f644a1164fa1f024a9ce2093656bfTed Kremenek  // Compute the address of the original source file.
54568228634016f644a1164fa1f024a9ce2093656bfTed Kremenek  const unsigned char* originalSourceBase = PrologueOffset + sizeof(uint32_t)*4;
54668228634016f644a1164fa1f024a9ce2093656bfTed Kremenek  unsigned len = ReadUnalignedLE16(originalSourceBase);
5471eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  if (!len) originalSourceBase = 0;
5481eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
54972b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  // Create the new PTHManager.
55072b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  return new PTHManager(File.take(), FL.take(), IData, PerIDCache,
55168228634016f644a1164fa1f024a9ce2093656bfTed Kremenek                        SL.take(), NumIds, spellingBase,
55268228634016f644a1164fa1f024a9ce2093656bfTed Kremenek                        (const char*) originalSourceBase);
5530c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek}
55468228634016f644a1164fa1f024a9ce2093656bfTed Kremenek
55577ecb3a28f21496ecfdbb3d5f5b66b0d2abf48c9Chris LattnerIdentifierInfo* PTHManager::LazilyCreateIdentifierInfo(unsigned PersistentID) {
5560c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Look in the PTH file for the string data for the IdentifierInfo object.
55777ecb3a28f21496ecfdbb3d5f5b66b0d2abf48c9Chris Lattner  const unsigned char* TableEntry = IdDataTable + sizeof(uint32_t)*PersistentID;
558da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char* IDData =
5595ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner    (const unsigned char*)Buf->getBufferStart() + ReadLE32(TableEntry);
560da9d61c96c412f6babc7f824152609562f302388Chris Lattner  assert(IDData < (const unsigned char*)Buf->getBufferEnd());
5611eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
56272b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  // Allocate the object.
563da9d61c96c412f6babc7f824152609562f302388Chris Lattner  std::pair<IdentifierInfo,const unsigned char*> *Mem =
564da9d61c96c412f6babc7f824152609562f302388Chris Lattner    Alloc.Allocate<std::pair<IdentifierInfo,const unsigned char*> >();
56572b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek
56672b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  Mem->second = IDData;
5677e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  assert(IDData[0] != '\0');
568ea9c26b3dbd74a1497f5609ae6e19a85f42b6073Ted Kremenek  IdentifierInfo *II = new ((void*) Mem) IdentifierInfo();
5691eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
57072b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  // Store the new IdentifierInfo in the cache.
57177ecb3a28f21496ecfdbb3d5f5b66b0d2abf48c9Chris Lattner  PerIDCache[PersistentID] = II;
572e013d685c6689ac7ae103ee88acf573422d1ed6aDaniel Dunbar  assert(II->getNameStart() && II->getNameStart()[0] != '\0');
5730c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  return II;
5740c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek}
5750c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek
576700030ebddb987936d4fee14d9412821d96e4840Kovarththanan RajaratnamIdentifierInfo* PTHManager::get(llvm::StringRef Name) {
5777e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  PTHStringIdLookup& SL = *((PTHStringIdLookup*)StringIdLookup);
5787e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  // Double check our assumption that the last character isn't '\0'.
579700030ebddb987936d4fee14d9412821d96e4840Kovarththanan Rajaratnam  assert(Name.empty() || Name.data()[Name.size()-1] != '\0');
580700030ebddb987936d4fee14d9412821d96e4840Kovarththanan Rajaratnam  PTHStringIdLookup::iterator I = SL.find(std::make_pair(Name.data(),
581700030ebddb987936d4fee14d9412821d96e4840Kovarththanan Rajaratnam                                                         Name.size()));
5827e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  if (I == SL.end()) // No identifier found?
5837e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek    return 0;
58472b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek
5857e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  // Match found.  Return the identifier!
5867e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  assert(*I > 0);
5877e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek  return GetIdentifierInfo(*I-1);
5887e3a004c6ed1fe87912203b9c5a113f8da89d261Ted Kremenek}
58972b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek
590f056d92e182cbe4f62c8d14102544dc38066dabcChris LattnerPTHLexer *PTHManager::CreateLexer(FileID FID) {
591f056d92e182cbe4f62c8d14102544dc38066dabcChris Lattner  const FileEntry *FE = PP->getSourceManager().getFileEntryForID(FID);
5920c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  if (!FE)
5930c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek    return 0;
5941eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
5950c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Lookup the FileEntry object in our file lookup data structure.  It will
5960c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // return a variant that indicates whether or not there is an offset within
5970c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // the PTH file that contains cached tokens.
598d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  PTHFileLookup& PFL = *((PTHFileLookup*)FileLookup);
599d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  PTHFileLookup::iterator I = PFL.find(FE);
6001eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
601d8c02929fe70f03111be73e7b8c402c724238ee9Ted Kremenek  if (I == PFL.end()) // No tokens available?
6020c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek    return 0;
6031eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
6041eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  const PTHFileData& FileData = *I;
6051eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
606da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char *BufStart = (const unsigned char *)Buf->getBufferStart();
6070c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek  // Compute the offset of the token data within the buffer.
608da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char* data = BufStart + FileData.getTokenOffset();
609268ee7016a2811803989487c0ad3799486092c63Ted Kremenek
610268ee7016a2811803989487c0ad3799486092c63Ted Kremenek  // Get the location of pp-conditional table.
611da9d61c96c412f6babc7f824152609562f302388Chris Lattner  const unsigned char* ppcond = BufStart + FileData.getPPCondOffset();
6125ff4317536dbd7f03332bb250c8b35ec04a6f5dbChris Lattner  uint32_t Len = ReadLE32(ppcond);
6131b5285e1ba31975864da356b2ed927e87670e654Chris Lattner  if (Len == 0) ppcond = 0;
6141eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
61572b1b15ee88aac0a63e2c1dc53fe22f5ab297b20Ted Kremenek  assert(PP && "No preprocessor set yet!");
6161eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  return new PTHLexer(*PP, FID, data, ppcond, *this);
6170c6a77bc1f52f282a969538f139ebde429076ed3Ted Kremenek}
618337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
619337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek//===----------------------------------------------------------------------===//
620337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek// 'stat' caching.
621337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek//===----------------------------------------------------------------------===//
622337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
623337edcdbec05316b407d0d64865c88ff8597d910Ted Kremeneknamespace {
/// Immutable record of cached 'stat' information.  A default-constructed
/// record has hasStat == false and all other fields zero; a record built
/// from explicit values has hasStat == true.
class PTHStatData {
public:
  const bool hasStat;   // true only when the fields below were supplied
  const ino_t ino;
  const dev_t dev;
  const mode_t mode;
  const time_t mtime;
  const off_t size;

  /// Record with no stat information.
  PTHStatData()
    : hasStat(false),
      ino(0),
      dev(0),
      mode(0),
      mtime(0),
      size(0) {}

  /// Record carrying the given stat fields.
  PTHStatData(ino_t inode, dev_t device, mode_t fileMode, time_t modTime,
              off_t fileSize)
    : hasStat(true),
      ino(inode),
      dev(device),
      mode(fileMode),
      mtime(modTime),
      size(fileSize) {}
};
6391eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
64085b4521e34dcd4a0a4a1f0819e1123128e5a3125Benjamin Kramerclass PTHStatLookupTrait : public PTHFileLookupCommonTrait {
641337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenekpublic:
642a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  typedef const char* external_key_type;  // const char*
643337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  typedef PTHStatData data_type;
6441eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
645a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static internal_key_type GetInternalKey(const char *path) {
646a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    // The key 'kind' doesn't matter here because it is ignored in EqualKey.
647a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return std::make_pair((unsigned char) 0x0, path);
648a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  }
649a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek
650a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static bool EqualKey(internal_key_type a, internal_key_type b) {
651a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    // When doing 'stat' lookups we don't care about the kind of 'a' and 'b',
652a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    // just the paths.
653a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return strcmp(a.second, b.second) == 0;
6541eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump  }
6551eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
656a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek  static data_type ReadData(const internal_key_type& k, const unsigned char* d,
6571eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump                            unsigned) {
6581eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
659ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek    if (k.first /* File or Directory */) {
660ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek      if (k.first == 0x1 /* File */) d += 4 * 2; // Skip the first 2 words.
661a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek      ino_t ino = (ino_t) ReadUnalignedLE32(d);
662a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek      dev_t dev = (dev_t) ReadUnalignedLE32(d);
663a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek      mode_t mode = (mode_t) ReadUnalignedLE16(d);
6641eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump      time_t mtime = (time_t) ReadUnalignedLE64(d);
665a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek      return data_type(ino, dev, mode, mtime, (off_t) ReadUnalignedLE64(d));
666a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    }
667ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek
668ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek    // Negative stat.  Don't read anything.
669a4b44dd9d30929a35c44d85102e5241ee847b2f2Ted Kremenek    return data_type();
670337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  }
671337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek};
672337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
67385b4521e34dcd4a0a4a1f0819e1123128e5a3125Benjamin Kramerclass PTHStatCache : public StatSysCallCache {
674337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  typedef OnDiskChainedHashTable<PTHStatLookupTrait> CacheTy;
675337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  CacheTy Cache;
676337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
6771eb4433ac451dc16f4133a88af2d002ac26c58efMike Stumppublic:
678337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  PTHStatCache(PTHFileLookup &FL) :
679337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    Cache(FL.getNumBuckets(), FL.getNumEntries(), FL.getBuckets(),
680337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek          FL.getBase()) {}
681337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
682337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  ~PTHStatCache() {}
6831eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
684337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  int stat(const char *path, struct stat *buf) {
685337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    // Do the lookup for the file's data in the PTH file.
686337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    CacheTy::iterator I = Cache.find(path);
687337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
688337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    // If we don't get a hit in the PTH file just forward to 'stat'.
689700030ebddb987936d4fee14d9412821d96e4840Kovarththanan Rajaratnam    if (I == Cache.end())
69052e7108f51a4a9f4d6e84f33fb594d06e1d79560Douglas Gregor      return StatSysCallCache::stat(path, buf);
6911eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
692337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    const PTHStatData& Data = *I;
6931eb4433ac451dc16f4133a88af2d002ac26c58efMike Stump
694ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek    if (!Data.hasStat)
695ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek      return 1;
696ad6ce5cb0e3b5dd853d2b1e337797a6fc1091e21Ted Kremenek
697337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    buf->st_ino = Data.ino;
698337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    buf->st_dev = Data.dev;
699337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    buf->st_mtime = Data.mtime;
700337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    buf->st_mode = Data.mode;
701337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    buf->st_size = Data.size;
702337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek    return 0;
703337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek  }
704337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek};
705d578569d50adc6e9b1a2f91931add6b471b2378eTed Kremenek} // end anonymous namespace
706337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek
707337edcdbec05316b407d0d64865c88ff8597d910Ted KremenekStatSysCallCache *PTHManager::createStatCache() {
7085f747d187bf8dc779a4acc180f9c21f1dbf83f6aTed Kremenek  return new PTHStatCache(*((PTHFileLookup*) FileLookup));
709337edcdbec05316b407d0d64865c88ff8597d910Ted Kremenek}
710