HTMLRewrite.cpp revision d7407dc92c7d19cafce429e7e1cf9819d3fc0b92
16a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//== HTMLRewrite.cpp - Translate source code into prettified HTML --*- C++ -*-//
26a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//
36a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//                     The LLVM Compiler Infrastructure
46a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//
56a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek// This file is distributed under the University of Illinois Open Source
66a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek// License. See LICENSE.TXT for details.
76a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//
86a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//===----------------------------------------------------------------------===//
96a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//
106a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//  This file defines the HTMLRewriter class, which is used to translate the
116a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//  text of a source file into prettified HTML.
126a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//
136a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek//===----------------------------------------------------------------------===//
146a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek
15339b9c27759d7b6a53e2370f83f66e78b3254595Ted Kremenek#include "clang/Lex/Preprocessor.h"
166a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek#include "clang/Rewrite/Rewriter.h"
176a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek#include "clang/Rewrite/HTMLRewrite.h"
18867924dbeca06870573fd58d620032da6994b223Chris Lattner#include "clang/Lex/TokenConcatenation.h"
193245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner#include "clang/Lex/Preprocessor.h"
206a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek#include "clang/Basic/SourceManager.h"
2157df3b950061c73d13d3116f747e79d7955a216aChris Lattner#include "llvm/ADT/SmallString.h"
22339b9c27759d7b6a53e2370f83f66e78b3254595Ted Kremenek#include "llvm/ADT/OwningPtr.h"
236a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek#include "llvm/Support/MemoryBuffer.h"
24a95d3750441ac8ad03e36af8e6e74039c9a3109dTed Kremenek#include "llvm/Support/raw_ostream.h"
256a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenekusing namespace clang;
266a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek
279402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner
285ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner/// HighlightRange - Highlight a range in the source code with the specified
295ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner/// start/end tags.  B/E must be in the same file.  This ensures that
305ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner/// start/end tags are placed at the start/end of each line if the range is
315ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner/// multiline.
325ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattnervoid html::HighlightRange(Rewriter &R, SourceLocation B, SourceLocation E,
335ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner                          const char *StartTag, const char *EndTag) {
345ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner  SourceManager &SM = R.getSourceMgr();
35f7cf85b330bedd2877e1371fb0a83e99751ae162Chris Lattner  B = SM.getInstantiationLoc(B);
36f7cf85b330bedd2877e1371fb0a83e99751ae162Chris Lattner  E = SM.getInstantiationLoc(E);
37a11d61793341fea195c29a0dab3fbd74f2b39a8cChris Lattner  FileID FID = SM.getFileID(B);
38a11d61793341fea195c29a0dab3fbd74f2b39a8cChris Lattner  assert(SM.getFileID(E) == FID && "B/E not in the same file!");
395ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner
4052c29081281955d3db9e11d10573b2d38f709099Chris Lattner  unsigned BOffset = SM.getFileOffset(B);
4152c29081281955d3db9e11d10573b2d38f709099Chris Lattner  unsigned EOffset = SM.getFileOffset(E);
425ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner
435ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner  // Include the whole end token in the range.
442c78b873f4f3823ae859c15674cb3d76c8554113Chris Lattner  EOffset += Lexer::MeasureTokenLength(E, R.getSourceMgr(), R.getLangOpts());
455ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner
462b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  HighlightRange(R.getEditBuffer(FID), BOffset, EOffset,
472b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner                 SM.getBufferData(FID).first, StartTag, EndTag);
485ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner}
495ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner
505ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner/// HighlightRange - This is the same as the above method, but takes
515ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner/// decomposed file locations.
525ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattnervoid html::HighlightRange(RewriteBuffer &RB, unsigned B, unsigned E,
535ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner                          const char *BufferStart,
545ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner                          const char *StartTag, const char *EndTag) {
559402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  // Insert the tag at the absolute start/end of the range.
56d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar  RB.InsertTextAfter(B, StartTag);
57d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar  RB.InsertTextBefore(E, EndTag);
585ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner
599402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  // Scan the range to see if there is a \r or \n.  If so, and if the line is
609402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  // not blank, insert tags on that line as well.
619402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  bool HadOpenTag = true;
629402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner
639402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  unsigned LastNonWhiteSpace = B;
649402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  for (unsigned i = B; i != E; ++i) {
659402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    switch (BufferStart[i]) {
669402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case '\r':
679402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case '\n':
689402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // Okay, we found a newline in the range.  If we have an open tag, we need
699402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // to insert a close tag at the first non-whitespace before the newline.
709402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      if (HadOpenTag)
71d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar        RB.InsertTextBefore(LastNonWhiteSpace+1, EndTag);
729402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner
739402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // Instead of inserting an open tag immediately after the newline, we
749402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // wait until we see a non-whitespace character.  This prevents us from
759402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // inserting tags around blank lines, and also allows the open tag to
769402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // be put *after* whitespace on a non-blank line.
779402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      HadOpenTag = false;
789402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      break;
799402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case '\0':
809402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case ' ':
819402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case '\t':
829402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case '\f':
839402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    case '\v':
849402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // Ignore whitespace.
859402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      break;
869402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner
879402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    default:
889402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // If there is no tag open, do it now.
899402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      if (!HadOpenTag) {
90d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar        RB.InsertTextAfter(i, StartTag);
919402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner        HadOpenTag = true;
929402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      }
939402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner
949402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      // Remember this character.
959402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      LastNonWhiteSpace = i;
969402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner      break;
979402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner    }
989402b57a0dca4058fe56d7fd84e97fc496421125Chris Lattner  }
995ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner}
1005ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner
1012b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattnervoid html::EscapeText(Rewriter &R, FileID FID,
102fa5be3617294f0e3c341f0ecb6b2076478b1b5acTed Kremenek                      bool EscapeSpaces, bool ReplaceTabs) {
1036a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek
1042b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID);
1056a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek  const char* C = Buf->getBufferStart();
1066a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek  const char* FileEnd = Buf->getBufferEnd();
1076a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek
1086a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek  assert (C <= FileEnd);
1096a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek
1102b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  RewriteBuffer &RB = R.getEditBuffer(FID);
1115c176f7a9ba9f7084b903393845be24f85e091daChris Lattner
1125c176f7a9ba9f7084b903393845be24f85e091daChris Lattner  unsigned ColNo = 0;
1136a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek  for (unsigned FilePos = 0; C != FileEnd ; ++C, ++FilePos) {
1146a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek    switch (*C) {
1155c176f7a9ba9f7084b903393845be24f85e091daChris Lattner    default: ++ColNo; break;
1165c176f7a9ba9f7084b903393845be24f85e091daChris Lattner    case '\n':
1175c176f7a9ba9f7084b903393845be24f85e091daChris Lattner    case '\r':
1185c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      ColNo = 0;
1195c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      break;
120735271479ac57c27f744806859efd5b001dea248Chris Lattner
121735271479ac57c27f744806859efd5b001dea248Chris Lattner    case ' ':
122735271479ac57c27f744806859efd5b001dea248Chris Lattner      if (EscapeSpaces)
123d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar        RB.ReplaceText(FilePos, 1, "&nbsp;");
1245c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      ++ColNo;
125735271479ac57c27f744806859efd5b001dea248Chris Lattner      break;
126f3d8d19caf6f1a21785eee8d62c45ef5a0a0e72eChris Lattner    case '\f':
127d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar      RB.ReplaceText(FilePos, 1, "<hr>");
128f3d8d19caf6f1a21785eee8d62c45ef5a0a0e72eChris Lattner      ColNo = 0;
129f3d8d19caf6f1a21785eee8d62c45ef5a0a0e72eChris Lattner      break;
130f3d8d19caf6f1a21785eee8d62c45ef5a0a0e72eChris Lattner
1315c176f7a9ba9f7084b903393845be24f85e091daChris Lattner    case '\t': {
132735271479ac57c27f744806859efd5b001dea248Chris Lattner      if (!ReplaceTabs)
13349cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek        break;
1345c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      unsigned NumSpaces = 8-(ColNo&7);
135735271479ac57c27f744806859efd5b001dea248Chris Lattner      if (EscapeSpaces)
136d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar        RB.ReplaceText(FilePos, 1,
137d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar                       llvm::StringRef("&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;"
138d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar                                       "&nbsp;&nbsp;&nbsp;", 6*NumSpaces));
139735271479ac57c27f744806859efd5b001dea248Chris Lattner      else
140d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar        RB.ReplaceText(FilePos, 1, llvm::StringRef("        ", NumSpaces));
1415c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      ColNo += NumSpaces;
142735271479ac57c27f744806859efd5b001dea248Chris Lattner      break;
1435c176f7a9ba9f7084b903393845be24f85e091daChris Lattner    }
144735271479ac57c27f744806859efd5b001dea248Chris Lattner    case '<':
145d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar      RB.ReplaceText(FilePos, 1, "&lt;");
1465c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      ++ColNo;
147735271479ac57c27f744806859efd5b001dea248Chris Lattner      break;
148735271479ac57c27f744806859efd5b001dea248Chris Lattner
149735271479ac57c27f744806859efd5b001dea248Chris Lattner    case '>':
150d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar      RB.ReplaceText(FilePos, 1, "&gt;");
1515c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      ++ColNo;
152735271479ac57c27f744806859efd5b001dea248Chris Lattner      break;
153735271479ac57c27f744806859efd5b001dea248Chris Lattner
154735271479ac57c27f744806859efd5b001dea248Chris Lattner    case '&':
155d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar      RB.ReplaceText(FilePos, 1, "&amp;");
1565c176f7a9ba9f7084b903393845be24f85e091daChris Lattner      ++ColNo;
157735271479ac57c27f744806859efd5b001dea248Chris Lattner      break;
1586a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek    }
1596a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek  }
1606a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek}
1616a34083e9f74a45e2f79c9fab66f177809a5db66Ted Kremenek
162fa5be3617294f0e3c341f0ecb6b2076478b1b5acTed Kremenekstd::string html::EscapeText(const std::string& s, bool EscapeSpaces,
163fa5be3617294f0e3c341f0ecb6b2076478b1b5acTed Kremenek                             bool ReplaceTabs) {
164053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek
165053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek  unsigned len = s.size();
166a95d3750441ac8ad03e36af8e6e74039c9a3109dTed Kremenek  std::string Str;
167a95d3750441ac8ad03e36af8e6e74039c9a3109dTed Kremenek  llvm::raw_string_ostream os(Str);
168053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek
169053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek  for (unsigned i = 0 ; i < len; ++i) {
170053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek
171053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek    char c = s[i];
172053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek    switch (c) {
1738570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner    default:
1748570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner      os << c; break;
1758570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner
1768570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner    case ' ':
1778570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner      if (EscapeSpaces) os << "&nbsp;";
1788570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner      else os << ' ';
1798570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner      break;
1808570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner
181c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu    case '\t':
182c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu      if (ReplaceTabs) {
183c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu        if (EscapeSpaces)
184c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu          for (unsigned i = 0; i < 4; ++i)
185c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu            os << "&nbsp;";
186c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu        else
187c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu          for (unsigned i = 0; i < 4; ++i)
188c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu            os << " ";
189c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu      }
190c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu      else
191c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu        os << c;
1928570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner
193c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu      break;
1948570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner
195c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu    case '<': os << "&lt;"; break;
196c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu    case '>': os << "&gt;"; break;
197c01b46e2f115bed83f2f6f4a55809bf4003ee015Zhongxing Xu    case '&': os << "&amp;"; break;
198053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek    }
199053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek  }
200053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek
201053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek  return os.str();
202053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek}
203053ef593fa9d2b890645a914eee203231fb34458Ted Kremenek
2048570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattnerstatic void AddLineNumber(RewriteBuffer &RB, unsigned LineNo,
2058570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner                          unsigned B, unsigned E) {
2067e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar  llvm::SmallString<256> Str;
2077e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar  llvm::raw_svector_ostream OS(Str);
2087e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar
2097e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar  OS << "<tr><td class=\"num\" id=\"LN"
2107e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar     << LineNo << "\">"
2117e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar     << LineNo << "</td><td class=\"line\">";
21257df3b950061c73d13d3116f747e79d7955a216aChris Lattner
21349cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek  if (B == E) { // Handle empty lines.
2147e37c818f9f77608c602ffb32c1135e3cd0132a8Daniel Dunbar    OS << " </td></tr>";
215d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar    RB.InsertTextBefore(B, OS.str());
21657df3b950061c73d13d3116f747e79d7955a216aChris Lattner  } else {
217d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar    RB.InsertTextBefore(B, OS.str());
218d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar    RB.InsertTextBefore(E, "</td></tr>");
21949cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek  }
220b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek}
221b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
2222b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattnervoid html::AddLineNumbers(Rewriter& R, FileID FID) {
223b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
2242b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID);
225b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  const char* FileBeg = Buf->getBufferStart();
226b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  const char* FileEnd = Buf->getBufferEnd();
227b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  const char* C = FileBeg;
2282b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  RewriteBuffer &RB = R.getEditBuffer(FID);
229b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
230b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  assert (C <= FileEnd);
231b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
232b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  unsigned LineNo = 0;
233b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  unsigned FilePos = 0;
234b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
235b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek  while (C != FileEnd) {
236b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
237b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek    ++LineNo;
238b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek    unsigned LineStartPos = FilePos;
239b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek    unsigned LineEndPos = FileEnd - FileBeg;
240b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
241b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek    assert (FilePos <= LineEndPos);
242b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek    assert (C < FileEnd);
243b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
244b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek    // Scan until the newline (or end-of-file).
245b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
24649cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek    while (C != FileEnd) {
24749cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek      char c = *C;
24849cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek      ++C;
24949cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek
25049cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek      if (c == '\n') {
25149cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek        LineEndPos = FilePos++;
252b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek        break;
253b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek      }
25449cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek
25549cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek      ++FilePos;
25649cd6354d5373245dd2e69ca7b7113e6a795d36eTed Kremenek    }
257b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek
2588570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner    AddLineNumber(RB, LineNo, LineStartPos, LineEndPos);
259d6c1360c2bf234c73572a865f119d0518aca8154Ted Kremenek  }
260d6c1360c2bf234c73572a865f119d0518aca8154Ted Kremenek
2618570f0b0fde7ca812f8d37f52305f3df4dd2ce01Chris Lattner  // Add one big table tag that surrounds all of the code.
262d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar  RB.InsertTextBefore(0, "<table class=\"code\">\n");
263d7407dc92c7d19cafce429e7e1cf9819d3fc0b92Daniel Dunbar  RB.InsertTextAfter(FileEnd - FileBeg, "</table>");
264b485cd1e0a5a1e942d0e682b9b1c4bc9df111528Ted Kremenek}
265ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek
2662b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattnervoid html::AddHeaderFooterInternalBuiltinCSS(Rewriter& R, FileID FID,
267f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek                                             const char *title) {
268ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek
2692b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID);
270ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek  const char* FileStart = Buf->getBufferStart();
271ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek  const char* FileEnd = Buf->getBufferEnd();
272ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek
2732b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  SourceLocation StartLoc = R.getSourceMgr().getLocForStartOfFile(FID);
2742b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  SourceLocation EndLoc = StartLoc.getFileLocWithOffset(FileEnd-FileStart);
275ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek
276a95d3750441ac8ad03e36af8e6e74039c9a3109dTed Kremenek  std::string s;
277a95d3750441ac8ad03e36af8e6e74039c9a3109dTed Kremenek  llvm::raw_string_ostream os(s);
278f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek  os << "<!doctype html>\n" // Use HTML 5 doctype
279f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek        "<html>\n<head>\n";
280f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek
281f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek  if (title)
282f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek    os << "<title>" << html::EscapeText(title) << "</title>\n";
283f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek
284f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek  os << "<style type=\"text/css\">\n"
28570bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " body { color:#000000; background-color:#ffffff }\n"
28670bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " body { font-family:Helvetica, sans-serif; font-size:10pt }\n"
2874b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      " h1 { font-size:14pt }\n"
288f5016260522e449e9bacdb0e5a87ad3932d9fbd4Ted Kremenek      " .code { border-collapse:collapse; width:100%; }\n"
28970bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .code { font-family: \"Andale Mono\", monospace; font-size:10pt }\n"
29070bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .code { line-height: 1.2em }\n"
291f5016260522e449e9bacdb0e5a87ad3932d9fbd4Ted Kremenek      " .comment { color: green; font-style: oblique }\n"
292f5016260522e449e9bacdb0e5a87ad3932d9fbd4Ted Kremenek      " .keyword { color: blue }\n"
293cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      " .string_literal { color: red }\n"
294f5016260522e449e9bacdb0e5a87ad3932d9fbd4Ted Kremenek      " .directive { color: darkmagenta }\n"
2956f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner      // Macro expansions.
29607339a63b46e38c954fcccbef721c609d0c2040eTed Kremenek      " .expansion { display: none; }\n"
29707339a63b46e38c954fcccbef721c609d0c2040eTed Kremenek      " .macro:hover .expansion { display: block; border: 2px solid #FF0000; "
298dc5be47542e6d4a28d20abf9c0f0a0edd72939b6Chris Lattner          "padding: 2px; background-color:#FFF0F0; font-weight: normal; "
2996f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner          "  -webkit-border-radius:5px;  -webkit-box-shadow:1px 1px 7px #000; "
3008aa06aca8b2d3771a5405d789b2e704149045dd4Chris Lattner          "position: absolute; top: -1em; left:10em; z-index: 1 } \n"
301f5016260522e449e9bacdb0e5a87ad3932d9fbd4Ted Kremenek      " .macro { color: darkmagenta; background-color:LemonChiffon;"
3026f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner             // Macros are position: relative to provide base for expansions.
3036f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner             " position: relative }\n"
30470bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .num { width:2.5em; padding-right:2ex; background-color:#eeeeee }\n"
3052223622d113d7cba04c2dfdbe032e2ba6ba10bc4Ted Kremenek      " .num { text-align:right; font-size:8pt }\n"
30670bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .num { color:#444444 }\n"
30770bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .line { padding-left: 1ex; border-left: 3px solid #ccc }\n"
30870bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .line { white-space: pre }\n"
30970bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .msg { -webkit-box-shadow:1px 1px 7px #000 }\n"
31070bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .msg { -webkit-border-radius:5px }\n"
3112223622d113d7cba04c2dfdbe032e2ba6ba10bc4Ted Kremenek      " .msg { font-family:Helvetica, sans-serif; font-size:8pt }\n"
31270bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .msg { float:left }\n"
3133c59823096fe28a69a81f899c7f9f0e6eb8071a0Ted Kremenek      " .msg { padding:0.25em 1ex 0.25em 1ex }\n"
31470bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .msg { margin-top:10px; margin-bottom:10px }\n"
3152f10398814e8d58cce029a7e73af21bb274dcd42Ted Kremenek      " .msg { font-weight:bold }\n"
31680bae763da8bf3f3c73379a1e5d10f5bce266bcaTed Kremenek      " .msg { max-width:60em; word-wrap: break-word; white-space: pre-wrap }\n"
31780bae763da8bf3f3c73379a1e5d10f5bce266bcaTed Kremenek      " .msgT { padding:0x; spacing:0x }\n"
3182f10398814e8d58cce029a7e73af21bb274dcd42Ted Kremenek      " .msgEvent { background-color:#fff8b4; color:#000000 }\n"
31980bae763da8bf3f3c73379a1e5d10f5bce266bcaTed Kremenek      " .msgControl { background-color:#bbbbbb; color:#000000 }\n"
32070bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .mrange { background-color:#dfddf3 }\n"
32170bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek      " .mrange { border-bottom:1px solid #6F9DBE }\n"
3223c59823096fe28a69a81f899c7f9f0e6eb8071a0Ted Kremenek      " .PathIndex { font-weight: bold; padding:0px 5px 0px 5px; "
3233c59823096fe28a69a81f899c7f9f0e6eb8071a0Ted Kremenek        "margin-right:5px; }\n"
32400f01e440573b2bdf6549991e0ca48cc6747e3a2Ted Kremenek      " .PathIndex { -webkit-border-radius:8px }\n"
32500f01e440573b2bdf6549991e0ca48cc6747e3a2Ted Kremenek      " .PathIndexEvent { background-color:#bfba87 }\n"
32600f01e440573b2bdf6549991e0ca48cc6747e3a2Ted Kremenek      " .PathIndexControl { background-color:#8c8c8c }\n"
3274b2d3f7bcc4df31157df443af1b80bcaa9b58bbaDouglas Gregor      " .CodeInsertionHint { font-weight: bold; background-color: #10dd10 }\n"
3284b2d3f7bcc4df31157df443af1b80bcaa9b58bbaDouglas Gregor      " .CodeRemovalHint { background-color:#de1010 }\n"
3294b2d3f7bcc4df31157df443af1b80bcaa9b58bbaDouglas Gregor      " .CodeRemovalHint { border-bottom:1px solid #6F9DBE }\n"
3304b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      " table.simpletable {\n"
3314b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      "   padding: 5px;\n"
3324b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      "   font-size:12pt;\n"
3334b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      "   margin:20px;\n"
3344b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      "   border-collapse: collapse; border-spacing: 0px;\n"
3354b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      " }\n"
3364b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      " td.rowname {\n"
3374b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      "   text-align:right; font-weight:bold; color:#444444;\n"
3384b0f81323b518429203051bbcd4864bbf4b000a9Ted Kremenek      "   padding-right:2ex; }\n"
339f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek      "</style>\n</head>\n<body>";
34070bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek
341f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek  // Generate header
342f6f593fae2f0531b4bc06891941f7fbba5217618Ted Kremenek  R.InsertStrBefore(StartLoc, os.str());
343ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek  // Generate footer
344ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek
34570bcba6030a76edf46c4f941ad9a5297a1f98c47Ted Kremenek  R.InsertCStrAfter(EndLoc, "</body></html>\n");
346ad0a203130dc5d1fb7231b88767174511424fa98Ted Kremenek}
3473245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner
3483245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner/// SyntaxHighlight - Relex the specified FileID and annotate the HTML with
3493245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner/// information about keywords, macro expansions etc.  This uses the macro
3503245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner/// table state from the end of the file, so it won't be perfectly accurate,
3513245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner/// but it will be reasonably close.
3522b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattnervoid html::SyntaxHighlight(Rewriter &R, FileID FID, Preprocessor &PP) {
3532b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  RewriteBuffer &RB = R.getEditBuffer(FID);
3543245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner
35505db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  const SourceManager &SM = PP.getSourceManager();
35605db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  Lexer L(FID, SM, PP.getLangOptions());
357025c3a66402fb713c2d9bf5dc174ff264765379aChris Lattner  const char *BufferStart = L.getBufferStart();
358a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner
3593245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner  // Inform the preprocessor that we want to retain comments as tokens, so we
3603245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner  // can highlight them.
361678c6358c8d4e368c78629099142397c63c1ee35Chris Lattner  L.SetCommentRetentionState(true);
3623245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner
363c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  // Lex all the tokens in raw mode, to avoid entering #includes or expanding
364c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  // macros.
3653245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner  Token Tok;
366590f0cc643274267d4d41125b62557e1d87886c3Chris Lattner  L.LexFromRawLexer(Tok);
36774ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner
36874ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner  while (Tok.isNot(tok::eof)) {
36974ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner    // Since we are lexing unexpanded tokens, all tokens are from the main
37074ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner    // FileID.
37105db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    unsigned TokOffs = SM.getFileOffset(Tok.getLocation());
3723245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner    unsigned TokLen = Tok.getLength();
3733245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner    switch (Tok.getKind()) {
374a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner    default: break;
375a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner    case tok::identifier: {
376a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner      // Fill in Result.IdentifierInfo, looking up the identifier in the
377a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner      // identifier table.
378a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner      IdentifierInfo *II = PP.LookUpIdentifierInfo(Tok, BufferStart+TokOffs);
379a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner
380a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner      // If this is a pp-identifier, for a keyword, highlight it as such.
3815ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner      if (II->getTokenID() != tok::identifier)
3825ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner        HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart,
3835ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner                       "<span class='keyword'>", "</span>");
384c4586c234edd8df0477a895aebcbc3eb220aed6bChris Lattner      break;
385a745e8c52839d9c8dd0fd8d5276b4eab182ec7f2Chris Lattner    }
3863245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner    case tok::comment:
3875ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner      HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart,
3885ef3e2c45f13fccdb0d7bbcf24c1beee8eee6f64Chris Lattner                     "<span class='comment'>", "</span>");
3893245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner      break;
390cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek    case tok::wide_string_literal:
391cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      // Chop off the L prefix
392cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      ++TokOffs;
393cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      --TokLen;
394cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      // FALL THROUGH.
395cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek    case tok::string_literal:
396cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart,
397cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek                     "<span class='string_literal'>", "</span>");
398cc1b8532a113fa3216096757b3b4e203867bd5e0Ted Kremenek      break;
3995deb96d06583abb751463427457d46041af262d0Chris Lattner    case tok::hash: {
40074ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner      // If this is a preprocessor directive, all tokens to end of line are too.
4015deb96d06583abb751463427457d46041af262d0Chris Lattner      if (!Tok.isAtStartOfLine())
4025deb96d06583abb751463427457d46041af262d0Chris Lattner        break;
4035deb96d06583abb751463427457d46041af262d0Chris Lattner
4045deb96d06583abb751463427457d46041af262d0Chris Lattner      // Eat all of the tokens until we get to the next one at the start of
4055deb96d06583abb751463427457d46041af262d0Chris Lattner      // line.
4065deb96d06583abb751463427457d46041af262d0Chris Lattner      unsigned TokEnd = TokOffs+TokLen;
407590f0cc643274267d4d41125b62557e1d87886c3Chris Lattner      L.LexFromRawLexer(Tok);
4085deb96d06583abb751463427457d46041af262d0Chris Lattner      while (!Tok.isAtStartOfLine() && Tok.isNot(tok::eof)) {
40905db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner        TokEnd = SM.getFileOffset(Tok.getLocation())+Tok.getLength();
410590f0cc643274267d4d41125b62557e1d87886c3Chris Lattner        L.LexFromRawLexer(Tok);
41174ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner      }
4125deb96d06583abb751463427457d46041af262d0Chris Lattner
4135deb96d06583abb751463427457d46041af262d0Chris Lattner      // Find end of line.  This is a hack.
4145deb96d06583abb751463427457d46041af262d0Chris Lattner      HighlightRange(RB, TokOffs, TokEnd, BufferStart,
4155deb96d06583abb751463427457d46041af262d0Chris Lattner                     "<span class='directive'>", "</span>");
4165deb96d06583abb751463427457d46041af262d0Chris Lattner
4175deb96d06583abb751463427457d46041af262d0Chris Lattner      // Don't skip the next token.
4185deb96d06583abb751463427457d46041af262d0Chris Lattner      continue;
4195deb96d06583abb751463427457d46041af262d0Chris Lattner    }
4203245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner    }
4213245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner
422590f0cc643274267d4d41125b62557e1d87886c3Chris Lattner    L.LexFromRawLexer(Tok);
42374ea3e5c57c087c046223096a97ea4e365f85eb6Chris Lattner  }
4243245a0a1c7a4fd74fca845b2edba275bb126d773Chris Lattner}
425c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner
4267c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattnernamespace {
4277c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner/// IgnoringDiagClient - This is a diagnostic client that just ignores all
4287c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner/// diags.
4297c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattnerclass IgnoringDiagClient : public DiagnosticClient {
4307c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  void HandleDiagnostic(Diagnostic::Level DiagLevel,
4317c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner                        const DiagnosticInfo &Info) {
4327c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner    // Just ignore it.
4337c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  }
4347c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner};
4357c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner}
4367c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner
437c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner/// HighlightMacros - This uses the macro table state from the end of the
43805db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner/// file, to re-expand macros and insert (into the HTML) information about the
439c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner/// macro expansions.  This won't be perfectly perfect, but it will be
440c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner/// reasonably close.
4412b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattnervoid html::HighlightMacros(Rewriter &R, FileID FID, Preprocessor& PP) {
44205db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  // Re-lex the raw token stream into a token buffer.
44305db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  const SourceManager &SM = PP.getSourceManager();
44405db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  std::vector<Token> TokenStream;
44505db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
44605db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  Lexer L(FID, SM, PP.getLangOptions());
44705db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
44805db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  // Lex all the tokens in raw mode, to avoid entering #includes or expanding
44905db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  // macros.
45005db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  while (1) {
45105db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    Token Tok;
45205db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    L.LexFromRawLexer(Tok);
45305db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
45405db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    // If this is a # at the start of a line, discard it from the token stream.
45505db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    // We don't want the re-preprocess step to see #defines, #includes or other
45605db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    // preprocessor directives.
45705db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    if (Tok.is(tok::hash) && Tok.isAtStartOfLine())
45805db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner      continue;
459f0b26b1d9dee57c84e55f05200802658a7312683Chris Lattner
460f0b26b1d9dee57c84e55f05200802658a7312683Chris Lattner    // If this is a ## token, change its kind to unknown so that repreprocessing
461f0b26b1d9dee57c84e55f05200802658a7312683Chris Lattner    // it will not produce an error.
462f0b26b1d9dee57c84e55f05200802658a7312683Chris Lattner    if (Tok.is(tok::hashhash))
463f0b26b1d9dee57c84e55f05200802658a7312683Chris Lattner      Tok.setKind(tok::unknown);
46405db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
46505db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    // If this raw token is an identifier, the raw lexer won't have looked up
46605db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    // the corresponding identifier info for it.  Do this now so that it will be
46705db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    // macro expanded when we re-preprocess it.
46805db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    if (Tok.is(tok::identifier)) {
46905db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner      // Change the kind of this identifier to the appropriate token kind, e.g.
47005db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner      // turning "for" into a keyword.
47105db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner      Tok.setKind(PP.LookUpIdentifierInfo(Tok)->getTokenID());
47205db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    }
47305db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
47405db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    TokenStream.push_back(Tok);
47505db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
47605db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner    if (Tok.is(tok::eof)) break;
47705db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  }
47805db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
4797c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  // Temporarily change the diagnostics object so that we ignore any generated
4807c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  // diagnostics from this pass.
4817c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  IgnoringDiagClient TmpDC;
4827c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  Diagnostic TmpDiags(&TmpDC);
4837c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner
4847c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  Diagnostic *OldDiags = &PP.getDiagnostics();
4857c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  PP.setDiagnostics(TmpDiags);
4867c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner
487c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  // Inform the preprocessor that we don't want comments.
488fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek  PP.SetCommentRetentionState(false, false);
48905db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner
49005db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  // Enter the tokens we just lexed.  This will cause them to be macro expanded
49105db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  // but won't enter sub-files (because we removed #'s).
49205db4278ecd193edcff63fb8c54818226fceaad2Chris Lattner  PP.EnterTokenStream(&TokenStream[0], TokenStream.size(), false, false);
493c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner
494867924dbeca06870573fd58d620032da6994b223Chris Lattner  TokenConcatenation ConcatInfo(PP);
495867924dbeca06870573fd58d620032da6994b223Chris Lattner
496c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  // Lex all the tokens.
497c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  Token Tok;
498fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek  PP.Lex(Tok);
499c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  while (Tok.isNot(tok::eof)) {
500c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    // Ignore non-macro tokens.
501c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    if (!Tok.getLocation().isMacroID()) {
502fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek      PP.Lex(Tok);
503c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner      continue;
504c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    }
505c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner
506b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    // Okay, we have the first token of a macro expansion: highlight the
507b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    // instantiation by inserting a start tag before the macro instantiation and
508b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    // end tag after it.
509b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    std::pair<SourceLocation, SourceLocation> LLoc =
510b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner      SM.getInstantiationRange(Tok.getLocation());
511c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner
512b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    // Ignore tokens whose instantiation location was not the main file.
513b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    if (SM.getFileID(LLoc.first) != FID) {
514fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek      PP.Lex(Tok);
515c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner      continue;
516c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    }
517b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner
518b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner    assert(SM.getFileID(LLoc.second) == FID &&
519b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner           "Start and end of expansion must be in the same ultimate file!");
520e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner
521b83ded0db9824b3b0417bf46540ed34d48776673Ted Kremenek    std::string Expansion = EscapeText(PP.getSpelling(Tok));
5226f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner    unsigned LineLen = Expansion.size();
5236f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner
524867924dbeca06870573fd58d620032da6994b223Chris Lattner    Token PrevTok = Tok;
525c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    // Okay, eat this token, getting the next one.
526fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek    PP.Lex(Tok);
527c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner
528c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    // Skip all the rest of the tokens that are part of this macro
529c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    // instantiation.  It would be really nice to pop up a window with all the
530c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    // spelling of the tokens or something.
531c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner    while (!Tok.is(tok::eof) &&
532b7949a9a91ad8e49124cd6a82ff98972d7efaadcChris Lattner           SM.getInstantiationLoc(Tok.getLocation()) == LLoc.first) {
5336f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner      // Insert a newline if the macro expansion is getting large.
5346f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner      if (LineLen > 60) {
5356f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner        Expansion += "<br>";
5366f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner        LineLen = 0;
5376f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner      }
5386f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner
5396f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner      LineLen -= Expansion.size();
540867924dbeca06870573fd58d620032da6994b223Chris Lattner
541867924dbeca06870573fd58d620032da6994b223Chris Lattner      // If the tokens were already space separated, or if they must be to avoid
542867924dbeca06870573fd58d620032da6994b223Chris Lattner      // them being implicitly pasted, add a space between them.
543867924dbeca06870573fd58d620032da6994b223Chris Lattner      if (Tok.hasLeadingSpace() ||
544867924dbeca06870573fd58d620032da6994b223Chris Lattner          ConcatInfo.AvoidConcat(PrevTok, Tok))
545867924dbeca06870573fd58d620032da6994b223Chris Lattner        Expansion += ' ';
546867924dbeca06870573fd58d620032da6994b223Chris Lattner
5479227c6953497be34281354f949d6f4cd34a696ccChris Lattner      // Escape any special characters in the token text.
548867924dbeca06870573fd58d620032da6994b223Chris Lattner      Expansion += EscapeText(PP.getSpelling(Tok));
5496f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner      LineLen += Expansion.size();
550867924dbeca06870573fd58d620032da6994b223Chris Lattner
551867924dbeca06870573fd58d620032da6994b223Chris Lattner      PrevTok = Tok;
552fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek      PP.Lex(Tok);
5536f46be279f4bc8fc24611f060258bcfbe1c175c4Chris Lattner    }
5549227c6953497be34281354f949d6f4cd34a696ccChris Lattner
555e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner
556e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner    // Insert the expansion as the end tag, so that multi-line macros all get
557e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner    // highlighted.
558e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner    Expansion = "<span class='expansion'>" + Expansion + "</span></span>";
559e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner
560e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner    HighlightRange(R, LLoc.first, LLoc.second,
561e9e6cb93afa51eee1f83abc7e2cb7d8a0453d810Chris Lattner                   "<span class='macro'>", Expansion.c_str());
562c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner  }
5637c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner
5647c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  // Restore diagnostics object back to its own thing.
5657c175fb196a2bc3dbc86ea3865c713e1875f3f6dChris Lattner  PP.setDiagnostics(*OldDiags);
566c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner}
567c54d50a4180520370c12dd7d06d035263d357d56Chris Lattner
5682b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattnervoid html::HighlightMacros(Rewriter &R, FileID FID,
569fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek                           PreprocessorFactory &PPF) {
570fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek
571fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek  llvm::OwningPtr<Preprocessor> PP(PPF.CreatePreprocessor());
5722b2453a7d8fe732561795431f39ceb2b2a832d84Chris Lattner  HighlightMacros(R, FID, *PP);
573fb58609c5b3f0d665ea58e37ef39eb7ea74758a4Ted Kremenek}
574