Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 1 | //== HTMLRewrite.cpp - Translate source code into prettified HTML --*- C++ -*-// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
Alp Toker | f6a24ce | 2013-12-05 16:25:25 +0000 | [diff] [blame] | 10 | // This file defines the HTMLRewriter class, which is used to translate the |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 11 | // text of a source file into prettified HTML. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
Ted Kremenek | cdf8149 | 2012-09-01 05:09:24 +0000 | [diff] [blame] | 15 | #include "clang/Rewrite/Core/HTMLRewrite.h" |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 16 | #include "clang/Basic/SourceManager.h" |
Chandler Carruth | 3a02247 | 2012-12-04 09:13:33 +0000 | [diff] [blame] | 17 | #include "clang/Lex/Preprocessor.h" |
Chandler Carruth | 3a02247 | 2012-12-04 09:13:33 +0000 | [diff] [blame] | 18 | #include "clang/Lex/TokenConcatenation.h" |
| 19 | #include "clang/Rewrite/Core/Rewriter.h" |
Chandler Carruth | 3a02247 | 2012-12-04 09:13:33 +0000 | [diff] [blame] | 20 | #include "llvm/ADT/SmallString.h" |
Abramo Bagnara | ea4f7c7 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 21 | #include "llvm/Support/ErrorHandling.h" |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 22 | #include "llvm/Support/MemoryBuffer.h" |
Ted Kremenek | 2d470fc | 2008-09-13 05:16:45 +0000 | [diff] [blame] | 23 | #include "llvm/Support/raw_ostream.h" |
Ahmed Charles | dfca6f9 | 2014-03-09 11:36:40 +0000 | [diff] [blame] | 24 | #include <memory> |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 25 | using namespace clang; |
| 26 | |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 27 | |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 28 | /// HighlightRange - Highlight a range in the source code with the specified |
| 29 | /// start/end tags. B/E must be in the same file. This ensures that |
| 30 | /// start/end tags are placed at the start/end of each line if the range is |
| 31 | /// multiline. |
| 32 | void html::HighlightRange(Rewriter &R, SourceLocation B, SourceLocation E, |
| 33 | const char *StartTag, const char *EndTag) { |
| 34 | SourceManager &SM = R.getSourceMgr(); |
Chandler Carruth | 35f5320 | 2011-07-25 16:49:02 +0000 | [diff] [blame] | 35 | B = SM.getExpansionLoc(B); |
| 36 | E = SM.getExpansionLoc(E); |
Chris Lattner | cbc35ecb | 2009-01-19 07:46:45 +0000 | [diff] [blame] | 37 | FileID FID = SM.getFileID(B); |
| 38 | assert(SM.getFileID(E) == FID && "B/E not in the same file!"); |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 39 | |
Chris Lattner | c360bf2 | 2009-01-27 06:27:13 +0000 | [diff] [blame] | 40 | unsigned BOffset = SM.getFileOffset(B); |
| 41 | unsigned EOffset = SM.getFileOffset(E); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 42 | |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 43 | // Include the whole end token in the range. |
Chris Lattner | 184e65d | 2009-04-14 23:22:57 +0000 | [diff] [blame] | 44 | EOffset += Lexer::MeasureTokenLength(E, R.getSourceMgr(), R.getLangOpts()); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 45 | |
Douglas Gregor | e0fbb83 | 2010-03-16 00:06:06 +0000 | [diff] [blame] | 46 | bool Invalid = false; |
Benjamin Kramer | eb92dc0 | 2010-03-16 14:14:31 +0000 | [diff] [blame] | 47 | const char *BufferStart = SM.getBufferData(FID, &Invalid).data(); |
Douglas Gregor | e0fbb83 | 2010-03-16 00:06:06 +0000 | [diff] [blame] | 48 | if (Invalid) |
Douglas Gregor | 802b776 | 2010-03-15 22:54:52 +0000 | [diff] [blame] | 49 | return; |
Douglas Gregor | 802b776 | 2010-03-15 22:54:52 +0000 | [diff] [blame] | 50 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 51 | HighlightRange(R.getEditBuffer(FID), BOffset, EOffset, |
Douglas Gregor | 802b776 | 2010-03-15 22:54:52 +0000 | [diff] [blame] | 52 | BufferStart, StartTag, EndTag); |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 53 | } |
| 54 | |
| 55 | /// HighlightRange - This is the same as the above method, but takes |
| 56 | /// decomposed file locations. |
| 57 | void html::HighlightRange(RewriteBuffer &RB, unsigned B, unsigned E, |
| 58 | const char *BufferStart, |
| 59 | const char *StartTag, const char *EndTag) { |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 60 | // Insert the tag at the absolute start/end of the range. |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 61 | RB.InsertTextAfter(B, StartTag); |
| 62 | RB.InsertTextBefore(E, EndTag); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 63 | |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 64 | // Scan the range to see if there is a \r or \n. If so, and if the line is |
| 65 | // not blank, insert tags on that line as well. |
| 66 | bool HadOpenTag = true; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 67 | |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 68 | unsigned LastNonWhiteSpace = B; |
| 69 | for (unsigned i = B; i != E; ++i) { |
| 70 | switch (BufferStart[i]) { |
| 71 | case '\r': |
| 72 | case '\n': |
| 73 | // Okay, we found a newline in the range. If we have an open tag, we need |
| 74 | // to insert a close tag at the first non-whitespace before the newline. |
| 75 | if (HadOpenTag) |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 76 | RB.InsertTextBefore(LastNonWhiteSpace+1, EndTag); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 77 | |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 78 | // Instead of inserting an open tag immediately after the newline, we |
| 79 | // wait until we see a non-whitespace character. This prevents us from |
| 80 | // inserting tags around blank lines, and also allows the open tag to |
| 81 | // be put *after* whitespace on a non-blank line. |
| 82 | HadOpenTag = false; |
| 83 | break; |
| 84 | case '\0': |
| 85 | case ' ': |
| 86 | case '\t': |
| 87 | case '\f': |
| 88 | case '\v': |
| 89 | // Ignore whitespace. |
| 90 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 91 | |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 92 | default: |
| 93 | // If there is no tag open, do it now. |
| 94 | if (!HadOpenTag) { |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 95 | RB.InsertTextAfter(i, StartTag); |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 96 | HadOpenTag = true; |
| 97 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 98 | |
Chris Lattner | 10dbbb0 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 99 | // Remember this character. |
| 100 | LastNonWhiteSpace = i; |
| 101 | break; |
| 102 | } |
| 103 | } |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 104 | } |
| 105 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 106 | void html::EscapeText(Rewriter &R, FileID FID, |
Ted Kremenek | 5f7ece0 | 2008-04-08 22:37:58 +0000 | [diff] [blame] | 107 | bool EscapeSpaces, bool ReplaceTabs) { |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 108 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 109 | const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID); |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 110 | const char* C = Buf->getBufferStart(); |
| 111 | const char* FileEnd = Buf->getBufferEnd(); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 112 | |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 113 | assert (C <= FileEnd); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 114 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 115 | RewriteBuffer &RB = R.getEditBuffer(FID); |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 116 | |
| 117 | unsigned ColNo = 0; |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 118 | for (unsigned FilePos = 0; C != FileEnd ; ++C, ++FilePos) { |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 119 | switch (*C) { |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 120 | default: ++ColNo; break; |
| 121 | case '\n': |
| 122 | case '\r': |
| 123 | ColNo = 0; |
| 124 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 125 | |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 126 | case ' ': |
| 127 | if (EscapeSpaces) |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 128 | RB.ReplaceText(FilePos, 1, " "); |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 129 | ++ColNo; |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 130 | break; |
Chris Lattner | 1e517a7 | 2008-04-19 23:56:30 +0000 | [diff] [blame] | 131 | case '\f': |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 132 | RB.ReplaceText(FilePos, 1, "<hr>"); |
Chris Lattner | 1e517a7 | 2008-04-19 23:56:30 +0000 | [diff] [blame] | 133 | ColNo = 0; |
| 134 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 135 | |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 136 | case '\t': { |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 137 | if (!ReplaceTabs) |
Ted Kremenek | c599179 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 138 | break; |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 139 | unsigned NumSpaces = 8-(ColNo&7); |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 140 | if (EscapeSpaces) |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 141 | RB.ReplaceText(FilePos, 1, |
Chris Lattner | 0e62c1c | 2011-07-23 10:55:15 +0000 | [diff] [blame] | 142 | StringRef(" " |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 143 | " ", 6*NumSpaces)); |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 144 | else |
Chris Lattner | 0e62c1c | 2011-07-23 10:55:15 +0000 | [diff] [blame] | 145 | RB.ReplaceText(FilePos, 1, StringRef(" ", NumSpaces)); |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 146 | ColNo += NumSpaces; |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 147 | break; |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 148 | } |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 149 | case '<': |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 150 | RB.ReplaceText(FilePos, 1, "<"); |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 151 | ++ColNo; |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 152 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 153 | |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 154 | case '>': |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 155 | RB.ReplaceText(FilePos, 1, ">"); |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 156 | ++ColNo; |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 157 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 158 | |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 159 | case '&': |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 160 | RB.ReplaceText(FilePos, 1, "&"); |
Chris Lattner | 4bbd164 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 161 | ++ColNo; |
Chris Lattner | e7d696e | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 162 | break; |
Ted Kremenek | 7dcc822 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 163 | } |
| 164 | } |
| 165 | } |
| 166 | |
Benjamin Kramer | fbf914c | 2013-06-12 18:13:05 +0000 | [diff] [blame] | 167 | std::string html::EscapeText(StringRef s, bool EscapeSpaces, bool ReplaceTabs) { |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 168 | |
Ted Kremenek | 561dfe3 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 169 | unsigned len = s.size(); |
Ted Kremenek | 2d470fc | 2008-09-13 05:16:45 +0000 | [diff] [blame] | 170 | std::string Str; |
| 171 | llvm::raw_string_ostream os(Str); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 172 | |
Ted Kremenek | 561dfe3 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 173 | for (unsigned i = 0 ; i < len; ++i) { |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 174 | |
Ted Kremenek | 561dfe3 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 175 | char c = s[i]; |
Ted Kremenek | 561dfe3 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 176 | switch (c) { |
Chris Lattner | c326f7e | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 177 | default: |
| 178 | os << c; break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 179 | |
Chris Lattner | c326f7e | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 180 | case ' ': |
| 181 | if (EscapeSpaces) os << " "; |
| 182 | else os << ' '; |
| 183 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 184 | |
Zhongxing Xu | b562444 | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 185 | case '\t': |
| 186 | if (ReplaceTabs) { |
| 187 | if (EscapeSpaces) |
| 188 | for (unsigned i = 0; i < 4; ++i) |
| 189 | os << " "; |
| 190 | else |
| 191 | for (unsigned i = 0; i < 4; ++i) |
| 192 | os << " "; |
| 193 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 194 | else |
Zhongxing Xu | b562444 | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 195 | os << c; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 196 | |
Zhongxing Xu | b562444 | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 197 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 198 | |
Zhongxing Xu | b562444 | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 199 | case '<': os << "<"; break; |
| 200 | case '>': os << ">"; break; |
| 201 | case '&': os << "&"; break; |
Ted Kremenek | 561dfe3 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 202 | } |
| 203 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 204 | |
Ted Kremenek | 561dfe3 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 205 | return os.str(); |
| 206 | } |
| 207 | |
Chris Lattner | c326f7e | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 208 | static void AddLineNumber(RewriteBuffer &RB, unsigned LineNo, |
| 209 | unsigned B, unsigned E) { |
Dylan Noblesmith | 2c1dd27 | 2012-02-05 02:13:05 +0000 | [diff] [blame] | 210 | SmallString<256> Str; |
Daniel Dunbar | 69c300d | 2009-08-19 18:30:37 +0000 | [diff] [blame] | 211 | llvm::raw_svector_ostream OS(Str); |
| 212 | |
| 213 | OS << "<tr><td class=\"num\" id=\"LN" |
| 214 | << LineNo << "\">" |
| 215 | << LineNo << "</td><td class=\"line\">"; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 216 | |
Ted Kremenek | c599179 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 217 | if (B == E) { // Handle empty lines. |
Daniel Dunbar | 69c300d | 2009-08-19 18:30:37 +0000 | [diff] [blame] | 218 | OS << " </td></tr>"; |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 219 | RB.InsertTextBefore(B, OS.str()); |
Chris Lattner | 05e5310 | 2008-04-16 04:11:35 +0000 | [diff] [blame] | 220 | } else { |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 221 | RB.InsertTextBefore(B, OS.str()); |
| 222 | RB.InsertTextBefore(E, "</td></tr>"); |
Ted Kremenek | c599179 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 223 | } |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 224 | } |
| 225 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 226 | void html::AddLineNumbers(Rewriter& R, FileID FID) { |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 227 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 228 | const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID); |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 229 | const char* FileBeg = Buf->getBufferStart(); |
| 230 | const char* FileEnd = Buf->getBufferEnd(); |
| 231 | const char* C = FileBeg; |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 232 | RewriteBuffer &RB = R.getEditBuffer(FID); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 233 | |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 234 | assert (C <= FileEnd); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 235 | |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 236 | unsigned LineNo = 0; |
| 237 | unsigned FilePos = 0; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 238 | |
| 239 | while (C != FileEnd) { |
| 240 | |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 241 | ++LineNo; |
| 242 | unsigned LineStartPos = FilePos; |
| 243 | unsigned LineEndPos = FileEnd - FileBeg; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 244 | |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 245 | assert (FilePos <= LineEndPos); |
| 246 | assert (C < FileEnd); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 247 | |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 248 | // Scan until the newline (or end-of-file). |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 249 | |
Ted Kremenek | c599179 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 250 | while (C != FileEnd) { |
| 251 | char c = *C; |
| 252 | ++C; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 253 | |
Ted Kremenek | c599179 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 254 | if (c == '\n') { |
| 255 | LineEndPos = FilePos++; |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 256 | break; |
| 257 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 258 | |
Ted Kremenek | c599179 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 259 | ++FilePos; |
| 260 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 261 | |
Chris Lattner | c326f7e | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 262 | AddLineNumber(RB, LineNo, LineStartPos, LineEndPos); |
Ted Kremenek | 3f83926 | 2008-03-19 05:07:26 +0000 | [diff] [blame] | 263 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 264 | |
Chris Lattner | c326f7e | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 265 | // Add one big table tag that surrounds all of the code. |
Daniel Dunbar | dec484a | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 266 | RB.InsertTextBefore(0, "<table class=\"code\">\n"); |
| 267 | RB.InsertTextAfter(FileEnd - FileBeg, "</table>"); |
Ted Kremenek | 5792ceb | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 268 | } |
Ted Kremenek | 966da4a | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 269 | |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 270 | void html::AddHeaderFooterInternalBuiltinCSS(Rewriter& R, FileID FID, |
Ted Kremenek | 79ab0fa | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 271 | const char *title) { |
Ted Kremenek | 966da4a | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 272 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 273 | const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID); |
Ted Kremenek | 966da4a | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 274 | const char* FileStart = Buf->getBufferStart(); |
| 275 | const char* FileEnd = Buf->getBufferEnd(); |
| 276 | |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 277 | SourceLocation StartLoc = R.getSourceMgr().getLocForStartOfFile(FID); |
Argyrios Kyrtzidis | e6e67de | 2011-09-19 20:40:19 +0000 | [diff] [blame] | 278 | SourceLocation EndLoc = StartLoc.getLocWithOffset(FileEnd-FileStart); |
Ted Kremenek | 966da4a | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 279 | |
Ted Kremenek | 2d470fc | 2008-09-13 05:16:45 +0000 | [diff] [blame] | 280 | std::string s; |
| 281 | llvm::raw_string_ostream os(s); |
Ted Kremenek | 79ab0fa | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 282 | os << "<!doctype html>\n" // Use HTML 5 doctype |
| 283 | "<html>\n<head>\n"; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 284 | |
Ted Kremenek | 79ab0fa | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 285 | if (title) |
| 286 | os << "<title>" << html::EscapeText(title) << "</title>\n"; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 287 | |
Ted Kremenek | 79ab0fa | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 288 | os << "<style type=\"text/css\">\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 289 | " body { color:#000000; background-color:#ffffff }\n" |
| 290 | " body { font-family:Helvetica, sans-serif; font-size:10pt }\n" |
Ted Kremenek | 7d6219f | 2008-04-15 21:25:08 +0000 | [diff] [blame] | 291 | " h1 { font-size:14pt }\n" |
Ted Kremenek | a821e08 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 292 | " .code { border-collapse:collapse; width:100%; }\n" |
Ted Kremenek | 6b33356 | 2012-01-20 20:39:55 +0000 | [diff] [blame] | 293 | " .code { font-family: \"Monospace\", monospace; font-size:10pt }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 294 | " .code { line-height: 1.2em }\n" |
Ted Kremenek | a821e08 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 295 | " .comment { color: green; font-style: oblique }\n" |
| 296 | " .keyword { color: blue }\n" |
Ted Kremenek | afe2a9f | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 297 | " .string_literal { color: red }\n" |
Ted Kremenek | a821e08 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 298 | " .directive { color: darkmagenta }\n" |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 299 | // Macro expansions. |
Ted Kremenek | c2c08ca | 2008-04-17 19:57:27 +0000 | [diff] [blame] | 300 | " .expansion { display: none; }\n" |
| 301 | " .macro:hover .expansion { display: block; border: 2px solid #FF0000; " |
Chris Lattner | 6929bd8 | 2008-04-17 21:32:46 +0000 | [diff] [blame] | 302 | "padding: 2px; background-color:#FFF0F0; font-weight: normal; " |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 303 | " -webkit-border-radius:5px; -webkit-box-shadow:1px 1px 7px #000; " |
Chris Lattner | f219126 | 2008-04-17 21:28:41 +0000 | [diff] [blame] | 304 | "position: absolute; top: -1em; left:10em; z-index: 1 } \n" |
Ted Kremenek | a821e08 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 305 | " .macro { color: darkmagenta; background-color:LemonChiffon;" |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 306 | // Macros are position: relative to provide base for expansions. |
| 307 | " position: relative }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 308 | " .num { width:2.5em; padding-right:2ex; background-color:#eeeeee }\n" |
Ted Kremenek | a039a62 | 2009-03-10 05:14:32 +0000 | [diff] [blame] | 309 | " .num { text-align:right; font-size:8pt }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 310 | " .num { color:#444444 }\n" |
| 311 | " .line { padding-left: 1ex; border-left: 3px solid #ccc }\n" |
| 312 | " .line { white-space: pre }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 313 | " .msg { -webkit-box-shadow:1px 1px 7px #000 }\n" |
| 314 | " .msg { -webkit-border-radius:5px }\n" |
Ted Kremenek | a039a62 | 2009-03-10 05:14:32 +0000 | [diff] [blame] | 315 | " .msg { font-family:Helvetica, sans-serif; font-size:8pt }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 316 | " .msg { float:left }\n" |
Ted Kremenek | 6c6a098 | 2009-03-03 03:00:21 +0000 | [diff] [blame] | 317 | " .msg { padding:0.25em 1ex 0.25em 1ex }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 318 | " .msg { margin-top:10px; margin-bottom:10px }\n" |
Ted Kremenek | e780823 | 2009-03-02 21:42:01 +0000 | [diff] [blame] | 319 | " .msg { font-weight:bold }\n" |
Ted Kremenek | c62af6c | 2009-03-02 23:05:40 +0000 | [diff] [blame] | 320 | " .msg { max-width:60em; word-wrap: break-word; white-space: pre-wrap }\n" |
| 321 | " .msgT { padding:0x; spacing:0x }\n" |
Ted Kremenek | e780823 | 2009-03-02 21:42:01 +0000 | [diff] [blame] | 322 | " .msgEvent { background-color:#fff8b4; color:#000000 }\n" |
Ted Kremenek | c62af6c | 2009-03-02 23:05:40 +0000 | [diff] [blame] | 323 | " .msgControl { background-color:#bbbbbb; color:#000000 }\n" |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 324 | " .mrange { background-color:#dfddf3 }\n" |
| 325 | " .mrange { border-bottom:1px solid #6F9DBE }\n" |
Jordan Rose | 11790a4 | 2012-08-02 02:26:19 +0000 | [diff] [blame] | 326 | " .PathIndex { font-weight: bold; padding:0px 5px; " |
Ted Kremenek | 6c6a098 | 2009-03-03 03:00:21 +0000 | [diff] [blame] | 327 | "margin-right:5px; }\n" |
Ted Kremenek | ccca5c3 | 2009-03-02 23:39:27 +0000 | [diff] [blame] | 328 | " .PathIndex { -webkit-border-radius:8px }\n" |
| 329 | " .PathIndexEvent { background-color:#bfba87 }\n" |
| 330 | " .PathIndexControl { background-color:#8c8c8c }\n" |
Jordan Rose | 11790a4 | 2012-08-02 02:26:19 +0000 | [diff] [blame] | 331 | " .PathNav a { text-decoration:none; font-size: larger }\n" |
Douglas Gregor | 87f95b0 | 2009-02-26 21:00:50 +0000 | [diff] [blame] | 332 | " .CodeInsertionHint { font-weight: bold; background-color: #10dd10 }\n" |
| 333 | " .CodeRemovalHint { background-color:#de1010 }\n" |
| 334 | " .CodeRemovalHint { border-bottom:1px solid #6F9DBE }\n" |
Ted Kremenek | 7d6219f | 2008-04-15 21:25:08 +0000 | [diff] [blame] | 335 | " table.simpletable {\n" |
| 336 | " padding: 5px;\n" |
| 337 | " font-size:12pt;\n" |
| 338 | " margin:20px;\n" |
| 339 | " border-collapse: collapse; border-spacing: 0px;\n" |
| 340 | " }\n" |
| 341 | " td.rowname {\n" |
| 342 | " text-align:right; font-weight:bold; color:#444444;\n" |
| 343 | " padding-right:2ex; }\n" |
Ted Kremenek | 79ab0fa | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 344 | "</style>\n</head>\n<body>"; |
Ted Kremenek | f17d575 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 345 | |
Ted Kremenek | 79ab0fa | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 346 | // Generate header |
Daniel Dunbar | 62c850f | 2009-08-19 20:32:38 +0000 | [diff] [blame] | 347 | R.InsertTextBefore(StartLoc, os.str()); |
Ted Kremenek | 966da4a | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 348 | // Generate footer |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 349 | |
Daniel Dunbar | 62c850f | 2009-08-19 20:32:38 +0000 | [diff] [blame] | 350 | R.InsertTextAfter(EndLoc, "</body></html>\n"); |
Ted Kremenek | 966da4a | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 351 | } |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 352 | |
| 353 | /// SyntaxHighlight - Relex the specified FileID and annotate the HTML with |
| 354 | /// information about keywords, macro expansions etc. This uses the macro |
| 355 | /// table state from the end of the file, so it won't be perfectly perfect, |
| 356 | /// but it will be reasonably close. |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 357 | void html::SyntaxHighlight(Rewriter &R, FileID FID, const Preprocessor &PP) { |
Chris Lattner | d32480d | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 358 | RewriteBuffer &RB = R.getEditBuffer(FID); |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 359 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 360 | const SourceManager &SM = PP.getSourceManager(); |
Chris Lattner | 710bb87 | 2009-11-30 04:18:44 +0000 | [diff] [blame] | 361 | const llvm::MemoryBuffer *FromFile = SM.getBuffer(FID); |
David Blaikie | bbafb8a | 2012-03-11 07:00:24 +0000 | [diff] [blame] | 362 | Lexer L(FID, FromFile, SM, PP.getLangOpts()); |
Alexander Kornienko | 33a35df | 2013-06-04 16:58:03 +0000 | [diff] [blame] | 363 | const char *BufferStart = L.getBuffer().data(); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 364 | |
| 365 | // Inform the preprocessor that we want to retain comments as tokens, so we |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 366 | // can highlight them. |
Chris Lattner | e9786c3 | 2008-04-16 20:54:51 +0000 | [diff] [blame] | 367 | L.SetCommentRetentionState(true); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 368 | |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 369 | // Lex all the tokens in raw mode, to avoid entering #includes or expanding |
| 370 | // macros. |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 371 | Token Tok; |
Chris Lattner | 50c9050 | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 372 | L.LexFromRawLexer(Tok); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 373 | |
Chris Lattner | 03b8fcc | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 374 | while (Tok.isNot(tok::eof)) { |
| 375 | // Since we are lexing unexpanded tokens, all tokens are from the main |
| 376 | // FileID. |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 377 | unsigned TokOffs = SM.getFileOffset(Tok.getLocation()); |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 378 | unsigned TokLen = Tok.getLength(); |
| 379 | switch (Tok.getKind()) { |
Chris Lattner | 0bb0e7e | 2008-04-16 20:51:51 +0000 | [diff] [blame] | 380 | default: break; |
Abramo Bagnara | ea4f7c7 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 381 | case tok::identifier: |
| 382 | llvm_unreachable("tok::identifier in raw lexing mode!"); |
Abramo Bagnara | ea4f7c7 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 383 | case tok::raw_identifier: { |
| 384 | // Fill in Result.IdentifierInfo and update the token kind, |
| 385 | // looking up the identifier in the identifier table. |
| 386 | PP.LookUpIdentifierInfo(Tok); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 387 | |
Chris Lattner | 0bb0e7e | 2008-04-16 20:51:51 +0000 | [diff] [blame] | 388 | // If this is a pp-identifier, for a keyword, highlight it as such. |
Abramo Bagnara | ea4f7c7 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 389 | if (Tok.isNot(tok::identifier)) |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 390 | HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart, |
| 391 | "<span class='keyword'>", "</span>"); |
Chris Lattner | 5e69a2d | 2008-04-16 06:35:07 +0000 | [diff] [blame] | 392 | break; |
Chris Lattner | 0bb0e7e | 2008-04-16 20:51:51 +0000 | [diff] [blame] | 393 | } |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 394 | case tok::comment: |
Chris Lattner | 8e3006a | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 395 | HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart, |
| 396 | "<span class='comment'>", "</span>"); |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 397 | break; |
Douglas Gregor | fb65e59 | 2011-07-27 05:40:30 +0000 | [diff] [blame] | 398 | case tok::utf8_string_literal: |
| 399 | // Chop off the u part of u8 prefix |
| 400 | ++TokOffs; |
| 401 | --TokLen; |
| 402 | // FALL THROUGH to chop the 8 |
Ted Kremenek | afe2a9f | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 403 | case tok::wide_string_literal: |
Douglas Gregor | fb65e59 | 2011-07-27 05:40:30 +0000 | [diff] [blame] | 404 | case tok::utf16_string_literal: |
| 405 | case tok::utf32_string_literal: |
| 406 | // Chop off the L, u, U or 8 prefix |
Ted Kremenek | afe2a9f | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 407 | ++TokOffs; |
| 408 | --TokLen; |
| 409 | // FALL THROUGH. |
| 410 | case tok::string_literal: |
Richard Smith | d67aea2 | 2012-03-06 03:21:47 +0000 | [diff] [blame] | 411 | // FIXME: Exclude the optional ud-suffix from the highlighted range. |
Ted Kremenek | afe2a9f | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 412 | HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart, |
| 413 | "<span class='string_literal'>", "</span>"); |
| 414 | break; |
Chris Lattner | 775fdd3 | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 415 | case tok::hash: { |
Chris Lattner | 03b8fcc | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 416 | // If this is a preprocessor directive, all tokens to end of line are too. |
Chris Lattner | 775fdd3 | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 417 | if (!Tok.isAtStartOfLine()) |
| 418 | break; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 419 | |
Chris Lattner | 775fdd3 | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 420 | // Eat all of the tokens until we get to the next one at the start of |
| 421 | // line. |
| 422 | unsigned TokEnd = TokOffs+TokLen; |
Chris Lattner | 50c9050 | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 423 | L.LexFromRawLexer(Tok); |
Chris Lattner | 775fdd3 | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 424 | while (!Tok.isAtStartOfLine() && Tok.isNot(tok::eof)) { |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 425 | TokEnd = SM.getFileOffset(Tok.getLocation())+Tok.getLength(); |
Chris Lattner | 50c9050 | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 426 | L.LexFromRawLexer(Tok); |
Chris Lattner | 03b8fcc | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 427 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 428 | |
Chris Lattner | 775fdd3 | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 429 | // Find end of line. This is a hack. |
| 430 | HighlightRange(RB, TokOffs, TokEnd, BufferStart, |
| 431 | "<span class='directive'>", "</span>"); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 432 | |
Chris Lattner | 775fdd3 | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 433 | // Don't skip the next token. |
| 434 | continue; |
| 435 | } |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 436 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 437 | |
Chris Lattner | 50c9050 | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 438 | L.LexFromRawLexer(Tok); |
Chris Lattner | 03b8fcc | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 439 | } |
Chris Lattner | 060d8aa | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 440 | } |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 441 | |
| 442 | /// HighlightMacros - This uses the macro table state from the end of the |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 443 | /// file, to re-expand macros and insert (into the HTML) information about the |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 444 | /// macro expansions. This won't be perfectly perfect, but it will be |
| 445 | /// reasonably close. |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 446 | void html::HighlightMacros(Rewriter &R, FileID FID, const Preprocessor& PP) { |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 447 | // Re-lex the raw token stream into a token buffer. |
| 448 | const SourceManager &SM = PP.getSourceManager(); |
| 449 | std::vector<Token> TokenStream; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 450 | |
Chris Lattner | 710bb87 | 2009-11-30 04:18:44 +0000 | [diff] [blame] | 451 | const llvm::MemoryBuffer *FromFile = SM.getBuffer(FID); |
David Blaikie | bbafb8a | 2012-03-11 07:00:24 +0000 | [diff] [blame] | 452 | Lexer L(FID, FromFile, SM, PP.getLangOpts()); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 453 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 454 | // Lex all the tokens in raw mode, to avoid entering #includes or expanding |
| 455 | // macros. |
| 456 | while (1) { |
| 457 | Token Tok; |
| 458 | L.LexFromRawLexer(Tok); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 459 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 460 | // If this is a # at the start of a line, discard it from the token stream. |
| 461 | // We don't want the re-preprocess step to see #defines, #includes or other |
| 462 | // preprocessor directives. |
| 463 | if (Tok.is(tok::hash) && Tok.isAtStartOfLine()) |
| 464 | continue; |
Chris Lattner | 59da739 | 2009-02-24 05:29:33 +0000 | [diff] [blame] | 465 | |
| 466 | // If this is a ## token, change its kind to unknown so that repreprocessing |
| 467 | // it will not produce an error. |
| 468 | if (Tok.is(tok::hashhash)) |
| 469 | Tok.setKind(tok::unknown); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 470 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 471 | // If this raw token is an identifier, the raw lexer won't have looked up |
| 472 | // the corresponding identifier info for it. Do this now so that it will be |
| 473 | // macro expanded when we re-preprocess it. |
Abramo Bagnara | ea4f7c7 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 474 | if (Tok.is(tok::raw_identifier)) |
| 475 | PP.LookUpIdentifierInfo(Tok); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 476 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 477 | TokenStream.push_back(Tok); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 478 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 479 | if (Tok.is(tok::eof)) break; |
| 480 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 481 | |
Chris Lattner | e07ea35 | 2009-03-13 21:44:46 +0000 | [diff] [blame] | 482 | // Temporarily change the diagnostics object so that we ignore any generated |
| 483 | // diagnostics from this pass. |
David Blaikie | 9c902b5 | 2011-09-25 23:23:43 +0000 | [diff] [blame] | 484 | DiagnosticsEngine TmpDiags(PP.getDiagnostics().getDiagnosticIDs(), |
Douglas Gregor | 811db4e | 2012-10-23 22:26:28 +0000 | [diff] [blame] | 485 | &PP.getDiagnostics().getDiagnosticOptions(), |
David Blaikie | 2cb2a83 | 2011-09-25 23:44:35 +0000 | [diff] [blame] | 486 | new IgnoringDiagConsumer); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 487 | |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 488 | // FIXME: This is a huge hack; we reuse the input preprocessor because we want |
| 489 | // its state, but we aren't actually changing it (we hope). This should really |
| 490 | // construct a copy of the preprocessor. |
| 491 | Preprocessor &TmpPP = const_cast<Preprocessor&>(PP); |
David Blaikie | 9c902b5 | 2011-09-25 23:23:43 +0000 | [diff] [blame] | 492 | DiagnosticsEngine *OldDiags = &TmpPP.getDiagnostics(); |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 493 | TmpPP.setDiagnostics(TmpDiags); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 494 | |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 495 | // Inform the preprocessor that we don't want comments. |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 496 | TmpPP.SetCommentRetentionState(false, false); |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 497 | |
Jordan Rose | de1a292 | 2012-06-08 18:06:21 +0000 | [diff] [blame] | 498 | // We don't want pragmas either. Although we filtered out #pragma, removing |
| 499 | // _Pragma and __pragma is much harder. |
| 500 | bool PragmasPreviouslyEnabled = TmpPP.getPragmasEnabled(); |
| 501 | TmpPP.setPragmasEnabled(false); |
| 502 | |
Chris Lattner | 9ef847b | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 503 | // Enter the tokens we just lexed. This will cause them to be macro expanded |
| 504 | // but won't enter sub-files (because we removed #'s). |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 505 | TmpPP.EnterTokenStream(&TokenStream[0], TokenStream.size(), false, false); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 506 | |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 507 | TokenConcatenation ConcatInfo(TmpPP); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 508 | |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 509 | // Lex all the tokens. |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 510 | Token Tok; |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 511 | TmpPP.Lex(Tok); |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 512 | while (Tok.isNot(tok::eof)) { |
| 513 | // Ignore non-macro tokens. |
| 514 | if (!Tok.getLocation().isMacroID()) { |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 515 | TmpPP.Lex(Tok); |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 516 | continue; |
| 517 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 518 | |
Chris Lattner | 20cf430 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 519 | // Okay, we have the first token of a macro expansion: highlight the |
Chandler Carruth | 5d4aff0 | 2011-07-15 00:04:40 +0000 | [diff] [blame] | 520 | // expansion by inserting a start tag before the macro expansion and |
Chris Lattner | 20cf430 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 521 | // end tag after it. |
| 522 | std::pair<SourceLocation, SourceLocation> LLoc = |
Chandler Carruth | 6d28d7f | 2011-07-25 16:56:02 +0000 | [diff] [blame] | 523 | SM.getExpansionRange(Tok.getLocation()); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 524 | |
Chris Lattner | 20cf430 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 525 | // Ignore tokens whose instantiation location was not the main file. |
| 526 | if (SM.getFileID(LLoc.first) != FID) { |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 527 | TmpPP.Lex(Tok); |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 528 | continue; |
| 529 | } |
Chris Lattner | 20cf430 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 530 | |
Chris Lattner | 20cf430 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 531 | assert(SM.getFileID(LLoc.second) == FID && |
| 532 | "Start and end of expansion must be in the same ultimate file!"); |
Chris Lattner | 8cad67b | 2009-02-17 00:51:07 +0000 | [diff] [blame] | 533 | |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 534 | std::string Expansion = EscapeText(TmpPP.getSpelling(Tok)); |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 535 | unsigned LineLen = Expansion.size(); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 536 | |
Chris Lattner | 0384e635 | 2010-04-14 03:57:19 +0000 | [diff] [blame] | 537 | Token PrevPrevTok; |
Chris Lattner | 837b990 | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 538 | Token PrevTok = Tok; |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 539 | // Okay, eat this token, getting the next one. |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 540 | TmpPP.Lex(Tok); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 541 | |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 542 | // Skip all the rest of the tokens that are part of this macro |
| 543 | // instantiation. It would be really nice to pop up a window with all the |
| 544 | // spelling of the tokens or something. |
| 545 | while (!Tok.is(tok::eof) && |
Chandler Carruth | 35f5320 | 2011-07-25 16:49:02 +0000 | [diff] [blame] | 546 | SM.getExpansionLoc(Tok.getLocation()) == LLoc.first) { |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 547 | // Insert a newline if the macro expansion is getting large. |
| 548 | if (LineLen > 60) { |
| 549 | Expansion += "<br>"; |
| 550 | LineLen = 0; |
| 551 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 552 | |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 553 | LineLen -= Expansion.size(); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 554 | |
Chris Lattner | 837b990 | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 555 | // If the tokens were already space separated, or if they must be to avoid |
| 556 | // them being implicitly pasted, add a space between them. |
| 557 | if (Tok.hasLeadingSpace() || |
Chris Lattner | 0384e635 | 2010-04-14 03:57:19 +0000 | [diff] [blame] | 558 | ConcatInfo.AvoidConcat(PrevPrevTok, PrevTok, Tok)) |
Chris Lattner | 837b990 | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 559 | Expansion += ' '; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 560 | |
Chris Lattner | 54349c5 | 2008-04-17 23:03:14 +0000 | [diff] [blame] | 561 | // Escape any special characters in the token text. |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 562 | Expansion += EscapeText(TmpPP.getSpelling(Tok)); |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 563 | LineLen += Expansion.size(); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 564 | |
Chris Lattner | 0384e635 | 2010-04-14 03:57:19 +0000 | [diff] [blame] | 565 | PrevPrevTok = PrevTok; |
Chris Lattner | 837b990 | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 566 | PrevTok = Tok; |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 567 | TmpPP.Lex(Tok); |
Chris Lattner | f1c70d7 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 568 | } |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 569 | |
Chris Lattner | 8cad67b | 2009-02-17 00:51:07 +0000 | [diff] [blame] | 570 | |
| 571 | // Insert the expansion as the end tag, so that multi-line macros all get |
| 572 | // highlighted. |
| 573 | Expansion = "<span class='expansion'>" + Expansion + "</span></span>"; |
| 574 | |
| 575 | HighlightRange(R, LLoc.first, LLoc.second, |
| 576 | "<span class='macro'>", Expansion.c_str()); |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 577 | } |
Chris Lattner | e07ea35 | 2009-03-13 21:44:46 +0000 | [diff] [blame] | 578 | |
Jordan Rose | de1a292 | 2012-06-08 18:06:21 +0000 | [diff] [blame] | 579 | // Restore the preprocessor's old state. |
Daniel Dunbar | a2ff3b4 | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 580 | TmpPP.setDiagnostics(*OldDiags); |
Jordan Rose | de1a292 | 2012-06-08 18:06:21 +0000 | [diff] [blame] | 581 | TmpPP.setPragmasEnabled(PragmasPreviouslyEnabled); |
Chris Lattner | a5a75e7 | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 582 | } |