Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 1 | //== HTMLRewrite.cpp - Translate source code into prettified HTML --*- C++ -*-// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file defines the HTMLRewriter class, which is used to translate the |
| 11 | // text of a source file into prettified HTML. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
Ted Kremenek | 339b9c2 | 2008-04-17 22:31:54 +0000 | [diff] [blame] | 15 | #include "clang/Lex/Preprocessor.h" |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 16 | #include "clang/Rewrite/Rewriter.h" |
| 17 | #include "clang/Rewrite/HTMLRewrite.h" |
Chris Lattner | 867924d | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 18 | #include "clang/Lex/TokenConcatenation.h" |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 19 | #include "clang/Lex/Preprocessor.h" |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 20 | #include "clang/Basic/SourceManager.h" |
Chris Lattner | 57df3b9 | 2008-04-16 04:11:35 +0000 | [diff] [blame] | 21 | #include "llvm/ADT/SmallString.h" |
Ted Kremenek | 339b9c2 | 2008-04-17 22:31:54 +0000 | [diff] [blame] | 22 | #include "llvm/ADT/OwningPtr.h" |
Abramo Bagnara | c4bf2b9 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 23 | #include "llvm/Support/ErrorHandling.h" |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 24 | #include "llvm/Support/MemoryBuffer.h" |
Ted Kremenek | a95d375 | 2008-09-13 05:16:45 +0000 | [diff] [blame] | 25 | #include "llvm/Support/raw_ostream.h" |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 26 | using namespace clang; |
| 27 | |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 28 | |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 29 | /// HighlightRange - Highlight a range in the source code with the specified |
| 30 | /// start/end tags. B/E must be in the same file. This ensures that |
| 31 | /// start/end tags are placed at the start/end of each line if the range is |
| 32 | /// multiline. |
| 33 | void html::HighlightRange(Rewriter &R, SourceLocation B, SourceLocation E, |
| 34 | const char *StartTag, const char *EndTag) { |
| 35 | SourceManager &SM = R.getSourceMgr(); |
Chandler Carruth | 4027853 | 2011-07-25 16:49:02 +0000 | [diff] [blame] | 36 | B = SM.getExpansionLoc(B); |
| 37 | E = SM.getExpansionLoc(E); |
Chris Lattner | a11d617 | 2009-01-19 07:46:45 +0000 | [diff] [blame] | 38 | FileID FID = SM.getFileID(B); |
| 39 | assert(SM.getFileID(E) == FID && "B/E not in the same file!"); |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 40 | |
Chris Lattner | 52c2908 | 2009-01-27 06:27:13 +0000 | [diff] [blame] | 41 | unsigned BOffset = SM.getFileOffset(B); |
| 42 | unsigned EOffset = SM.getFileOffset(E); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 43 | |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 44 | // Include the whole end token in the range. |
Chris Lattner | 2c78b87 | 2009-04-14 23:22:57 +0000 | [diff] [blame] | 45 | EOffset += Lexer::MeasureTokenLength(E, R.getSourceMgr(), R.getLangOpts()); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 46 | |
Douglas Gregor | f715ca1 | 2010-03-16 00:06:06 +0000 | [diff] [blame] | 47 | bool Invalid = false; |
Benjamin Kramer | f6ac97b | 2010-03-16 14:14:31 +0000 | [diff] [blame] | 48 | const char *BufferStart = SM.getBufferData(FID, &Invalid).data(); |
Douglas Gregor | f715ca1 | 2010-03-16 00:06:06 +0000 | [diff] [blame] | 49 | if (Invalid) |
Douglas Gregor | aea67db | 2010-03-15 22:54:52 +0000 | [diff] [blame] | 50 | return; |
Douglas Gregor | aea67db | 2010-03-15 22:54:52 +0000 | [diff] [blame] | 51 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 52 | HighlightRange(R.getEditBuffer(FID), BOffset, EOffset, |
Douglas Gregor | aea67db | 2010-03-15 22:54:52 +0000 | [diff] [blame] | 53 | BufferStart, StartTag, EndTag); |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 54 | } |
| 55 | |
| 56 | /// HighlightRange - This is the same as the above method, but takes |
| 57 | /// decomposed file locations. |
| 58 | void html::HighlightRange(RewriteBuffer &RB, unsigned B, unsigned E, |
| 59 | const char *BufferStart, |
| 60 | const char *StartTag, const char *EndTag) { |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 61 | // Insert the tag at the absolute start/end of the range. |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 62 | RB.InsertTextAfter(B, StartTag); |
| 63 | RB.InsertTextBefore(E, EndTag); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 64 | |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 65 | // Scan the range to see if there is a \r or \n. If so, and if the line is |
| 66 | // not blank, insert tags on that line as well. |
| 67 | bool HadOpenTag = true; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 68 | |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 69 | unsigned LastNonWhiteSpace = B; |
| 70 | for (unsigned i = B; i != E; ++i) { |
| 71 | switch (BufferStart[i]) { |
| 72 | case '\r': |
| 73 | case '\n': |
| 74 | // Okay, we found a newline in the range. If we have an open tag, we need |
| 75 | // to insert a close tag at the first non-whitespace before the newline. |
| 76 | if (HadOpenTag) |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 77 | RB.InsertTextBefore(LastNonWhiteSpace+1, EndTag); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 78 | |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 79 | // Instead of inserting an open tag immediately after the newline, we |
| 80 | // wait until we see a non-whitespace character. This prevents us from |
| 81 | // inserting tags around blank lines, and also allows the open tag to |
| 82 | // be put *after* whitespace on a non-blank line. |
| 83 | HadOpenTag = false; |
| 84 | break; |
| 85 | case '\0': |
| 86 | case ' ': |
| 87 | case '\t': |
| 88 | case '\f': |
| 89 | case '\v': |
| 90 | // Ignore whitespace. |
| 91 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 92 | |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 93 | default: |
| 94 | // If there is no tag open, do it now. |
| 95 | if (!HadOpenTag) { |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 96 | RB.InsertTextAfter(i, StartTag); |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 97 | HadOpenTag = true; |
| 98 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 99 | |
Chris Lattner | 9402b57 | 2008-04-16 23:06:45 +0000 | [diff] [blame] | 100 | // Remember this character. |
| 101 | LastNonWhiteSpace = i; |
| 102 | break; |
| 103 | } |
| 104 | } |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 105 | } |
| 106 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 107 | void html::EscapeText(Rewriter &R, FileID FID, |
Ted Kremenek | fa5be36 | 2008-04-08 22:37:58 +0000 | [diff] [blame] | 108 | bool EscapeSpaces, bool ReplaceTabs) { |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 109 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 110 | const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID); |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 111 | const char* C = Buf->getBufferStart(); |
| 112 | const char* FileEnd = Buf->getBufferEnd(); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 113 | |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 114 | assert (C <= FileEnd); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 115 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 116 | RewriteBuffer &RB = R.getEditBuffer(FID); |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 117 | |
| 118 | unsigned ColNo = 0; |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 119 | for (unsigned FilePos = 0; C != FileEnd ; ++C, ++FilePos) { |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 120 | switch (*C) { |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 121 | default: ++ColNo; break; |
| 122 | case '\n': |
| 123 | case '\r': |
| 124 | ColNo = 0; |
| 125 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 126 | |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 127 | case ' ': |
| 128 | if (EscapeSpaces) |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 129 | RB.ReplaceText(FilePos, 1, " "); |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 130 | ++ColNo; |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 131 | break; |
Chris Lattner | f3d8d19 | 2008-04-19 23:56:30 +0000 | [diff] [blame] | 132 | case '\f': |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 133 | RB.ReplaceText(FilePos, 1, "<hr>"); |
Chris Lattner | f3d8d19 | 2008-04-19 23:56:30 +0000 | [diff] [blame] | 134 | ColNo = 0; |
| 135 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 136 | |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 137 | case '\t': { |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 138 | if (!ReplaceTabs) |
Ted Kremenek | 49cd635 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 139 | break; |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 140 | unsigned NumSpaces = 8-(ColNo&7); |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 141 | if (EscapeSpaces) |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 142 | RB.ReplaceText(FilePos, 1, |
Chris Lattner | 5f9e272 | 2011-07-23 10:55:15 +0000 | [diff] [blame] | 143 | StringRef(" " |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 144 | " ", 6*NumSpaces)); |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 145 | else |
Chris Lattner | 5f9e272 | 2011-07-23 10:55:15 +0000 | [diff] [blame] | 146 | RB.ReplaceText(FilePos, 1, StringRef(" ", NumSpaces)); |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 147 | ColNo += NumSpaces; |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 148 | break; |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 149 | } |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 150 | case '<': |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 151 | RB.ReplaceText(FilePos, 1, "<"); |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 152 | ++ColNo; |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 153 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 154 | |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 155 | case '>': |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 156 | RB.ReplaceText(FilePos, 1, ">"); |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 157 | ++ColNo; |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 158 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 159 | |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 160 | case '&': |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 161 | RB.ReplaceText(FilePos, 1, "&"); |
Chris Lattner | 5c176f7 | 2008-04-18 04:54:20 +0000 | [diff] [blame] | 162 | ++ColNo; |
Chris Lattner | 7352714 | 2008-04-16 04:33:23 +0000 | [diff] [blame] | 163 | break; |
Ted Kremenek | 6a34083 | 2008-03-18 21:19:49 +0000 | [diff] [blame] | 164 | } |
| 165 | } |
| 166 | } |
| 167 | |
Ted Kremenek | fa5be36 | 2008-04-08 22:37:58 +0000 | [diff] [blame] | 168 | std::string html::EscapeText(const std::string& s, bool EscapeSpaces, |
| 169 | bool ReplaceTabs) { |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 170 | |
Ted Kremenek | 053ef59 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 171 | unsigned len = s.size(); |
Ted Kremenek | a95d375 | 2008-09-13 05:16:45 +0000 | [diff] [blame] | 172 | std::string Str; |
| 173 | llvm::raw_string_ostream os(Str); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 174 | |
Ted Kremenek | 053ef59 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 175 | for (unsigned i = 0 ; i < len; ++i) { |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 176 | |
Ted Kremenek | 053ef59 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 177 | char c = s[i]; |
Ted Kremenek | 053ef59 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 178 | switch (c) { |
Chris Lattner | 8570f0b | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 179 | default: |
| 180 | os << c; break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 181 | |
Chris Lattner | 8570f0b | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 182 | case ' ': |
| 183 | if (EscapeSpaces) os << " "; |
| 184 | else os << ' '; |
| 185 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 186 | |
Zhongxing Xu | c01b46e | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 187 | case '\t': |
| 188 | if (ReplaceTabs) { |
| 189 | if (EscapeSpaces) |
| 190 | for (unsigned i = 0; i < 4; ++i) |
| 191 | os << " "; |
| 192 | else |
| 193 | for (unsigned i = 0; i < 4; ++i) |
| 194 | os << " "; |
| 195 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 196 | else |
Zhongxing Xu | c01b46e | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 197 | os << c; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 198 | |
Zhongxing Xu | c01b46e | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 199 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 200 | |
Zhongxing Xu | c01b46e | 2009-08-17 14:13:14 +0000 | [diff] [blame] | 201 | case '<': os << "<"; break; |
| 202 | case '>': os << ">"; break; |
| 203 | case '&': os << "&"; break; |
Ted Kremenek | 053ef59 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 204 | } |
| 205 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 206 | |
Ted Kremenek | 053ef59 | 2008-03-27 17:15:29 +0000 | [diff] [blame] | 207 | return os.str(); |
| 208 | } |
| 209 | |
Chris Lattner | 8570f0b | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 210 | static void AddLineNumber(RewriteBuffer &RB, unsigned LineNo, |
| 211 | unsigned B, unsigned E) { |
Dylan Noblesmith | f7ccbad | 2012-02-05 02:13:05 +0000 | [diff] [blame] | 212 | SmallString<256> Str; |
Daniel Dunbar | 7e37c81 | 2009-08-19 18:30:37 +0000 | [diff] [blame] | 213 | llvm::raw_svector_ostream OS(Str); |
| 214 | |
| 215 | OS << "<tr><td class=\"num\" id=\"LN" |
| 216 | << LineNo << "\">" |
| 217 | << LineNo << "</td><td class=\"line\">"; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 218 | |
Ted Kremenek | 49cd635 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 219 | if (B == E) { // Handle empty lines. |
Daniel Dunbar | 7e37c81 | 2009-08-19 18:30:37 +0000 | [diff] [blame] | 220 | OS << " </td></tr>"; |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 221 | RB.InsertTextBefore(B, OS.str()); |
Chris Lattner | 57df3b9 | 2008-04-16 04:11:35 +0000 | [diff] [blame] | 222 | } else { |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 223 | RB.InsertTextBefore(B, OS.str()); |
| 224 | RB.InsertTextBefore(E, "</td></tr>"); |
Ted Kremenek | 49cd635 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 225 | } |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 226 | } |
| 227 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 228 | void html::AddLineNumbers(Rewriter& R, FileID FID) { |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 229 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 230 | const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID); |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 231 | const char* FileBeg = Buf->getBufferStart(); |
| 232 | const char* FileEnd = Buf->getBufferEnd(); |
| 233 | const char* C = FileBeg; |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 234 | RewriteBuffer &RB = R.getEditBuffer(FID); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 235 | |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 236 | assert (C <= FileEnd); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 237 | |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 238 | unsigned LineNo = 0; |
| 239 | unsigned FilePos = 0; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 240 | |
| 241 | while (C != FileEnd) { |
| 242 | |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 243 | ++LineNo; |
| 244 | unsigned LineStartPos = FilePos; |
| 245 | unsigned LineEndPos = FileEnd - FileBeg; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 246 | |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 247 | assert (FilePos <= LineEndPos); |
| 248 | assert (C < FileEnd); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 249 | |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 250 | // Scan until the newline (or end-of-file). |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 251 | |
Ted Kremenek | 49cd635 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 252 | while (C != FileEnd) { |
| 253 | char c = *C; |
| 254 | ++C; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 255 | |
Ted Kremenek | 49cd635 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 256 | if (c == '\n') { |
| 257 | LineEndPos = FilePos++; |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 258 | break; |
| 259 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 260 | |
Ted Kremenek | 49cd635 | 2008-04-03 07:12:29 +0000 | [diff] [blame] | 261 | ++FilePos; |
| 262 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 263 | |
Chris Lattner | 8570f0b | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 264 | AddLineNumber(RB, LineNo, LineStartPos, LineEndPos); |
Ted Kremenek | d6c1360 | 2008-03-19 05:07:26 +0000 | [diff] [blame] | 265 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 266 | |
Chris Lattner | 8570f0b | 2008-04-16 04:37:29 +0000 | [diff] [blame] | 267 | // Add one big table tag that surrounds all of the code. |
Daniel Dunbar | d7407dc | 2009-08-19 19:10:30 +0000 | [diff] [blame] | 268 | RB.InsertTextBefore(0, "<table class=\"code\">\n"); |
| 269 | RB.InsertTextAfter(FileEnd - FileBeg, "</table>"); |
Ted Kremenek | b485cd1 | 2008-03-18 23:08:51 +0000 | [diff] [blame] | 270 | } |
Ted Kremenek | ad0a203 | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 271 | |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 272 | void html::AddHeaderFooterInternalBuiltinCSS(Rewriter& R, FileID FID, |
Ted Kremenek | f6f593f | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 273 | const char *title) { |
Ted Kremenek | ad0a203 | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 274 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 275 | const llvm::MemoryBuffer *Buf = R.getSourceMgr().getBuffer(FID); |
Ted Kremenek | ad0a203 | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 276 | const char* FileStart = Buf->getBufferStart(); |
| 277 | const char* FileEnd = Buf->getBufferEnd(); |
| 278 | |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 279 | SourceLocation StartLoc = R.getSourceMgr().getLocForStartOfFile(FID); |
Argyrios Kyrtzidis | a64ccef | 2011-09-19 20:40:19 +0000 | [diff] [blame] | 280 | SourceLocation EndLoc = StartLoc.getLocWithOffset(FileEnd-FileStart); |
Ted Kremenek | ad0a203 | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 281 | |
Ted Kremenek | a95d375 | 2008-09-13 05:16:45 +0000 | [diff] [blame] | 282 | std::string s; |
| 283 | llvm::raw_string_ostream os(s); |
Ted Kremenek | f6f593f | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 284 | os << "<!doctype html>\n" // Use HTML 5 doctype |
| 285 | "<html>\n<head>\n"; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 286 | |
Ted Kremenek | f6f593f | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 287 | if (title) |
| 288 | os << "<title>" << html::EscapeText(title) << "</title>\n"; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 289 | |
Ted Kremenek | f6f593f | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 290 | os << "<style type=\"text/css\">\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 291 | " body { color:#000000; background-color:#ffffff }\n" |
| 292 | " body { font-family:Helvetica, sans-serif; font-size:10pt }\n" |
Ted Kremenek | 4b0f813 | 2008-04-15 21:25:08 +0000 | [diff] [blame] | 293 | " h1 { font-size:14pt }\n" |
Ted Kremenek | f501626 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 294 | " .code { border-collapse:collapse; width:100%; }\n" |
Ted Kremenek | 3eaaa99 | 2012-01-20 20:39:55 +0000 | [diff] [blame] | 295 | " .code { font-family: \"Monospace\", monospace; font-size:10pt }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 296 | " .code { line-height: 1.2em }\n" |
Ted Kremenek | f501626 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 297 | " .comment { color: green; font-style: oblique }\n" |
| 298 | " .keyword { color: blue }\n" |
Ted Kremenek | cc1b853 | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 299 | " .string_literal { color: red }\n" |
Ted Kremenek | f501626 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 300 | " .directive { color: darkmagenta }\n" |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 301 | // Macro expansions. |
Ted Kremenek | 07339a6 | 2008-04-17 19:57:27 +0000 | [diff] [blame] | 302 | " .expansion { display: none; }\n" |
| 303 | " .macro:hover .expansion { display: block; border: 2px solid #FF0000; " |
Chris Lattner | dc5be47 | 2008-04-17 21:32:46 +0000 | [diff] [blame] | 304 | "padding: 2px; background-color:#FFF0F0; font-weight: normal; " |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 305 | " -webkit-border-radius:5px; -webkit-box-shadow:1px 1px 7px #000; " |
Chris Lattner | 8aa06ac | 2008-04-17 21:28:41 +0000 | [diff] [blame] | 306 | "position: absolute; top: -1em; left:10em; z-index: 1 } \n" |
Ted Kremenek | f501626 | 2008-04-18 02:12:39 +0000 | [diff] [blame] | 307 | " .macro { color: darkmagenta; background-color:LemonChiffon;" |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 308 | // Macros are position: relative to provide base for expansions. |
| 309 | " position: relative }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 310 | " .num { width:2.5em; padding-right:2ex; background-color:#eeeeee }\n" |
Ted Kremenek | 2223622 | 2009-03-10 05:14:32 +0000 | [diff] [blame] | 311 | " .num { text-align:right; font-size:8pt }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 312 | " .num { color:#444444 }\n" |
| 313 | " .line { padding-left: 1ex; border-left: 3px solid #ccc }\n" |
| 314 | " .line { white-space: pre }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 315 | " .msg { -webkit-box-shadow:1px 1px 7px #000 }\n" |
| 316 | " .msg { -webkit-border-radius:5px }\n" |
Ted Kremenek | 2223622 | 2009-03-10 05:14:32 +0000 | [diff] [blame] | 317 | " .msg { font-family:Helvetica, sans-serif; font-size:8pt }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 318 | " .msg { float:left }\n" |
Ted Kremenek | 3c59823 | 2009-03-03 03:00:21 +0000 | [diff] [blame] | 319 | " .msg { padding:0.25em 1ex 0.25em 1ex }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 320 | " .msg { margin-top:10px; margin-bottom:10px }\n" |
Ted Kremenek | 2f10398 | 2009-03-02 21:42:01 +0000 | [diff] [blame] | 321 | " .msg { font-weight:bold }\n" |
Ted Kremenek | 80bae76 | 2009-03-02 23:05:40 +0000 | [diff] [blame] | 322 | " .msg { max-width:60em; word-wrap: break-word; white-space: pre-wrap }\n" |
| 323 | " .msgT { padding:0x; spacing:0x }\n" |
Ted Kremenek | 2f10398 | 2009-03-02 21:42:01 +0000 | [diff] [blame] | 324 | " .msgEvent { background-color:#fff8b4; color:#000000 }\n" |
Ted Kremenek | 80bae76 | 2009-03-02 23:05:40 +0000 | [diff] [blame] | 325 | " .msgControl { background-color:#bbbbbb; color:#000000 }\n" |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 326 | " .mrange { background-color:#dfddf3 }\n" |
| 327 | " .mrange { border-bottom:1px solid #6F9DBE }\n" |
Ted Kremenek | 3c59823 | 2009-03-03 03:00:21 +0000 | [diff] [blame] | 328 | " .PathIndex { font-weight: bold; padding:0px 5px 0px 5px; " |
| 329 | "margin-right:5px; }\n" |
Ted Kremenek | 00f01e4 | 2009-03-02 23:39:27 +0000 | [diff] [blame] | 330 | " .PathIndex { -webkit-border-radius:8px }\n" |
| 331 | " .PathIndexEvent { background-color:#bfba87 }\n" |
| 332 | " .PathIndexControl { background-color:#8c8c8c }\n" |
Douglas Gregor | 4b2d3f7 | 2009-02-26 21:00:50 +0000 | [diff] [blame] | 333 | " .CodeInsertionHint { font-weight: bold; background-color: #10dd10 }\n" |
| 334 | " .CodeRemovalHint { background-color:#de1010 }\n" |
| 335 | " .CodeRemovalHint { border-bottom:1px solid #6F9DBE }\n" |
Ted Kremenek | 4b0f813 | 2008-04-15 21:25:08 +0000 | [diff] [blame] | 336 | " table.simpletable {\n" |
| 337 | " padding: 5px;\n" |
| 338 | " font-size:12pt;\n" |
| 339 | " margin:20px;\n" |
| 340 | " border-collapse: collapse; border-spacing: 0px;\n" |
| 341 | " }\n" |
| 342 | " td.rowname {\n" |
| 343 | " text-align:right; font-weight:bold; color:#444444;\n" |
| 344 | " padding-right:2ex; }\n" |
Ted Kremenek | f6f593f | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 345 | "</style>\n</head>\n<body>"; |
Ted Kremenek | 70bcba6 | 2008-04-09 15:40:40 +0000 | [diff] [blame] | 346 | |
Ted Kremenek | f6f593f | 2008-07-07 18:31:05 +0000 | [diff] [blame] | 347 | // Generate header |
Daniel Dunbar | 44ba7bf | 2009-08-19 20:32:38 +0000 | [diff] [blame] | 348 | R.InsertTextBefore(StartLoc, os.str()); |
Ted Kremenek | ad0a203 | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 349 | // Generate footer |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 350 | |
Daniel Dunbar | 44ba7bf | 2009-08-19 20:32:38 +0000 | [diff] [blame] | 351 | R.InsertTextAfter(EndLoc, "</body></html>\n"); |
Ted Kremenek | ad0a203 | 2008-03-19 06:14:37 +0000 | [diff] [blame] | 352 | } |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 353 | |
| 354 | /// SyntaxHighlight - Relex the specified FileID and annotate the HTML with |
| 355 | /// information about keywords, macro expansions etc. This uses the macro |
| 356 | /// table state from the end of the file, so it won't be perfectly perfect, |
| 357 | /// but it will be reasonably close. |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 358 | void html::SyntaxHighlight(Rewriter &R, FileID FID, const Preprocessor &PP) { |
Chris Lattner | 2b2453a | 2009-01-17 06:22:33 +0000 | [diff] [blame] | 359 | RewriteBuffer &RB = R.getEditBuffer(FID); |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 360 | |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 361 | const SourceManager &SM = PP.getSourceManager(); |
Chris Lattner | 6e29014 | 2009-11-30 04:18:44 +0000 | [diff] [blame] | 362 | const llvm::MemoryBuffer *FromFile = SM.getBuffer(FID); |
David Blaikie | 4e4d084 | 2012-03-11 07:00:24 +0000 | [diff] [blame] | 363 | Lexer L(FID, FromFile, SM, PP.getLangOpts()); |
Chris Lattner | 025c3a6 | 2009-01-17 07:35:14 +0000 | [diff] [blame] | 364 | const char *BufferStart = L.getBufferStart(); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 365 | |
| 366 | // Inform the preprocessor that we want to retain comments as tokens, so we |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 367 | // can highlight them. |
Chris Lattner | 678c635 | 2008-04-16 20:54:51 +0000 | [diff] [blame] | 368 | L.SetCommentRetentionState(true); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 369 | |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 370 | // Lex all the tokens in raw mode, to avoid entering #includes or expanding |
| 371 | // macros. |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 372 | Token Tok; |
Chris Lattner | 590f0cc | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 373 | L.LexFromRawLexer(Tok); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 374 | |
Chris Lattner | 74ea3e5 | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 375 | while (Tok.isNot(tok::eof)) { |
| 376 | // Since we are lexing unexpanded tokens, all tokens are from the main |
| 377 | // FileID. |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 378 | unsigned TokOffs = SM.getFileOffset(Tok.getLocation()); |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 379 | unsigned TokLen = Tok.getLength(); |
| 380 | switch (Tok.getKind()) { |
Chris Lattner | a745e8c | 2008-04-16 20:51:51 +0000 | [diff] [blame] | 381 | default: break; |
Abramo Bagnara | c4bf2b9 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 382 | case tok::identifier: |
| 383 | llvm_unreachable("tok::identifier in raw lexing mode!"); |
Abramo Bagnara | c4bf2b9 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 384 | case tok::raw_identifier: { |
| 385 | // Fill in Result.IdentifierInfo and update the token kind, |
| 386 | // looking up the identifier in the identifier table. |
| 387 | PP.LookUpIdentifierInfo(Tok); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 388 | |
Chris Lattner | a745e8c | 2008-04-16 20:51:51 +0000 | [diff] [blame] | 389 | // If this is a pp-identifier, for a keyword, highlight it as such. |
Abramo Bagnara | c4bf2b9 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 390 | if (Tok.isNot(tok::identifier)) |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 391 | HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart, |
| 392 | "<span class='keyword'>", "</span>"); |
Chris Lattner | c4586c2 | 2008-04-16 06:35:07 +0000 | [diff] [blame] | 393 | break; |
Chris Lattner | a745e8c | 2008-04-16 20:51:51 +0000 | [diff] [blame] | 394 | } |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 395 | case tok::comment: |
Chris Lattner | 5ef3e2c | 2008-04-16 22:45:51 +0000 | [diff] [blame] | 396 | HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart, |
| 397 | "<span class='comment'>", "</span>"); |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 398 | break; |
Douglas Gregor | 5cee119 | 2011-07-27 05:40:30 +0000 | [diff] [blame] | 399 | case tok::utf8_string_literal: |
| 400 | // Chop off the u part of u8 prefix |
| 401 | ++TokOffs; |
| 402 | --TokLen; |
| 403 | // FALL THROUGH to chop the 8 |
Ted Kremenek | cc1b853 | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 404 | case tok::wide_string_literal: |
Douglas Gregor | 5cee119 | 2011-07-27 05:40:30 +0000 | [diff] [blame] | 405 | case tok::utf16_string_literal: |
| 406 | case tok::utf32_string_literal: |
| 407 | // Chop off the L, u, U or 8 prefix |
Ted Kremenek | cc1b853 | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 408 | ++TokOffs; |
| 409 | --TokLen; |
| 410 | // FALL THROUGH. |
| 411 | case tok::string_literal: |
Richard Smith | 99831e4 | 2012-03-06 03:21:47 +0000 | [diff] [blame] | 412 | // FIXME: Exclude the optional ud-suffix from the highlighted range. |
Ted Kremenek | cc1b853 | 2008-08-31 16:37:56 +0000 | [diff] [blame] | 413 | HighlightRange(RB, TokOffs, TokOffs+TokLen, BufferStart, |
| 414 | "<span class='string_literal'>", "</span>"); |
| 415 | break; |
Chris Lattner | 5deb96d | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 416 | case tok::hash: { |
Chris Lattner | 74ea3e5 | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 417 | // If this is a preprocessor directive, all tokens to end of line are too. |
Chris Lattner | 5deb96d | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 418 | if (!Tok.isAtStartOfLine()) |
| 419 | break; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 420 | |
Chris Lattner | 5deb96d | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 421 | // Eat all of the tokens until we get to the next one at the start of |
| 422 | // line. |
| 423 | unsigned TokEnd = TokOffs+TokLen; |
Chris Lattner | 590f0cc | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 424 | L.LexFromRawLexer(Tok); |
Chris Lattner | 5deb96d | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 425 | while (!Tok.isAtStartOfLine() && Tok.isNot(tok::eof)) { |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 426 | TokEnd = SM.getFileOffset(Tok.getLocation())+Tok.getLength(); |
Chris Lattner | 590f0cc | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 427 | L.LexFromRawLexer(Tok); |
Chris Lattner | 74ea3e5 | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 428 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 429 | |
Chris Lattner | 5deb96d | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 430 | // Find end of line. This is a hack. |
| 431 | HighlightRange(RB, TokOffs, TokEnd, BufferStart, |
| 432 | "<span class='directive'>", "</span>"); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 433 | |
Chris Lattner | 5deb96d | 2008-04-16 23:21:17 +0000 | [diff] [blame] | 434 | // Don't skip the next token. |
| 435 | continue; |
| 436 | } |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 437 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 438 | |
Chris Lattner | 590f0cc | 2008-10-12 01:15:46 +0000 | [diff] [blame] | 439 | L.LexFromRawLexer(Tok); |
Chris Lattner | 74ea3e5 | 2008-04-16 06:53:09 +0000 | [diff] [blame] | 440 | } |
Chris Lattner | 3245a0a | 2008-04-16 06:11:58 +0000 | [diff] [blame] | 441 | } |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 442 | |
| 443 | /// HighlightMacros - This uses the macro table state from the end of the |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 444 | /// file, to re-expand macros and insert (into the HTML) information about the |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 445 | /// macro expansions. This won't be perfectly perfect, but it will be |
| 446 | /// reasonably close. |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 447 | void html::HighlightMacros(Rewriter &R, FileID FID, const Preprocessor& PP) { |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 448 | // Re-lex the raw token stream into a token buffer. |
| 449 | const SourceManager &SM = PP.getSourceManager(); |
| 450 | std::vector<Token> TokenStream; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 451 | |
Chris Lattner | 6e29014 | 2009-11-30 04:18:44 +0000 | [diff] [blame] | 452 | const llvm::MemoryBuffer *FromFile = SM.getBuffer(FID); |
David Blaikie | 4e4d084 | 2012-03-11 07:00:24 +0000 | [diff] [blame] | 453 | Lexer L(FID, FromFile, SM, PP.getLangOpts()); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 454 | |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 455 | // Lex all the tokens in raw mode, to avoid entering #includes or expanding |
| 456 | // macros. |
| 457 | while (1) { |
| 458 | Token Tok; |
| 459 | L.LexFromRawLexer(Tok); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 460 | |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 461 | // If this is a # at the start of a line, discard it from the token stream. |
| 462 | // We don't want the re-preprocess step to see #defines, #includes or other |
| 463 | // preprocessor directives. |
| 464 | if (Tok.is(tok::hash) && Tok.isAtStartOfLine()) |
| 465 | continue; |
Chris Lattner | f0b26b1 | 2009-02-24 05:29:33 +0000 | [diff] [blame] | 466 | |
| 467 | // If this is a ## token, change its kind to unknown so that repreprocessing |
| 468 | // it will not produce an error. |
| 469 | if (Tok.is(tok::hashhash)) |
| 470 | Tok.setKind(tok::unknown); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 471 | |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 472 | // If this raw token is an identifier, the raw lexer won't have looked up |
| 473 | // the corresponding identifier info for it. Do this now so that it will be |
| 474 | // macro expanded when we re-preprocess it. |
Abramo Bagnara | c4bf2b9 | 2010-12-22 08:23:18 +0000 | [diff] [blame] | 475 | if (Tok.is(tok::raw_identifier)) |
| 476 | PP.LookUpIdentifierInfo(Tok); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 477 | |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 478 | TokenStream.push_back(Tok); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 479 | |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 480 | if (Tok.is(tok::eof)) break; |
| 481 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 482 | |
Chris Lattner | 7c175fb | 2009-03-13 21:44:46 +0000 | [diff] [blame] | 483 | // Temporarily change the diagnostics object so that we ignore any generated |
| 484 | // diagnostics from this pass. |
David Blaikie | d6471f7 | 2011-09-25 23:23:43 +0000 | [diff] [blame] | 485 | DiagnosticsEngine TmpDiags(PP.getDiagnostics().getDiagnosticIDs(), |
David Blaikie | f40c0ac | 2011-09-25 23:44:35 +0000 | [diff] [blame] | 486 | new IgnoringDiagConsumer); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 487 | |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 488 | // FIXME: This is a huge hack; we reuse the input preprocessor because we want |
| 489 | // its state, but we aren't actually changing it (we hope). This should really |
| 490 | // construct a copy of the preprocessor. |
| 491 | Preprocessor &TmpPP = const_cast<Preprocessor&>(PP); |
David Blaikie | d6471f7 | 2011-09-25 23:23:43 +0000 | [diff] [blame] | 492 | DiagnosticsEngine *OldDiags = &TmpPP.getDiagnostics(); |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 493 | TmpPP.setDiagnostics(TmpDiags); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 494 | |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 495 | // Inform the preprocessor that we don't want comments. |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 496 | TmpPP.SetCommentRetentionState(false, false); |
Chris Lattner | 05db427 | 2009-02-13 19:33:24 +0000 | [diff] [blame] | 497 | |
| 498 | // Enter the tokens we just lexed. This will cause them to be macro expanded |
| 499 | // but won't enter sub-files (because we removed #'s). |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 500 | TmpPP.EnterTokenStream(&TokenStream[0], TokenStream.size(), false, false); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 501 | |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 502 | TokenConcatenation ConcatInfo(TmpPP); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 503 | |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 504 | // Lex all the tokens. |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 505 | Token Tok; |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 506 | TmpPP.Lex(Tok); |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 507 | while (Tok.isNot(tok::eof)) { |
| 508 | // Ignore non-macro tokens. |
| 509 | if (!Tok.getLocation().isMacroID()) { |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 510 | TmpPP.Lex(Tok); |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 511 | continue; |
| 512 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 513 | |
Chris Lattner | b7949a9 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 514 | // Okay, we have the first token of a macro expansion: highlight the |
Chandler Carruth | 7c5c676 | 2011-07-15 00:04:40 +0000 | [diff] [blame] | 515 | // expansion by inserting a start tag before the macro expansion and |
Chris Lattner | b7949a9 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 516 | // end tag after it. |
| 517 | std::pair<SourceLocation, SourceLocation> LLoc = |
Chandler Carruth | edc3dcc | 2011-07-25 16:56:02 +0000 | [diff] [blame] | 518 | SM.getExpansionRange(Tok.getLocation()); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 519 | |
Chris Lattner | b7949a9 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 520 | // Ignore tokens whose instantiation location was not the main file. |
| 521 | if (SM.getFileID(LLoc.first) != FID) { |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 522 | TmpPP.Lex(Tok); |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 523 | continue; |
| 524 | } |
Chris Lattner | b7949a9 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 525 | |
Chris Lattner | b7949a9 | 2009-02-15 21:32:34 +0000 | [diff] [blame] | 526 | assert(SM.getFileID(LLoc.second) == FID && |
| 527 | "Start and end of expansion must be in the same ultimate file!"); |
Chris Lattner | e9e6cb9 | 2009-02-17 00:51:07 +0000 | [diff] [blame] | 528 | |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 529 | std::string Expansion = EscapeText(TmpPP.getSpelling(Tok)); |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 530 | unsigned LineLen = Expansion.size(); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 531 | |
Chris Lattner | 8877321 | 2010-04-14 03:57:19 +0000 | [diff] [blame] | 532 | Token PrevPrevTok; |
Chris Lattner | 867924d | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 533 | Token PrevTok = Tok; |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 534 | // Okay, eat this token, getting the next one. |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 535 | TmpPP.Lex(Tok); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 536 | |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 537 | // Skip all the rest of the tokens that are part of this macro |
| 538 | // instantiation. It would be really nice to pop up a window with all the |
| 539 | // spelling of the tokens or something. |
| 540 | while (!Tok.is(tok::eof) && |
Chandler Carruth | 4027853 | 2011-07-25 16:49:02 +0000 | [diff] [blame] | 541 | SM.getExpansionLoc(Tok.getLocation()) == LLoc.first) { |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 542 | // Insert a newline if the macro expansion is getting large. |
| 543 | if (LineLen > 60) { |
| 544 | Expansion += "<br>"; |
| 545 | LineLen = 0; |
| 546 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 547 | |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 548 | LineLen -= Expansion.size(); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 549 | |
Chris Lattner | 867924d | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 550 | // If the tokens were already space separated, or if they must be to avoid |
| 551 | // them being implicitly pasted, add a space between them. |
| 552 | if (Tok.hasLeadingSpace() || |
Chris Lattner | 8877321 | 2010-04-14 03:57:19 +0000 | [diff] [blame] | 553 | ConcatInfo.AvoidConcat(PrevPrevTok, PrevTok, Tok)) |
Chris Lattner | 867924d | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 554 | Expansion += ' '; |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 555 | |
Chris Lattner | 9227c69 | 2008-04-17 23:03:14 +0000 | [diff] [blame] | 556 | // Escape any special characters in the token text. |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 557 | Expansion += EscapeText(TmpPP.getSpelling(Tok)); |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 558 | LineLen += Expansion.size(); |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 559 | |
Chris Lattner | 8877321 | 2010-04-14 03:57:19 +0000 | [diff] [blame] | 560 | PrevPrevTok = PrevTok; |
Chris Lattner | 867924d | 2009-02-13 00:51:30 +0000 | [diff] [blame] | 561 | PrevTok = Tok; |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 562 | TmpPP.Lex(Tok); |
Chris Lattner | 6f46be2 | 2008-04-17 00:40:45 +0000 | [diff] [blame] | 563 | } |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 564 | |
Chris Lattner | e9e6cb9 | 2009-02-17 00:51:07 +0000 | [diff] [blame] | 565 | |
| 566 | // Insert the expansion as the end tag, so that multi-line macros all get |
| 567 | // highlighted. |
| 568 | Expansion = "<span class='expansion'>" + Expansion + "</span></span>"; |
| 569 | |
| 570 | HighlightRange(R, LLoc.first, LLoc.second, |
| 571 | "<span class='macro'>", Expansion.c_str()); |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 572 | } |
Chris Lattner | 7c175fb | 2009-03-13 21:44:46 +0000 | [diff] [blame] | 573 | |
| 574 | // Restore diagnostics object back to its own thing. |
Daniel Dunbar | ff6912b | 2009-11-05 01:54:02 +0000 | [diff] [blame] | 575 | TmpPP.setDiagnostics(*OldDiags); |
Chris Lattner | c54d50a | 2008-04-16 06:32:08 +0000 | [diff] [blame] | 576 | } |