Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 1 | //===--- UnwrappedLineParser.cpp - Format C++ code ------------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | /// |
| 10 | /// \file |
| 11 | /// \brief This file contains the implementation of the UnwrappedLineParser, |
| 12 | /// which turns a stream of tokens into UnwrappedLines. |
| 13 | /// |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 14 | //===----------------------------------------------------------------------===// |
| 15 | |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 16 | #define DEBUG_TYPE "format-parser" |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 17 | |
Chandler Carruth | b1ba0ef | 2013-01-19 08:09:44 +0000 | [diff] [blame] | 18 | #include "UnwrappedLineParser.h" |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 19 | #include "clang/Basic/Diagnostic.h" |
| 20 | #include "llvm/Support/Debug.h" |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 21 | |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 22 | namespace clang { |
| 23 | namespace format { |
| 24 | |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 25 | class ScopedDeclarationState { |
| 26 | public: |
| 27 | ScopedDeclarationState(UnwrappedLine &Line, std::vector<bool> &Stack, |
| 28 | bool MustBeDeclaration) |
| 29 | : Line(Line), Stack(Stack) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 30 | Line.MustBeDeclaration = MustBeDeclaration; |
Manuel Klimek | 836b58f | 2013-01-23 11:03:04 +0000 | [diff] [blame] | 31 | Stack.push_back(MustBeDeclaration); |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 32 | } |
| 33 | ~ScopedDeclarationState() { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 34 | Stack.pop_back(); |
Manuel Klimek | a32a7fd | 2013-01-23 14:08:21 +0000 | [diff] [blame] | 35 | if (!Stack.empty()) |
| 36 | Line.MustBeDeclaration = Stack.back(); |
| 37 | else |
| 38 | Line.MustBeDeclaration = true; |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 39 | } |
| 40 | private: |
| 41 | UnwrappedLine &Line; |
| 42 | std::vector<bool> &Stack; |
| 43 | }; |
| 44 | |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 45 | class ScopedMacroState : public FormatTokenSource { |
| 46 | public: |
| 47 | ScopedMacroState(UnwrappedLine &Line, FormatTokenSource *&TokenSource, |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 48 | FormatToken &ResetToken, bool &StructuralError) |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 49 | : Line(Line), TokenSource(TokenSource), ResetToken(ResetToken), |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 50 | PreviousLineLevel(Line.Level), PreviousTokenSource(TokenSource), |
| 51 | StructuralError(StructuralError), |
| 52 | PreviousStructuralError(StructuralError) { |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 53 | TokenSource = this; |
Manuel Klimek | c37b4d6 | 2013-01-05 22:14:16 +0000 | [diff] [blame] | 54 | Line.Level = 0; |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 55 | Line.InPPDirective = true; |
| 56 | } |
| 57 | |
| 58 | ~ScopedMacroState() { |
| 59 | TokenSource = PreviousTokenSource; |
| 60 | ResetToken = Token; |
| 61 | Line.InPPDirective = false; |
Manuel Klimek | c37b4d6 | 2013-01-05 22:14:16 +0000 | [diff] [blame] | 62 | Line.Level = PreviousLineLevel; |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 63 | StructuralError = PreviousStructuralError; |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 64 | } |
| 65 | |
| 66 | virtual FormatToken getNextToken() { |
Manuel Klimek | dd5b101 | 2013-01-07 10:03:37 +0000 | [diff] [blame] | 67 | // The \c UnwrappedLineParser guards against this by never calling |
| 68 | // \c getNextToken() after it has encountered the first eof token. |
| 69 | assert(!eof()); |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 70 | Token = PreviousTokenSource->getNextToken(); |
| 71 | if (eof()) |
| 72 | return createEOF(); |
| 73 | return Token; |
| 74 | } |
| 75 | |
| 76 | private: |
Alexander Kornienko | 3d713a7 | 2013-04-08 22:16:06 +0000 | [diff] [blame] | 77 | bool eof() { return Token.HasUnescapedNewline; } |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 78 | |
| 79 | FormatToken createEOF() { |
| 80 | FormatToken FormatTok; |
| 81 | FormatTok.Tok.startToken(); |
| 82 | FormatTok.Tok.setKind(tok::eof); |
| 83 | return FormatTok; |
| 84 | } |
| 85 | |
| 86 | UnwrappedLine &Line; |
| 87 | FormatTokenSource *&TokenSource; |
| 88 | FormatToken &ResetToken; |
Manuel Klimek | c37b4d6 | 2013-01-05 22:14:16 +0000 | [diff] [blame] | 89 | unsigned PreviousLineLevel; |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 90 | FormatTokenSource *PreviousTokenSource; |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 91 | bool &StructuralError; |
| 92 | bool PreviousStructuralError; |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 93 | |
| 94 | FormatToken Token; |
| 95 | }; |
| 96 | |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 97 | class ScopedLineState { |
| 98 | public: |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 99 | ScopedLineState(UnwrappedLineParser &Parser, |
| 100 | bool SwitchToPreprocessorLines = false) |
| 101 | : Parser(Parser), SwitchToPreprocessorLines(SwitchToPreprocessorLines) { |
| 102 | if (SwitchToPreprocessorLines) |
| 103 | Parser.CurrentLines = &Parser.PreprocessorDirectives; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 104 | PreBlockLine = Parser.Line.take(); |
Daniel Jasper | cbb6c41 | 2013-01-16 09:10:19 +0000 | [diff] [blame] | 105 | Parser.Line.reset(new UnwrappedLine()); |
| 106 | Parser.Line->Level = PreBlockLine->Level; |
| 107 | Parser.Line->InPPDirective = PreBlockLine->InPPDirective; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 108 | } |
| 109 | |
| 110 | ~ScopedLineState() { |
Daniel Jasper | cbb6c41 | 2013-01-16 09:10:19 +0000 | [diff] [blame] | 111 | if (!Parser.Line->Tokens.empty()) { |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 112 | Parser.addUnwrappedLine(); |
| 113 | } |
Daniel Jasper | cbb6c41 | 2013-01-16 09:10:19 +0000 | [diff] [blame] | 114 | assert(Parser.Line->Tokens.empty()); |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 115 | Parser.Line.reset(PreBlockLine); |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 116 | Parser.MustBreakBeforeNextToken = true; |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 117 | if (SwitchToPreprocessorLines) |
| 118 | Parser.CurrentLines = &Parser.Lines; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 119 | } |
| 120 | |
| 121 | private: |
| 122 | UnwrappedLineParser &Parser; |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 123 | const bool SwitchToPreprocessorLines; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 124 | |
| 125 | UnwrappedLine *PreBlockLine; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 126 | }; |
| 127 | |
Alexander Kornienko | 3048aea | 2013-01-10 15:05:09 +0000 | [diff] [blame] | 128 | UnwrappedLineParser::UnwrappedLineParser( |
| 129 | clang::DiagnosticsEngine &Diag, const FormatStyle &Style, |
| 130 | FormatTokenSource &Tokens, UnwrappedLineConsumer &Callback) |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 131 | : Line(new UnwrappedLine), MustBreakBeforeNextToken(false), |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 132 | CurrentLines(&Lines), StructuralError(false), Diag(Diag), Style(Style), |
| 133 | Tokens(&Tokens), Callback(Callback) {} |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 134 | |
Alexander Kornienko | cff563c | 2012-12-04 17:27:50 +0000 | [diff] [blame] | 135 | bool UnwrappedLineParser::parse() { |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 136 | DEBUG(llvm::dbgs() << "----\n"); |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 137 | readToken(); |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 138 | parseFile(); |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 139 | for (std::vector<UnwrappedLine>::iterator I = Lines.begin(), E = Lines.end(); |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 140 | I != E; ++I) { |
| 141 | Callback.consumeUnwrappedLine(*I); |
| 142 | } |
Daniel Jasper | 516fb31 | 2013-03-01 18:11:39 +0000 | [diff] [blame] | 143 | |
| 144 | // Create line with eof token. |
| 145 | pushToken(FormatTok); |
| 146 | Callback.consumeUnwrappedLine(*Line); |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 147 | return StructuralError; |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 148 | } |
| 149 | |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 150 | void UnwrappedLineParser::parseFile() { |
Daniel Jasper | 627707b | 2013-03-22 16:55:40 +0000 | [diff] [blame] | 151 | ScopedDeclarationState DeclarationState( |
| 152 | *Line, DeclarationScopeStack, |
| 153 | /*MustBeDeclaration=*/ !Line->InPPDirective); |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 154 | parseLevel(/*HasOpeningBrace=*/ false); |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 155 | // Make sure to format the remaining tokens. |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 156 | flushComments(true); |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 157 | addUnwrappedLine(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 158 | } |
| 159 | |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 160 | void UnwrappedLineParser::parseLevel(bool HasOpeningBrace) { |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 161 | do { |
| 162 | switch (FormatTok.Tok.getKind()) { |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 163 | case tok::comment: |
Daniel Jasper | 05b1ac8 | 2012-12-17 11:29:41 +0000 | [diff] [blame] | 164 | nextToken(); |
| 165 | addUnwrappedLine(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 166 | break; |
| 167 | case tok::l_brace: |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 168 | // FIXME: Add parameter whether this can happen - if this happens, we must |
| 169 | // be in a non-declaration context. |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 170 | parseBlock(/*MustBeDeclaration=*/ false); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 171 | addUnwrappedLine(); |
| 172 | break; |
| 173 | case tok::r_brace: |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 174 | if (HasOpeningBrace) |
| 175 | return; |
| 176 | Diag.Report(FormatTok.Tok.getLocation(), |
| 177 | Diag.getCustomDiagID(clang::DiagnosticsEngine::Error, |
| 178 | "unexpected '}'")); |
| 179 | StructuralError = true; |
| 180 | nextToken(); |
| 181 | addUnwrappedLine(); |
Manuel Klimek | a5342db | 2013-01-06 20:07:31 +0000 | [diff] [blame] | 182 | break; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 183 | default: |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 184 | parseStructuralElement(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 185 | break; |
| 186 | } |
| 187 | } while (!eof()); |
| 188 | } |
| 189 | |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 190 | void UnwrappedLineParser::parseBlock(bool MustBeDeclaration, |
Nico Weber | d74fcdb | 2013-02-10 20:35:35 +0000 | [diff] [blame] | 191 | unsigned AddLevels) { |
Alexander Kornienko | a3a2b3a | 2012-12-06 17:49:17 +0000 | [diff] [blame] | 192 | assert(FormatTok.Tok.is(tok::l_brace) && "'{' expected"); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 193 | nextToken(); |
| 194 | |
Manuel Klimek | 2f1ac41 | 2013-01-21 16:42:44 +0000 | [diff] [blame] | 195 | addUnwrappedLine(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 196 | |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 197 | ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack, |
| 198 | MustBeDeclaration); |
Manuel Klimek | 2f1ac41 | 2013-01-21 16:42:44 +0000 | [diff] [blame] | 199 | Line->Level += AddLevels; |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 200 | parseLevel(/*HasOpeningBrace=*/ true); |
Alexander Kornienko | 1575731 | 2012-12-06 18:03:27 +0000 | [diff] [blame] | 201 | |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 202 | if (!FormatTok.Tok.is(tok::r_brace)) { |
| 203 | Line->Level -= AddLevels; |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 204 | StructuralError = true; |
| 205 | return; |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 206 | } |
Alexander Kornienko | 393b008 | 2012-12-04 15:40:36 +0000 | [diff] [blame] | 207 | |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 208 | nextToken(); // Munch the closing brace. |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 209 | Line->Level -= AddLevels; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 210 | } |
| 211 | |
| 212 | void UnwrappedLineParser::parsePPDirective() { |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 213 | assert(FormatTok.Tok.is(tok::hash) && "'#' expected"); |
Manuel Klimek | 67d080d | 2013-04-12 14:13:36 +0000 | [diff] [blame^] | 214 | ScopedMacroState MacroState(*Line, Tokens, FormatTok, StructuralError); |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 215 | nextToken(); |
| 216 | |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 217 | if (FormatTok.Tok.getIdentifierInfo() == NULL) { |
Manuel Klimek | bd04f2a | 2013-01-31 15:58:48 +0000 | [diff] [blame] | 218 | parsePPUnknown(); |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 219 | return; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 220 | } |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 221 | |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 222 | switch (FormatTok.Tok.getIdentifierInfo()->getPPKeywordID()) { |
| 223 | case tok::pp_define: |
| 224 | parsePPDefine(); |
| 225 | break; |
| 226 | default: |
| 227 | parsePPUnknown(); |
| 228 | break; |
| 229 | } |
| 230 | } |
| 231 | |
| 232 | void UnwrappedLineParser::parsePPDefine() { |
| 233 | nextToken(); |
| 234 | |
| 235 | if (FormatTok.Tok.getKind() != tok::identifier) { |
| 236 | parsePPUnknown(); |
| 237 | return; |
| 238 | } |
| 239 | nextToken(); |
Manuel Klimek | 7ccbc21 | 2013-01-23 14:37:36 +0000 | [diff] [blame] | 240 | if (FormatTok.Tok.getKind() == tok::l_paren && |
| 241 | FormatTok.WhiteSpaceLength == 0) { |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 242 | parseParens(); |
| 243 | } |
| 244 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 245 | Line->Level = 1; |
Manuel Klimek | c3d0c82 | 2013-01-07 09:34:28 +0000 | [diff] [blame] | 246 | |
| 247 | // Errors during a preprocessor directive can only affect the layout of the |
| 248 | // preprocessor directive, and thus we ignore them. An alternative approach |
| 249 | // would be to use the same approach we use on the file level (no |
| 250 | // re-indentation if there was a structural error) within the macro |
| 251 | // definition. |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 252 | parseFile(); |
| 253 | } |
| 254 | |
| 255 | void UnwrappedLineParser::parsePPUnknown() { |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 256 | do { |
Manuel Klimek | a080a18 | 2013-01-02 16:30:12 +0000 | [diff] [blame] | 257 | nextToken(); |
| 258 | } while (!eof()); |
| 259 | addUnwrappedLine(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 260 | } |
| 261 | |
Alexander Kornienko | 99b0e14 | 2013-04-09 16:15:19 +0000 | [diff] [blame] | 262 | // Here we blacklist certain tokens that are not usually the first token in an |
| 263 | // unwrapped line. This is used in attempt to distinguish macro calls without |
| 264 | // trailing semicolons from other constructs split to several lines. |
| 265 | bool tokenCanStartNewLine(clang::Token Tok) { |
| 266 | // Semicolon can be a null-statement, l_square can be a start of a macro or |
| 267 | // a C++11 attribute, but this doesn't seem to be common. |
| 268 | return Tok.isNot(tok::semi) && Tok.isNot(tok::l_brace) && |
| 269 | Tok.isNot(tok::l_square) && |
| 270 | // Tokens that can only be used as binary operators and a part of |
| 271 | // overloaded operator names. |
| 272 | Tok.isNot(tok::period) && Tok.isNot(tok::periodstar) && |
| 273 | Tok.isNot(tok::arrow) && Tok.isNot(tok::arrowstar) && |
| 274 | Tok.isNot(tok::less) && Tok.isNot(tok::greater) && |
| 275 | Tok.isNot(tok::slash) && Tok.isNot(tok::percent) && |
| 276 | Tok.isNot(tok::lessless) && Tok.isNot(tok::greatergreater) && |
| 277 | Tok.isNot(tok::equal) && Tok.isNot(tok::plusequal) && |
| 278 | Tok.isNot(tok::minusequal) && Tok.isNot(tok::starequal) && |
| 279 | Tok.isNot(tok::slashequal) && Tok.isNot(tok::percentequal) && |
| 280 | Tok.isNot(tok::ampequal) && Tok.isNot(tok::pipeequal) && |
| 281 | Tok.isNot(tok::caretequal) && Tok.isNot(tok::greatergreaterequal) && |
| 282 | Tok.isNot(tok::lesslessequal) && |
| 283 | // Colon is used in labels, base class lists, initializer lists, |
| 284 | // range-based for loops, ternary operator, but should never be the |
| 285 | // first token in an unwrapped line. |
| 286 | Tok.isNot(tok::colon); |
| 287 | } |
| 288 | |
/// \brief Parses one structural element starting at the current token.
///
/// The current token must not be '{'. The function works in two phases:
/// first the leading token is inspected and constructs with a dedicated
/// parser (namespaces, access specifiers, control flow, labels, 'return',
/// 'extern "..." {', some '@' keywords) are dispatched directly. Everything
/// else falls through to a generic loop that consumes tokens until it finds
/// the end of the element.
void UnwrappedLineParser::parseStructuralElement() {
  assert(!FormatTok.Tok.is(tok::l_brace));
  // Phase 1: dispatch on the first token of the element.
  switch (FormatTok.Tok.getKind()) {
  case tok::at:
    nextToken();
    // '@' directly followed by '{' is parsed as a braced list; the rest of
    // the element is then handled by the generic loop below.
    if (FormatTok.Tok.is(tok::l_brace)) {
      parseBracedList();
      break;
    }
    switch (FormatTok.Tok.getObjCKeywordID()) {
    case tok::objc_public:
    case tok::objc_protected:
    case tok::objc_package:
    case tok::objc_private:
      return parseAccessSpecifier();
    case tok::objc_interface:
    case tok::objc_implementation:
      return parseObjCInterfaceOrImplementation();
    case tok::objc_protocol:
      return parseObjCProtocol();
    case tok::objc_end:
      return; // Handled by the caller.
    case tok::objc_optional:
    case tok::objc_required:
      // These keywords form a line of their own.
      nextToken();
      addUnwrappedLine();
      return;
    default:
      break;
    }
    break;
  case tok::kw_namespace:
    parseNamespace();
    return;
  case tok::kw_inline:
    nextToken();
    // 'inline namespace' is parsed as a namespace; any other use of 'inline'
    // continues in the generic loop.
    if (FormatTok.Tok.is(tok::kw_namespace)) {
      parseNamespace();
      return;
    }
    break;
  case tok::kw_public:
  case tok::kw_protected:
  case tok::kw_private:
    parseAccessSpecifier();
    return;
  case tok::kw_if:
    parseIfThenElse();
    return;
  case tok::kw_for:
  case tok::kw_while:
    parseForOrWhileLoop();
    return;
  case tok::kw_do:
    parseDoWhile();
    return;
  case tok::kw_switch:
    parseSwitch();
    return;
  case tok::kw_default:
    // Consume 'default' here; parseLabel() takes over from the next token.
    nextToken();
    parseLabel();
    return;
  case tok::kw_case:
    parseCaseLabel();
    return;
  case tok::kw_return:
    parseReturn();
    return;
  case tok::kw_extern:
    nextToken();
    // 'extern "<string>" {' opens a block whose contents must be
    // declarations and which adds no indentation level.
    if (FormatTok.Tok.is(tok::string_literal)) {
      nextToken();
      if (FormatTok.Tok.is(tok::l_brace)) {
        parseBlock(/*MustBeDeclaration=*/ true, 0);
        addUnwrappedLine();
        return;
      }
    }
    // In all other cases, parse the declaration.
    break;
  default:
    break;
  }
  // Phase 2: consume tokens until the end of the element is found. The loop
  // returns on ';', on '}' (left unconsumed), after a block, after a label,
  // or after something that looks like a macro call without a semicolon.
  do {
    switch (FormatTok.Tok.getKind()) {
    case tok::at:
      nextToken();
      if (FormatTok.Tok.is(tok::l_brace))
        parseBracedList();
      break;
    case tok::kw_enum:
      parseEnum();
      break;
    case tok::kw_struct:
    case tok::kw_union:
    case tok::kw_class:
      parseRecord();
      // A record declaration or definition is always the start of a structural
      // element.
      break;
    case tok::semi:
      nextToken();
      addUnwrappedLine();
      return;
    case tok::r_brace:
      // The '}' is not consumed here; only the line collected so far is
      // emitted.
      addUnwrappedLine();
      return;
    case tok::l_paren:
      parseParens();
      break;
    case tok::l_brace:
      // A block outside of parentheses must be the last part of a
      // structural element.
      // FIXME: Figure out cases where this is not true, and add projections for
      // them (the one we know is missing are lambdas).
      parseBlock(/*MustBeDeclaration=*/ false);
      addUnwrappedLine();
      return;
    case tok::identifier:
      nextToken();
      // NOTE(review): a token count of 1 presumably means the identifier just
      // consumed is the first token of the line - confirm against
      // nextToken()/pushToken().
      if (Line->Tokens.size() == 1) {
        if (FormatTok.Tok.is(tok::colon)) {
          parseLabel();
          return;
        }
        // Recognize function-like macro usages without trailing semicolon.
        if (FormatTok.Tok.is(tok::l_paren)) {
          parseParens();
          // Only end the line if the token after ')' follows an unescaped
          // newline and is one that plausibly starts a new line.
          if (FormatTok.HasUnescapedNewline &&
              tokenCanStartNewLine(FormatTok.Tok)) {
            addUnwrappedLine();
            return;
          }
        }
      }
      break;
    case tok::equal:
      nextToken();
      // '= {' starts a braced initializer list rather than a block.
      if (FormatTok.Tok.is(tok::l_brace)) {
        parseBracedList();
      }
      break;
    default:
      nextToken();
      break;
    }
  } while (!eof());
}
| 438 | |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 439 | void UnwrappedLineParser::parseBracedList() { |
| 440 | nextToken(); |
| 441 | |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 442 | // FIXME: Once we have an expression parser in the UnwrappedLineParser, |
| 443 | // replace this by using parseAssigmentExpression() inside. |
| 444 | bool StartOfExpression = true; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 445 | do { |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 446 | // FIXME: When we start to support lambdas, we'll want to parse them away |
| 447 | // here, otherwise our bail-out scenarios below break. The better solution |
| 448 | // might be to just implement a more or less complete expression parser. |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 449 | switch (FormatTok.Tok.getKind()) { |
| 450 | case tok::l_brace: |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 451 | if (!StartOfExpression) { |
| 452 | // Probably a missing closing brace. Bail out. |
| 453 | addUnwrappedLine(); |
| 454 | return; |
| 455 | } |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 456 | parseBracedList(); |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 457 | StartOfExpression = false; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 458 | break; |
| 459 | case tok::r_brace: |
| 460 | nextToken(); |
| 461 | return; |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 462 | case tok::semi: |
| 463 | // Probably a missing closing brace. Bail out. |
| 464 | return; |
| 465 | case tok::comma: |
| 466 | nextToken(); |
| 467 | StartOfExpression = true; |
| 468 | break; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 469 | default: |
| 470 | nextToken(); |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 471 | StartOfExpression = false; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 472 | break; |
| 473 | } |
| 474 | } while (!eof()); |
| 475 | } |
| 476 | |
Manuel Klimek | c44ee89 | 2013-01-21 10:07:49 +0000 | [diff] [blame] | 477 | void UnwrappedLineParser::parseReturn() { |
| 478 | nextToken(); |
| 479 | |
| 480 | do { |
| 481 | switch (FormatTok.Tok.getKind()) { |
| 482 | case tok::l_brace: |
| 483 | parseBracedList(); |
Manuel Klimek | 423dd93 | 2013-04-10 09:52:05 +0000 | [diff] [blame] | 484 | if (FormatTok.Tok.isNot(tok::semi)) { |
| 485 | // Assume missing ';'. |
| 486 | addUnwrappedLine(); |
| 487 | return; |
| 488 | } |
Manuel Klimek | c44ee89 | 2013-01-21 10:07:49 +0000 | [diff] [blame] | 489 | break; |
| 490 | case tok::l_paren: |
| 491 | parseParens(); |
| 492 | break; |
| 493 | case tok::r_brace: |
| 494 | // Assume missing ';'. |
| 495 | addUnwrappedLine(); |
| 496 | return; |
| 497 | case tok::semi: |
| 498 | nextToken(); |
| 499 | addUnwrappedLine(); |
| 500 | return; |
| 501 | default: |
| 502 | nextToken(); |
| 503 | break; |
| 504 | } |
| 505 | } while (!eof()); |
| 506 | } |
| 507 | |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 508 | void UnwrappedLineParser::parseParens() { |
| 509 | assert(FormatTok.Tok.is(tok::l_paren) && "'(' expected."); |
| 510 | nextToken(); |
| 511 | do { |
| 512 | switch (FormatTok.Tok.getKind()) { |
| 513 | case tok::l_paren: |
| 514 | parseParens(); |
| 515 | break; |
| 516 | case tok::r_paren: |
| 517 | nextToken(); |
| 518 | return; |
Nico Weber | 2afbe52 | 2013-02-10 04:38:23 +0000 | [diff] [blame] | 519 | case tok::l_brace: { |
| 520 | nextToken(); |
| 521 | ScopedLineState LineState(*this); |
| 522 | ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack, |
| 523 | /*MustBeDeclaration=*/ false); |
| 524 | Line->Level += 1; |
| 525 | parseLevel(/*HasOpeningBrace=*/ true); |
| 526 | Line->Level -= 1; |
Manuel Klimek | bb42bf1 | 2013-01-10 11:52:21 +0000 | [diff] [blame] | 527 | break; |
Nico Weber | 2afbe52 | 2013-02-10 04:38:23 +0000 | [diff] [blame] | 528 | } |
Nico Weber | d74fcdb | 2013-02-10 20:35:35 +0000 | [diff] [blame] | 529 | case tok::at: |
| 530 | nextToken(); |
| 531 | if (FormatTok.Tok.is(tok::l_brace)) |
| 532 | parseBracedList(); |
| 533 | break; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 534 | default: |
| 535 | nextToken(); |
| 536 | break; |
| 537 | } |
| 538 | } while (!eof()); |
| 539 | } |
| 540 | |
| 541 | void UnwrappedLineParser::parseIfThenElse() { |
| 542 | assert(FormatTok.Tok.is(tok::kw_if) && "'if' expected"); |
| 543 | nextToken(); |
Manuel Klimek | d465843 | 2013-01-11 18:28:36 +0000 | [diff] [blame] | 544 | if (FormatTok.Tok.is(tok::l_paren)) |
| 545 | parseParens(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 546 | bool NeedsUnwrappedLine = false; |
| 547 | if (FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 548 | parseBlock(/*MustBeDeclaration=*/ false); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 549 | NeedsUnwrappedLine = true; |
| 550 | } else { |
| 551 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 552 | ++Line->Level; |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 553 | parseStructuralElement(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 554 | --Line->Level; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 555 | } |
| 556 | if (FormatTok.Tok.is(tok::kw_else)) { |
| 557 | nextToken(); |
| 558 | if (FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 559 | parseBlock(/*MustBeDeclaration=*/ false); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 560 | addUnwrappedLine(); |
| 561 | } else if (FormatTok.Tok.is(tok::kw_if)) { |
| 562 | parseIfThenElse(); |
| 563 | } else { |
| 564 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 565 | ++Line->Level; |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 566 | parseStructuralElement(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 567 | --Line->Level; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 568 | } |
| 569 | } else if (NeedsUnwrappedLine) { |
| 570 | addUnwrappedLine(); |
| 571 | } |
| 572 | } |
| 573 | |
Alexander Kornienko | 1575731 | 2012-12-06 18:03:27 +0000 | [diff] [blame] | 574 | void UnwrappedLineParser::parseNamespace() { |
| 575 | assert(FormatTok.Tok.is(tok::kw_namespace) && "'namespace' expected"); |
| 576 | nextToken(); |
| 577 | if (FormatTok.Tok.is(tok::identifier)) |
| 578 | nextToken(); |
| 579 | if (FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 580 | parseBlock(/*MustBeDeclaration=*/ true, 0); |
Manuel Klimek | 7fc2db0 | 2013-02-06 16:08:09 +0000 | [diff] [blame] | 581 | // Munch the semicolon after a namespace. This is more common than one would |
| 582 | // think. Puttin the semicolon into its own line is very ugly. |
| 583 | if (FormatTok.Tok.is(tok::semi)) |
| 584 | nextToken(); |
Alexander Kornienko | 1575731 | 2012-12-06 18:03:27 +0000 | [diff] [blame] | 585 | addUnwrappedLine(); |
| 586 | } |
| 587 | // FIXME: Add error handling. |
| 588 | } |
| 589 | |
Alexander Kornienko | 2e97cfc | 2012-12-05 15:06:06 +0000 | [diff] [blame] | 590 | void UnwrappedLineParser::parseForOrWhileLoop() { |
| 591 | assert((FormatTok.Tok.is(tok::kw_for) || FormatTok.Tok.is(tok::kw_while)) && |
| 592 | "'for' or 'while' expected"); |
| 593 | nextToken(); |
Manuel Klimek | 6eca03f | 2013-01-11 19:23:05 +0000 | [diff] [blame] | 594 | if (FormatTok.Tok.is(tok::l_paren)) |
| 595 | parseParens(); |
Alexander Kornienko | 2e97cfc | 2012-12-05 15:06:06 +0000 | [diff] [blame] | 596 | if (FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 597 | parseBlock(/*MustBeDeclaration=*/ false); |
Alexander Kornienko | 2e97cfc | 2012-12-05 15:06:06 +0000 | [diff] [blame] | 598 | addUnwrappedLine(); |
| 599 | } else { |
| 600 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 601 | ++Line->Level; |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 602 | parseStructuralElement(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 603 | --Line->Level; |
Alexander Kornienko | 2e97cfc | 2012-12-05 15:06:06 +0000 | [diff] [blame] | 604 | } |
| 605 | } |
| 606 | |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 607 | void UnwrappedLineParser::parseDoWhile() { |
| 608 | assert(FormatTok.Tok.is(tok::kw_do) && "'do' expected"); |
| 609 | nextToken(); |
| 610 | if (FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 611 | parseBlock(/*MustBeDeclaration=*/ false); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 612 | } else { |
| 613 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 614 | ++Line->Level; |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 615 | parseStructuralElement(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 616 | --Line->Level; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 617 | } |
| 618 | |
Alexander Kornienko | 393b008 | 2012-12-04 15:40:36 +0000 | [diff] [blame] | 619 | // FIXME: Add error handling. |
| 620 | if (!FormatTok.Tok.is(tok::kw_while)) { |
| 621 | addUnwrappedLine(); |
| 622 | return; |
| 623 | } |
| 624 | |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 625 | nextToken(); |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 626 | parseStructuralElement(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 627 | } |
| 628 | |
| 629 | void UnwrappedLineParser::parseLabel() { |
Daniel Jasper | 89a0daa | 2013-02-12 20:17:17 +0000 | [diff] [blame] | 630 | if (FormatTok.Tok.isNot(tok::colon)) |
| 631 | return; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 632 | nextToken(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 633 | unsigned OldLineLevel = Line->Level; |
Daniel Jasper | bcca7e4 | 2013-03-20 10:23:53 +0000 | [diff] [blame] | 634 | if (Line->Level > 1 || (!Line->InPPDirective && Line->Level > 0)) |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 635 | --Line->Level; |
Daniel Jasper | c30eb51 | 2013-03-19 18:33:58 +0000 | [diff] [blame] | 636 | if (CommentsBeforeNextToken.empty() && FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 637 | parseBlock(/*MustBeDeclaration=*/ false); |
Nico Weber | 94fb729 | 2013-01-18 05:50:57 +0000 | [diff] [blame] | 638 | if (FormatTok.Tok.is(tok::kw_break)) |
| 639 | parseStructuralElement(); // "break;" after "}" goes on the same line. |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 640 | } |
| 641 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 642 | Line->Level = OldLineLevel; |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 643 | } |
| 644 | |
| 645 | void UnwrappedLineParser::parseCaseLabel() { |
| 646 | assert(FormatTok.Tok.is(tok::kw_case) && "'case' expected"); |
| 647 | // FIXME: fix handling of complex expressions here. |
| 648 | do { |
| 649 | nextToken(); |
| 650 | } while (!eof() && !FormatTok.Tok.is(tok::colon)); |
| 651 | parseLabel(); |
| 652 | } |
| 653 | |
| 654 | void UnwrappedLineParser::parseSwitch() { |
| 655 | assert(FormatTok.Tok.is(tok::kw_switch) && "'switch' expected"); |
| 656 | nextToken(); |
Manuel Klimek | 6eca03f | 2013-01-11 19:23:05 +0000 | [diff] [blame] | 657 | if (FormatTok.Tok.is(tok::l_paren)) |
| 658 | parseParens(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 659 | if (FormatTok.Tok.is(tok::l_brace)) { |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 660 | parseBlock(/*MustBeDeclaration=*/ false, Style.IndentCaseLabels ? 2 : 1); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 661 | addUnwrappedLine(); |
| 662 | } else { |
| 663 | addUnwrappedLine(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 664 | Line->Level += (Style.IndentCaseLabels ? 2 : 1); |
Manuel Klimek | f0ab0a3 | 2013-01-07 14:56:16 +0000 | [diff] [blame] | 665 | parseStructuralElement(); |
Manuel Klimek | 526ed11 | 2013-01-09 15:25:02 +0000 | [diff] [blame] | 666 | Line->Level -= (Style.IndentCaseLabels ? 2 : 1); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 667 | } |
| 668 | } |
| 669 | |
| 670 | void UnwrappedLineParser::parseAccessSpecifier() { |
| 671 | nextToken(); |
Alexander Kornienko | 56e49c5 | 2012-12-10 16:34:48 +0000 | [diff] [blame] | 672 | // Otherwise, we don't know what it is, and we'd better keep the next token. |
| 673 | if (FormatTok.Tok.is(tok::colon)) |
| 674 | nextToken(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 675 | addUnwrappedLine(); |
| 676 | } |
| 677 | |
| 678 | void UnwrappedLineParser::parseEnum() { |
Manuel Klimek | 308232c | 2013-01-21 19:17:52 +0000 | [diff] [blame] | 679 | nextToken(); |
| 680 | if (FormatTok.Tok.is(tok::identifier) || |
| 681 | FormatTok.Tok.is(tok::kw___attribute) || |
| 682 | FormatTok.Tok.is(tok::kw___declspec)) { |
| 683 | nextToken(); |
| 684 | // We can have macros or attributes in between 'enum' and the enum name. |
| 685 | if (FormatTok.Tok.is(tok::l_paren)) { |
Alexander Kornienko | a166e73 | 2012-12-04 14:46:19 +0000 | [diff] [blame] | 686 | parseParens(); |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 687 | } |
Manuel Klimek | 308232c | 2013-01-21 19:17:52 +0000 | [diff] [blame] | 688 | if (FormatTok.Tok.is(tok::identifier)) |
| 689 | nextToken(); |
| 690 | } |
| 691 | if (FormatTok.Tok.is(tok::l_brace)) { |
| 692 | nextToken(); |
| 693 | addUnwrappedLine(); |
| 694 | ++Line->Level; |
| 695 | do { |
| 696 | switch (FormatTok.Tok.getKind()) { |
Manuel Klimek | 308232c | 2013-01-21 19:17:52 +0000 | [diff] [blame] | 697 | case tok::l_paren: |
| 698 | parseParens(); |
| 699 | break; |
| 700 | case tok::r_brace: |
| 701 | addUnwrappedLine(); |
| 702 | nextToken(); |
| 703 | --Line->Level; |
| 704 | return; |
| 705 | case tok::comma: |
| 706 | nextToken(); |
| 707 | addUnwrappedLine(); |
| 708 | break; |
| 709 | default: |
| 710 | nextToken(); |
| 711 | break; |
| 712 | } |
| 713 | } while (!eof()); |
| 714 | } |
| 715 | // We fall through to parsing a structural element afterwards, so that in |
| 716 | // enum A {} n, m; |
| 717 | // "} n, m;" will end up in one unwrapped line. |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 718 | } |
| 719 | |
Manuel Klimek | 47ea7f6 | 2013-01-15 13:38:33 +0000 | [diff] [blame] | 720 | void UnwrappedLineParser::parseRecord() { |
Manuel Klimek | de76854 | 2013-01-07 18:10:23 +0000 | [diff] [blame] | 721 | nextToken(); |
Manuel Klimek | 47ea7f6 | 2013-01-15 13:38:33 +0000 | [diff] [blame] | 722 | if (FormatTok.Tok.is(tok::identifier) || |
| 723 | FormatTok.Tok.is(tok::kw___attribute) || |
| 724 | FormatTok.Tok.is(tok::kw___declspec)) { |
| 725 | nextToken(); |
| 726 | // We can have macros or attributes in between 'class' and the class name. |
| 727 | if (FormatTok.Tok.is(tok::l_paren)) { |
| 728 | parseParens(); |
Manuel Klimek | de76854 | 2013-01-07 18:10:23 +0000 | [diff] [blame] | 729 | } |
Manuel Klimek | b8b1ce1 | 2013-02-06 15:57:54 +0000 | [diff] [blame] | 730 | // The actual identifier can be a nested name specifier, and in macros |
| 731 | // it is often token-pasted. |
Manuel Klimek | 7f5b025 | 2013-01-21 10:17:14 +0000 | [diff] [blame] | 732 | while (FormatTok.Tok.is(tok::identifier) || |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 733 | FormatTok.Tok.is(tok::coloncolon) || FormatTok.Tok.is(tok::hashhash)) |
Manuel Klimek | 47ea7f6 | 2013-01-15 13:38:33 +0000 | [diff] [blame] | 734 | nextToken(); |
| 735 | |
Manuel Klimek | 3a3408c | 2013-01-21 13:58:54 +0000 | [diff] [blame] | 736 | // Note that parsing away template declarations here leads to incorrectly |
| 737 | // accepting function declarations as record declarations. |
| 738 | // In general, we cannot solve this problem. Consider: |
| 739 | // class A<int> B() {} |
| 740 | // which can be a function definition or a class definition when B() is a |
| 741 | // macro. If we find enough real-world cases where this is a problem, we |
| 742 | // can parse for the 'template' keyword in the beginning of the statement, |
| 743 | // and thus rule out the record production in case there is no template |
| 744 | // (this would still leave us with an ambiguity between template function |
| 745 | // and class declarations). |
| 746 | if (FormatTok.Tok.is(tok::colon) || FormatTok.Tok.is(tok::less)) { |
Daniel Jasper | 6fe554e | 2013-03-20 15:12:38 +0000 | [diff] [blame] | 747 | while (!eof() && FormatTok.Tok.isNot(tok::l_brace)) { |
Manuel Klimek | 47ea7f6 | 2013-01-15 13:38:33 +0000 | [diff] [blame] | 748 | if (FormatTok.Tok.is(tok::semi)) |
| 749 | return; |
| 750 | nextToken(); |
| 751 | } |
| 752 | } |
| 753 | } |
| 754 | if (FormatTok.Tok.is(tok::l_brace)) |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 755 | parseBlock(/*MustBeDeclaration=*/ true); |
Manuel Klimek | 3a3408c | 2013-01-21 13:58:54 +0000 | [diff] [blame] | 756 | // We fall through to parsing a structural element afterwards, so |
| 757 | // class A {} n, m; |
| 758 | // will end up in one unwrapped line. |
Manuel Klimek | de76854 | 2013-01-07 18:10:23 +0000 | [diff] [blame] | 759 | } |
| 760 | |
Nico Weber | 1abe6ea | 2013-01-09 21:15:03 +0000 | [diff] [blame] | 761 | void UnwrappedLineParser::parseObjCProtocolList() { |
| 762 | assert(FormatTok.Tok.is(tok::less) && "'<' expected."); |
| 763 | do |
| 764 | nextToken(); |
| 765 | while (!eof() && FormatTok.Tok.isNot(tok::greater)); |
| 766 | nextToken(); // Skip '>'. |
| 767 | } |
| 768 | |
| 769 | void UnwrappedLineParser::parseObjCUntilAtEnd() { |
| 770 | do { |
| 771 | if (FormatTok.Tok.isObjCAtKeyword(tok::objc_end)) { |
| 772 | nextToken(); |
| 773 | addUnwrappedLine(); |
| 774 | break; |
| 775 | } |
| 776 | parseStructuralElement(); |
| 777 | } while (!eof()); |
| 778 | } |
| 779 | |
Nico Weber | 50767d8 | 2013-01-09 23:25:37 +0000 | [diff] [blame] | 780 | void UnwrappedLineParser::parseObjCInterfaceOrImplementation() { |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 781 | nextToken(); |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 782 | nextToken(); // interface name |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 783 | |
| 784 | // @interface can be followed by either a base class, or a category. |
| 785 | if (FormatTok.Tok.is(tok::colon)) { |
| 786 | nextToken(); |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 787 | nextToken(); // base class name |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 788 | } else if (FormatTok.Tok.is(tok::l_paren)) |
| 789 | // Skip category, if present. |
| 790 | parseParens(); |
| 791 | |
Nico Weber | 1abe6ea | 2013-01-09 21:15:03 +0000 | [diff] [blame] | 792 | if (FormatTok.Tok.is(tok::less)) |
| 793 | parseObjCProtocolList(); |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 794 | |
| 795 | // If instance variables are present, keep the '{' on the first line too. |
| 796 | if (FormatTok.Tok.is(tok::l_brace)) |
Manuel Klimek | 70b03f4 | 2013-01-23 09:32:48 +0000 | [diff] [blame] | 797 | parseBlock(/*MustBeDeclaration=*/ true); |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 798 | |
| 799 | // With instance variables, this puts '}' on its own line. Without instance |
| 800 | // variables, this ends the @interface line. |
| 801 | addUnwrappedLine(); |
| 802 | |
Nico Weber | 1abe6ea | 2013-01-09 21:15:03 +0000 | [diff] [blame] | 803 | parseObjCUntilAtEnd(); |
| 804 | } |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 805 | |
Nico Weber | 1abe6ea | 2013-01-09 21:15:03 +0000 | [diff] [blame] | 806 | void UnwrappedLineParser::parseObjCProtocol() { |
| 807 | nextToken(); |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 808 | nextToken(); // protocol name |
Nico Weber | 1abe6ea | 2013-01-09 21:15:03 +0000 | [diff] [blame] | 809 | |
| 810 | if (FormatTok.Tok.is(tok::less)) |
| 811 | parseObjCProtocolList(); |
| 812 | |
| 813 | // Check for protocol declaration. |
| 814 | if (FormatTok.Tok.is(tok::semi)) { |
| 815 | nextToken(); |
| 816 | return addUnwrappedLine(); |
| 817 | } |
| 818 | |
| 819 | addUnwrappedLine(); |
| 820 | parseObjCUntilAtEnd(); |
Nico Weber | 27d1367 | 2013-01-09 20:25:35 +0000 | [diff] [blame] | 821 | } |
| 822 | |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 823 | void UnwrappedLineParser::addUnwrappedLine() { |
Daniel Jasper | cbb6c41 | 2013-01-16 09:10:19 +0000 | [diff] [blame] | 824 | if (Line->Tokens.empty()) |
Daniel Jasper | 26f7e78 | 2013-01-08 14:56:18 +0000 | [diff] [blame] | 825 | return; |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 826 | DEBUG({ |
Manuel Klimek | a28fc06 | 2013-02-11 12:33:24 +0000 | [diff] [blame] | 827 | llvm::dbgs() << "Line(" << Line->Level << ")" |
| 828 | << (Line->InPPDirective ? " MACRO" : "") << ": "; |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 829 | for (std::list<FormatToken>::iterator I = Line->Tokens.begin(), |
| 830 | E = Line->Tokens.end(); |
| 831 | I != E; ++I) { |
| 832 | llvm::dbgs() << I->Tok.getName() << " "; |
Daniel Jasper | cbb6c41 | 2013-01-16 09:10:19 +0000 | [diff] [blame] | 833 | |
Manuel Klimek | 8fa3799 | 2013-01-16 12:31:12 +0000 | [diff] [blame] | 834 | } |
| 835 | llvm::dbgs() << "\n"; |
| 836 | }); |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 837 | CurrentLines->push_back(*Line); |
Daniel Jasper | cbb6c41 | 2013-01-16 09:10:19 +0000 | [diff] [blame] | 838 | Line->Tokens.clear(); |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 839 | if (CurrentLines == &Lines && !PreprocessorDirectives.empty()) { |
Daniel Jasper | 516fb31 | 2013-03-01 18:11:39 +0000 | [diff] [blame] | 840 | for (std::vector<UnwrappedLine>::iterator |
| 841 | I = PreprocessorDirectives.begin(), |
| 842 | E = PreprocessorDirectives.end(); |
Manuel Klimek | 525fe16 | 2013-01-18 14:04:34 +0000 | [diff] [blame] | 843 | I != E; ++I) { |
| 844 | CurrentLines->push_back(*I); |
| 845 | } |
| 846 | PreprocessorDirectives.clear(); |
| 847 | } |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 848 | } |
| 849 | |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 850 | bool UnwrappedLineParser::eof() const { return FormatTok.Tok.is(tok::eof); } |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 851 | |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 852 | void UnwrappedLineParser::flushComments(bool NewlineBeforeNext) { |
| 853 | bool JustComments = Line->Tokens.empty(); |
| 854 | for (SmallVectorImpl<FormatToken>::const_iterator |
| 855 | I = CommentsBeforeNextToken.begin(), |
| 856 | E = CommentsBeforeNextToken.end(); |
| 857 | I != E; ++I) { |
Manuel Klimek | b3507cd | 2013-02-06 16:40:56 +0000 | [diff] [blame] | 858 | if (I->NewlinesBefore && JustComments) { |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 859 | addUnwrappedLine(); |
| 860 | } |
| 861 | pushToken(*I); |
| 862 | } |
| 863 | if (NewlineBeforeNext && JustComments) { |
| 864 | addUnwrappedLine(); |
| 865 | } |
| 866 | CommentsBeforeNextToken.clear(); |
| 867 | } |
| 868 | |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 869 | void UnwrappedLineParser::nextToken() { |
| 870 | if (eof()) |
| 871 | return; |
Manuel Klimek | b3507cd | 2013-02-06 16:40:56 +0000 | [diff] [blame] | 872 | flushComments(FormatTok.NewlinesBefore > 0); |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 873 | pushToken(FormatTok); |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 874 | readToken(); |
| 875 | } |
| 876 | |
| 877 | void UnwrappedLineParser::readToken() { |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 878 | bool CommentsInCurrentLine = true; |
| 879 | do { |
| 880 | FormatTok = Tokens->getNextToken(); |
| 881 | while (!Line->InPPDirective && FormatTok.Tok.is(tok::hash) && |
Alexander Kornienko | 3d713a7 | 2013-04-08 22:16:06 +0000 | [diff] [blame] | 882 | (FormatTok.HasUnescapedNewline || FormatTok.IsFirst)) { |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 883 | // If there is an unfinished unwrapped line, we flush the preprocessor |
| 884 | // directives only after that unwrapped line was finished later. |
Daniel Jasper | f9955d3 | 2013-03-20 12:37:50 +0000 | [diff] [blame] | 885 | bool SwitchToPreprocessorLines = |
| 886 | !Line->Tokens.empty() && CurrentLines == &Lines; |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 887 | ScopedLineState BlockState(*this, SwitchToPreprocessorLines); |
Alexander Kornienko | 4128e19 | 2013-04-03 12:38:53 +0000 | [diff] [blame] | 888 | // Comments stored before the preprocessor directive need to be output |
| 889 | // before the preprocessor directive, at the same level as the |
| 890 | // preprocessor directive, as we consider them to apply to the directive. |
| 891 | flushComments(FormatTok.NewlinesBefore > 0); |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 892 | parsePPDirective(); |
| 893 | } |
| 894 | if (!FormatTok.Tok.is(tok::comment)) |
| 895 | return; |
Manuel Klimek | b3507cd | 2013-02-06 16:40:56 +0000 | [diff] [blame] | 896 | if (FormatTok.NewlinesBefore > 0 || FormatTok.IsFirst) { |
Manuel Klimek | 86721d2 | 2013-01-22 16:31:55 +0000 | [diff] [blame] | 897 | CommentsInCurrentLine = false; |
| 898 | } |
| 899 | if (CommentsInCurrentLine) { |
| 900 | pushToken(FormatTok); |
| 901 | } else { |
| 902 | CommentsBeforeNextToken.push_back(FormatTok); |
| 903 | } |
| 904 | } while (!eof()); |
| 905 | } |
| 906 | |
| 907 | void UnwrappedLineParser::pushToken(const FormatToken &Tok) { |
| 908 | Line->Tokens.push_back(Tok); |
| 909 | if (MustBreakBeforeNextToken) { |
| 910 | Line->Tokens.back().MustBreakBefore = true; |
| 911 | MustBreakBeforeNextToken = false; |
Manuel Klimek | d4397b9 | 2013-01-04 23:34:14 +0000 | [diff] [blame] | 912 | } |
Daniel Jasper | bac016b | 2012-12-03 18:12:45 +0000 | [diff] [blame] | 913 | } |
| 914 | |
Daniel Jasper | cd16238 | 2013-01-07 13:26:07 +0000 | [diff] [blame] | 915 | } // end namespace format |
| 916 | } // end namespace clang |