blob: 261ae3030d9ae9eba15ff6a057e8df70a8dbb022 [file] [log] [blame]
//===--- UnwrappedLineParser.cpp - Format C++ code ------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief This file contains the implementation of the UnwrappedLineParser,
/// which turns a stream of tokens into UnwrappedLines.
///
//===----------------------------------------------------------------------===//
15
Chandler Carruth4b417452013-01-19 08:09:44 +000016#include "UnwrappedLineParser.h"
Benjamin Kramer33335df2015-03-01 21:36:40 +000017#include "llvm/ADT/STLExtras.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000018#include "llvm/Support/Debug.h"
Benjamin Kramer53f5e892015-03-23 18:05:43 +000019#include "llvm/Support/raw_ostream.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000020
Chandler Carruth10346662014-04-22 03:17:02 +000021#define DEBUG_TYPE "format-parser"
22
Daniel Jasperf7935112012-12-03 18:12:45 +000023namespace clang {
24namespace format {
25
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000026class FormatTokenSource {
27public:
Angel Garcia Gomez637d1e62015-10-20 13:23:58 +000028 virtual ~FormatTokenSource() {}
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000029 virtual FormatToken *getNextToken() = 0;
30
31 virtual unsigned getPosition() = 0;
32 virtual FormatToken *setPosition(unsigned Position) = 0;
33};
34
Craig Topper69665e12013-07-01 04:21:54 +000035namespace {
36
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000037class ScopedDeclarationState {
38public:
39 ScopedDeclarationState(UnwrappedLine &Line, std::vector<bool> &Stack,
40 bool MustBeDeclaration)
41 : Line(Line), Stack(Stack) {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000042 Line.MustBeDeclaration = MustBeDeclaration;
Manuel Klimek39080572013-01-23 11:03:04 +000043 Stack.push_back(MustBeDeclaration);
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000044 }
45 ~ScopedDeclarationState() {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000046 Stack.pop_back();
Manuel Klimekc1237a82013-01-23 14:08:21 +000047 if (!Stack.empty())
48 Line.MustBeDeclaration = Stack.back();
49 else
50 Line.MustBeDeclaration = true;
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000051 }
Daniel Jasper393564f2013-05-31 14:56:29 +000052
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000053private:
54 UnwrappedLine &Line;
55 std::vector<bool> &Stack;
56};
57
Krasimir Georgieva1c30932017-05-19 10:34:57 +000058static bool isLineComment(const FormatToken &FormatTok) {
59 return FormatTok.is(tok::comment) &&
60 FormatTok.TokenText.startswith("//");
61}
62
Krasimir Georgievea222a72017-05-22 10:07:56 +000063// Checks if \p FormatTok is a line comment that continues the line comment
64// \p Previous. The original column of \p MinColumnToken is used to determine
65// whether \p FormatTok is indented enough to the right to continue \p Previous.
66static bool continuesLineComment(const FormatToken &FormatTok,
67 const FormatToken *Previous,
68 const FormatToken *MinColumnToken) {
69 if (!Previous || !MinColumnToken)
70 return false;
71 unsigned MinContinueColumn =
72 MinColumnToken->OriginalColumn + (isLineComment(*MinColumnToken) ? 0 : 1);
73 return isLineComment(FormatTok) && FormatTok.NewlinesBefore == 1 &&
74 isLineComment(*Previous) &&
75 FormatTok.OriginalColumn >= MinContinueColumn;
76}
77
Manuel Klimek1abf7892013-01-04 23:34:14 +000078class ScopedMacroState : public FormatTokenSource {
79public:
80 ScopedMacroState(UnwrappedLine &Line, FormatTokenSource *&TokenSource,
Manuel Klimek20e0af62015-05-06 11:56:29 +000081 FormatToken *&ResetToken)
Manuel Klimek1abf7892013-01-04 23:34:14 +000082 : Line(Line), TokenSource(TokenSource), ResetToken(ResetToken),
Manuel Klimek1a18c402013-04-12 14:13:36 +000083 PreviousLineLevel(Line.Level), PreviousTokenSource(TokenSource),
Krasimir Georgieva1c30932017-05-19 10:34:57 +000084 Token(nullptr), PreviousToken(nullptr) {
Manuel Klimek1abf7892013-01-04 23:34:14 +000085 TokenSource = this;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000086 Line.Level = 0;
Manuel Klimek1abf7892013-01-04 23:34:14 +000087 Line.InPPDirective = true;
88 }
89
Alexander Kornienko34eb2072015-04-11 02:00:23 +000090 ~ScopedMacroState() override {
Manuel Klimek1abf7892013-01-04 23:34:14 +000091 TokenSource = PreviousTokenSource;
92 ResetToken = Token;
93 Line.InPPDirective = false;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000094 Line.Level = PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +000095 }
96
Craig Topperfb6b25b2014-03-15 04:29:04 +000097 FormatToken *getNextToken() override {
Manuel Klimek78725712013-01-07 10:03:37 +000098 // The \c UnwrappedLineParser guards against this by never calling
99 // \c getNextToken() after it has encountered the first eof token.
100 assert(!eof());
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000101 PreviousToken = Token;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000102 Token = PreviousTokenSource->getNextToken();
103 if (eof())
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000104 return getFakeEOF();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000105 return Token;
106 }
107
Craig Topperfb6b25b2014-03-15 04:29:04 +0000108 unsigned getPosition() override { return PreviousTokenSource->getPosition(); }
Manuel Klimekab419912013-05-23 09:41:43 +0000109
Craig Topperfb6b25b2014-03-15 04:29:04 +0000110 FormatToken *setPosition(unsigned Position) override {
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000111 PreviousToken = nullptr;
Manuel Klimekab419912013-05-23 09:41:43 +0000112 Token = PreviousTokenSource->setPosition(Position);
113 return Token;
114 }
115
Manuel Klimek1abf7892013-01-04 23:34:14 +0000116private:
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000117 bool eof() {
118 return Token && Token->HasUnescapedNewline &&
Krasimir Georgievea222a72017-05-22 10:07:56 +0000119 !continuesLineComment(*Token, PreviousToken,
120 /*MinColumnToken=*/PreviousToken);
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000121 }
Manuel Klimek1abf7892013-01-04 23:34:14 +0000122
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000123 FormatToken *getFakeEOF() {
124 static bool EOFInitialized = false;
125 static FormatToken FormatTok;
126 if (!EOFInitialized) {
127 FormatTok.Tok.startToken();
128 FormatTok.Tok.setKind(tok::eof);
129 EOFInitialized = true;
130 }
131 return &FormatTok;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000132 }
133
134 UnwrappedLine &Line;
135 FormatTokenSource *&TokenSource;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000136 FormatToken *&ResetToken;
Manuel Klimekef2cfb12013-01-05 22:14:16 +0000137 unsigned PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000138 FormatTokenSource *PreviousTokenSource;
139
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000140 FormatToken *Token;
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000141 FormatToken *PreviousToken;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000142};
143
Craig Topper69665e12013-07-01 04:21:54 +0000144} // end anonymous namespace
145
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000146class ScopedLineState {
147public:
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000148 ScopedLineState(UnwrappedLineParser &Parser,
149 bool SwitchToPreprocessorLines = false)
David Blaikieefb6eb22014-08-09 20:02:07 +0000150 : Parser(Parser), OriginalLines(Parser.CurrentLines) {
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000151 if (SwitchToPreprocessorLines)
152 Parser.CurrentLines = &Parser.PreprocessorDirectives;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000153 else if (!Parser.Line->Tokens.empty())
154 Parser.CurrentLines = &Parser.Line->Tokens.back().Children;
David Blaikieefb6eb22014-08-09 20:02:07 +0000155 PreBlockLine = std::move(Parser.Line);
156 Parser.Line = llvm::make_unique<UnwrappedLine>();
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000157 Parser.Line->Level = PreBlockLine->Level;
158 Parser.Line->InPPDirective = PreBlockLine->InPPDirective;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000159 }
160
161 ~ScopedLineState() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000162 if (!Parser.Line->Tokens.empty()) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000163 Parser.addUnwrappedLine();
164 }
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000165 assert(Parser.Line->Tokens.empty());
David Blaikieefb6eb22014-08-09 20:02:07 +0000166 Parser.Line = std::move(PreBlockLine);
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000167 if (Parser.CurrentLines == &Parser.PreprocessorDirectives)
168 Parser.MustBreakBeforeNextToken = true;
169 Parser.CurrentLines = OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000170 }
171
172private:
173 UnwrappedLineParser &Parser;
174
David Blaikieefb6eb22014-08-09 20:02:07 +0000175 std::unique_ptr<UnwrappedLine> PreBlockLine;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000176 SmallVectorImpl<UnwrappedLine> *OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000177};
178
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000179class CompoundStatementIndenter {
180public:
181 CompoundStatementIndenter(UnwrappedLineParser *Parser,
182 const FormatStyle &Style, unsigned &LineLevel)
183 : LineLevel(LineLevel), OldLineLevel(LineLevel) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000184 if (Style.BraceWrapping.AfterControlStatement)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000185 Parser->addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000186 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000187 ++LineLevel;
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000188 }
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000189 ~CompoundStatementIndenter() { LineLevel = OldLineLevel; }
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000190
191private:
192 unsigned &LineLevel;
193 unsigned OldLineLevel;
194};
195
Craig Topper69665e12013-07-01 04:21:54 +0000196namespace {
197
Manuel Klimekab419912013-05-23 09:41:43 +0000198class IndexedTokenSource : public FormatTokenSource {
199public:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000200 IndexedTokenSource(ArrayRef<FormatToken *> Tokens)
Manuel Klimekab419912013-05-23 09:41:43 +0000201 : Tokens(Tokens), Position(-1) {}
202
Craig Topperfb6b25b2014-03-15 04:29:04 +0000203 FormatToken *getNextToken() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000204 ++Position;
205 return Tokens[Position];
206 }
207
Craig Topperfb6b25b2014-03-15 04:29:04 +0000208 unsigned getPosition() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000209 assert(Position >= 0);
210 return Position;
211 }
212
Craig Topperfb6b25b2014-03-15 04:29:04 +0000213 FormatToken *setPosition(unsigned P) override {
Manuel Klimekab419912013-05-23 09:41:43 +0000214 Position = P;
215 return Tokens[Position];
216 }
217
Manuel Klimek71814b42013-10-11 21:25:45 +0000218 void reset() { Position = -1; }
219
Manuel Klimekab419912013-05-23 09:41:43 +0000220private:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000221 ArrayRef<FormatToken *> Tokens;
Manuel Klimekab419912013-05-23 09:41:43 +0000222 int Position;
223};
224
Craig Topper69665e12013-07-01 04:21:54 +0000225} // end anonymous namespace
226
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000227UnwrappedLineParser::UnwrappedLineParser(const FormatStyle &Style,
Daniel Jasperd0ec0d62014-11-04 12:41:02 +0000228 const AdditionalKeywords &Keywords,
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000229 ArrayRef<FormatToken *> Tokens,
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000230 UnwrappedLineConsumer &Callback)
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000231 : Line(new UnwrappedLine), MustBreakBeforeNextToken(false),
Krasimir Georgiev00c5c722017-02-02 15:32:19 +0000232 CurrentLines(&Lines), Style(Style), Keywords(Keywords),
233 CommentPragmasRegex(Style.CommentPragmas), Tokens(nullptr),
Manuel Klimek20e0af62015-05-06 11:56:29 +0000234 Callback(Callback), AllTokens(Tokens), PPBranchLevel(-1) {}
Manuel Klimek71814b42013-10-11 21:25:45 +0000235
236void UnwrappedLineParser::reset() {
237 PPBranchLevel = -1;
238 Line.reset(new UnwrappedLine);
239 CommentsBeforeNextToken.clear();
Craig Topper2145bc02014-05-09 08:15:10 +0000240 FormatTok = nullptr;
Manuel Klimek71814b42013-10-11 21:25:45 +0000241 MustBreakBeforeNextToken = false;
242 PreprocessorDirectives.clear();
243 CurrentLines = &Lines;
244 DeclarationScopeStack.clear();
Manuel Klimek71814b42013-10-11 21:25:45 +0000245 PPStack.clear();
246}
Daniel Jasperf7935112012-12-03 18:12:45 +0000247
Manuel Klimek20e0af62015-05-06 11:56:29 +0000248void UnwrappedLineParser::parse() {
Manuel Klimekab419912013-05-23 09:41:43 +0000249 IndexedTokenSource TokenSource(AllTokens);
Manuel Klimek71814b42013-10-11 21:25:45 +0000250 do {
251 DEBUG(llvm::dbgs() << "----\n");
252 reset();
253 Tokens = &TokenSource;
254 TokenSource.reset();
Daniel Jaspera79064a2013-03-01 18:11:39 +0000255
Manuel Klimek71814b42013-10-11 21:25:45 +0000256 readToken();
257 parseFile();
258 // Create line with eof token.
259 pushToken(FormatTok);
260 addUnwrappedLine();
261
262 for (SmallVectorImpl<UnwrappedLine>::iterator I = Lines.begin(),
263 E = Lines.end();
264 I != E; ++I) {
265 Callback.consumeUnwrappedLine(*I);
266 }
267 Callback.finishRun();
268 Lines.clear();
269 while (!PPLevelBranchIndex.empty() &&
Daniel Jasper53bd1672013-10-12 13:32:56 +0000270 PPLevelBranchIndex.back() + 1 >= PPLevelBranchCount.back()) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000271 PPLevelBranchIndex.resize(PPLevelBranchIndex.size() - 1);
272 PPLevelBranchCount.resize(PPLevelBranchCount.size() - 1);
273 }
274 if (!PPLevelBranchIndex.empty()) {
275 ++PPLevelBranchIndex.back();
276 assert(PPLevelBranchIndex.size() == PPLevelBranchCount.size());
277 assert(PPLevelBranchIndex.back() <= PPLevelBranchCount.back());
278 }
279 } while (!PPLevelBranchIndex.empty());
Manuel Klimek1abf7892013-01-04 23:34:14 +0000280}
281
Manuel Klimek1a18c402013-04-12 14:13:36 +0000282void UnwrappedLineParser::parseFile() {
Daniel Jasper9326f912015-05-05 08:40:32 +0000283 // The top-level context in a file always has declarations, except for pre-
284 // processor directives and JavaScript files.
285 bool MustBeDeclaration =
286 !Line->InPPDirective && Style.Language != FormatStyle::LK_JavaScript;
287 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
288 MustBeDeclaration);
Nico Weber9096fc02013-06-26 00:30:14 +0000289 parseLevel(/*HasOpeningBrace=*/false);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000290 // Make sure to format the remaining tokens.
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000291 flushComments(true);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000292 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000293}
294
Manuel Klimek1a18c402013-04-12 14:13:36 +0000295void UnwrappedLineParser::parseLevel(bool HasOpeningBrace) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000296 bool SwitchLabelEncountered = false;
Daniel Jasperf7935112012-12-03 18:12:45 +0000297 do {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000298 tok::TokenKind kind = FormatTok->Tok.getKind();
299 if (FormatTok->Type == TT_MacroBlockBegin) {
300 kind = tok::l_brace;
301 } else if (FormatTok->Type == TT_MacroBlockEnd) {
302 kind = tok::r_brace;
303 }
304
305 switch (kind) {
Daniel Jasperf7935112012-12-03 18:12:45 +0000306 case tok::comment:
Daniel Jaspere25509f2012-12-17 11:29:41 +0000307 nextToken();
308 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000309 break;
310 case tok::l_brace:
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000311 // FIXME: Add parameter whether this can happen - if this happens, we must
312 // be in a non-declaration context.
Daniel Jasperb86e2722015-08-24 13:23:37 +0000313 if (!FormatTok->is(TT_MacroBlockBegin) && tryToParseBracedList())
314 continue;
Nico Weber9096fc02013-06-26 00:30:14 +0000315 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +0000316 addUnwrappedLine();
317 break;
318 case tok::r_brace:
Manuel Klimek1a18c402013-04-12 14:13:36 +0000319 if (HasOpeningBrace)
320 return;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000321 nextToken();
322 addUnwrappedLine();
Manuel Klimek1058d982013-01-06 20:07:31 +0000323 break;
Daniel Jasper516d7972013-07-25 11:31:57 +0000324 case tok::kw_default:
325 case tok::kw_case:
Daniel Jasper72407622013-09-02 08:26:29 +0000326 if (!SwitchLabelEncountered &&
327 (Style.IndentCaseLabels || (Line->InPPDirective && Line->Level == 1)))
328 ++Line->Level;
Daniel Jasper516d7972013-07-25 11:31:57 +0000329 SwitchLabelEncountered = true;
330 parseStructuralElement();
331 break;
Daniel Jasperf7935112012-12-03 18:12:45 +0000332 default:
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000333 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +0000334 break;
335 }
336 } while (!eof());
337}
338
Daniel Jasperadba2aa2015-05-18 12:52:00 +0000339void UnwrappedLineParser::calculateBraceTypes(bool ExpectClassBody) {
Manuel Klimekab419912013-05-23 09:41:43 +0000340 // We'll parse forward through the tokens until we hit
341 // a closing brace or eof - note that getNextToken() will
342 // parse macros, so this will magically work inside macro
343 // definitions, too.
344 unsigned StoredPosition = Tokens->getPosition();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000345 FormatToken *Tok = FormatTok;
Daniel Jasperb9a49902016-01-09 15:56:28 +0000346 const FormatToken *PrevTok = getPreviousToken();
Manuel Klimekab419912013-05-23 09:41:43 +0000347 // Keep a stack of positions of lbrace tokens. We will
348 // update information about whether an lbrace starts a
349 // braced init list or a different block during the loop.
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000350 SmallVector<FormatToken *, 8> LBraceStack;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000351 assert(Tok->Tok.is(tok::l_brace));
Manuel Klimekab419912013-05-23 09:41:43 +0000352 do {
Daniel Jaspereb65e912015-12-21 18:31:15 +0000353 // Get next non-comment token.
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000354 FormatToken *NextTok;
Daniel Jasperca7bd722013-07-01 16:43:38 +0000355 unsigned ReadTokens = 0;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000356 do {
357 NextTok = Tokens->getNextToken();
Daniel Jasperca7bd722013-07-01 16:43:38 +0000358 ++ReadTokens;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000359 } while (NextTok->is(tok::comment));
360
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000361 switch (Tok->Tok.getKind()) {
Manuel Klimekab419912013-05-23 09:41:43 +0000362 case tok::l_brace:
Martin Probst95ed8e72017-05-31 09:29:40 +0000363 if (Style.Language == FormatStyle::LK_JavaScript && PrevTok) {
364 if (PrevTok->is(tok::colon))
365 // A colon indicates this code is in a type, or a braced list
366 // following a label in an object literal ({a: {b: 1}}). The code
367 // below could be confused by semicolons between the individual
368 // members in a type member list, which would normally trigger
369 // BK_Block. In both cases, this must be parsed as an inline braced
370 // init.
371 Tok->BlockKind = BK_BracedInit;
372 else if (PrevTok->is(tok::r_paren))
373 // `) { }` can only occur in function or method declarations in JS.
374 Tok->BlockKind = BK_Block;
375 } else {
Daniel Jasperb9a49902016-01-09 15:56:28 +0000376 Tok->BlockKind = BK_Unknown;
Martin Probst95ed8e72017-05-31 09:29:40 +0000377 }
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000378 LBraceStack.push_back(Tok);
Manuel Klimekab419912013-05-23 09:41:43 +0000379 break;
380 case tok::r_brace:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000381 if (LBraceStack.empty())
382 break;
383 if (LBraceStack.back()->BlockKind == BK_Unknown) {
384 bool ProbablyBracedList = false;
385 if (Style.Language == FormatStyle::LK_Proto) {
386 ProbablyBracedList = NextTok->isOneOf(tok::comma, tok::r_square);
387 } else {
388 // Using OriginalColumn to distinguish between ObjC methods and
389 // binary operators is a bit hacky.
390 bool NextIsObjCMethod = NextTok->isOneOf(tok::plus, tok::minus) &&
391 NextTok->OriginalColumn == 0;
Daniel Jasper91b032a2014-05-22 12:46:38 +0000392
Daniel Jasperb9a49902016-01-09 15:56:28 +0000393 // If there is a comma, semicolon or right paren after the closing
394 // brace, we assume this is a braced initializer list. Note that
395 // regardless how we mark inner braces here, we will overwrite the
396 // BlockKind later if we parse a braced list (where all blocks
397 // inside are by default braced lists), or when we explicitly detect
398 // blocks (for example while parsing lambdas).
Martin Probst95ed8e72017-05-31 09:29:40 +0000399 // FIXME: Some of these do not apply to JS, e.g. "} {" can never be a
400 // braced list in JS.
Daniel Jasperb9a49902016-01-09 15:56:28 +0000401 ProbablyBracedList =
Daniel Jasperacffeb82016-03-05 18:34:26 +0000402 (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probste1e12a72016-08-19 14:35:01 +0000403 NextTok->isOneOf(Keywords.kw_of, Keywords.kw_in,
404 Keywords.kw_as)) ||
Martin Probstb7fb2672017-05-10 13:53:29 +0000405 (Style.isCpp() && NextTok->is(tok::l_paren)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000406 NextTok->isOneOf(tok::comma, tok::period, tok::colon,
407 tok::r_paren, tok::r_square, tok::l_brace,
Martin Probstb7fb2672017-05-10 13:53:29 +0000408 tok::l_square, tok::ellipsis) ||
Daniel Jaspere4ada022016-12-13 10:05:03 +0000409 (NextTok->is(tok::identifier) &&
410 !PrevTok->isOneOf(tok::semi, tok::r_brace, tok::l_brace)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000411 (NextTok->is(tok::semi) &&
412 (!ExpectClassBody || LBraceStack.size() != 1)) ||
413 (NextTok->isBinaryOperator() && !NextIsObjCMethod);
Manuel Klimekab419912013-05-23 09:41:43 +0000414 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000415 if (ProbablyBracedList) {
416 Tok->BlockKind = BK_BracedInit;
417 LBraceStack.back()->BlockKind = BK_BracedInit;
418 } else {
419 Tok->BlockKind = BK_Block;
420 LBraceStack.back()->BlockKind = BK_Block;
421 }
Manuel Klimekab419912013-05-23 09:41:43 +0000422 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000423 LBraceStack.pop_back();
Manuel Klimekab419912013-05-23 09:41:43 +0000424 break;
Daniel Jasperac7e34e2014-03-13 10:11:17 +0000425 case tok::at:
Manuel Klimekab419912013-05-23 09:41:43 +0000426 case tok::semi:
427 case tok::kw_if:
428 case tok::kw_while:
429 case tok::kw_for:
430 case tok::kw_switch:
431 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +0000432 case tok::kw___try:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000433 if (!LBraceStack.empty() && LBraceStack.back()->BlockKind == BK_Unknown)
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000434 LBraceStack.back()->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000435 break;
436 default:
437 break;
438 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000439 PrevTok = Tok;
Manuel Klimekab419912013-05-23 09:41:43 +0000440 Tok = NextTok;
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000441 } while (Tok->Tok.isNot(tok::eof) && !LBraceStack.empty());
Daniel Jasperb9a49902016-01-09 15:56:28 +0000442
Manuel Klimekab419912013-05-23 09:41:43 +0000443 // Assume other blocks for all unclosed opening braces.
444 for (unsigned i = 0, e = LBraceStack.size(); i != e; ++i) {
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000445 if (LBraceStack[i]->BlockKind == BK_Unknown)
446 LBraceStack[i]->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000447 }
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000448
Manuel Klimekab419912013-05-23 09:41:43 +0000449 FormatTok = Tokens->setPosition(StoredPosition);
450}
451
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000452void UnwrappedLineParser::parseBlock(bool MustBeDeclaration, bool AddLevel,
453 bool MunchSemi) {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000454 assert(FormatTok->isOneOf(tok::l_brace, TT_MacroBlockBegin) &&
455 "'{' or macro block token expected");
456 const bool MacroBlock = FormatTok->is(TT_MacroBlockBegin);
Daniel Jaspereb65e912015-12-21 18:31:15 +0000457 FormatTok->BlockKind = BK_Block;
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000458
Daniel Jasper516d7972013-07-25 11:31:57 +0000459 unsigned InitialLevel = Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +0000460 nextToken();
461
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000462 if (MacroBlock && FormatTok->is(tok::l_paren))
463 parseParens();
464
Manuel Klimeka4fe1c12013-01-21 16:42:44 +0000465 addUnwrappedLine();
Krasimir Georgiev9f5608a2017-05-18 15:16:24 +0000466 size_t OpeningLineIndex = CurrentLines->empty()
467 ? (UnwrappedLine::kInvalidIndex)
468 : (CurrentLines->size() - 1);
Daniel Jasperf7935112012-12-03 18:12:45 +0000469
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000470 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
471 MustBeDeclaration);
Daniel Jasper65ee3472013-07-31 23:16:02 +0000472 if (AddLevel)
473 ++Line->Level;
Nico Weber9096fc02013-06-26 00:30:14 +0000474 parseLevel(/*HasOpeningBrace=*/true);
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000475
Marianne Mailhot-Sarrasin03137c62016-04-14 14:56:49 +0000476 if (eof())
477 return;
478
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000479 if (MacroBlock ? !FormatTok->is(TT_MacroBlockEnd)
480 : !FormatTok->is(tok::r_brace)) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000481 Line->Level = InitialLevel;
Daniel Jaspereb65e912015-12-21 18:31:15 +0000482 FormatTok->BlockKind = BK_Block;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000483 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000484 }
Alexander Kornienko0ea8e102012-12-04 15:40:36 +0000485
Daniel Jasperd1ae3582013-03-20 12:37:50 +0000486 nextToken(); // Munch the closing brace.
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000487
488 if (MacroBlock && FormatTok->is(tok::l_paren))
489 parseParens();
490
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000491 if (MunchSemi && FormatTok->Tok.is(tok::semi))
492 nextToken();
Daniel Jasper516d7972013-07-25 11:31:57 +0000493 Line->Level = InitialLevel;
Krasimir Georgiev7cb267a2017-02-27 13:28:36 +0000494 Line->MatchingOpeningBlockLineIndex = OpeningLineIndex;
Francois Ferrande56a8292017-06-14 12:29:47 +0000495 if (OpeningLineIndex != UnwrappedLine::kInvalidIndex) {
496 // Update the opening line to add the forward reference as well
497 (*CurrentLines)[OpeningLineIndex].MatchingOpeningBlockLineIndex =
498 CurrentLines->size() - 1;
499 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000500}
501
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000502static bool isGoogScope(const UnwrappedLine &Line) {
Daniel Jasper616de8642014-11-23 16:46:28 +0000503 // FIXME: Closure-library specific stuff should not be hard-coded but be
504 // configurable.
Daniel Jasper4a39c842014-05-06 13:54:10 +0000505 if (Line.Tokens.size() < 4)
506 return false;
507 auto I = Line.Tokens.begin();
508 if (I->Tok->TokenText != "goog")
509 return false;
510 ++I;
511 if (I->Tok->isNot(tok::period))
512 return false;
513 ++I;
514 if (I->Tok->TokenText != "scope")
515 return false;
516 ++I;
517 return I->Tok->is(tok::l_paren);
518}
519
Martin Probst101ec892017-05-09 20:04:09 +0000520static bool isIIFE(const UnwrappedLine &Line,
521 const AdditionalKeywords &Keywords) {
522 // Look for the start of an immediately invoked anonymous function.
523 // https://en.wikipedia.org/wiki/Immediately-invoked_function_expression
524 // This is commonly done in JavaScript to create a new, anonymous scope.
525 // Example: (function() { ... })()
526 if (Line.Tokens.size() < 3)
527 return false;
528 auto I = Line.Tokens.begin();
529 if (I->Tok->isNot(tok::l_paren))
530 return false;
531 ++I;
532 if (I->Tok->isNot(Keywords.kw_function))
533 return false;
534 ++I;
535 return I->Tok->is(tok::l_paren);
536}
537
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000538static bool ShouldBreakBeforeBrace(const FormatStyle &Style,
539 const FormatToken &InitialToken) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000540 if (InitialToken.is(tok::kw_namespace))
541 return Style.BraceWrapping.AfterNamespace;
542 if (InitialToken.is(tok::kw_class))
543 return Style.BraceWrapping.AfterClass;
544 if (InitialToken.is(tok::kw_union))
545 return Style.BraceWrapping.AfterUnion;
546 if (InitialToken.is(tok::kw_struct))
547 return Style.BraceWrapping.AfterStruct;
548 return false;
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000549}
550
Manuel Klimek516e0542013-09-04 13:25:30 +0000551void UnwrappedLineParser::parseChildBlock() {
552 FormatTok->BlockKind = BK_Block;
553 nextToken();
554 {
Martin Probst101ec892017-05-09 20:04:09 +0000555 bool SkipIndent =
556 (Style.Language == FormatStyle::LK_JavaScript &&
557 (isGoogScope(*Line) || isIIFE(*Line, Keywords)));
Manuel Klimek516e0542013-09-04 13:25:30 +0000558 ScopedLineState LineState(*this);
559 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
560 /*MustBeDeclaration=*/false);
Martin Probst101ec892017-05-09 20:04:09 +0000561 Line->Level += SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000562 parseLevel(/*HasOpeningBrace=*/true);
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000563 flushComments(isOnNewLine(*FormatTok));
Martin Probst101ec892017-05-09 20:04:09 +0000564 Line->Level -= SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000565 }
566 nextToken();
567}
568
Daniel Jasperf7935112012-12-03 18:12:45 +0000569void UnwrappedLineParser::parsePPDirective() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000570 assert(FormatTok->Tok.is(tok::hash) && "'#' expected");
Manuel Klimek20e0af62015-05-06 11:56:29 +0000571 ScopedMacroState MacroState(*Line, Tokens, FormatTok);
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000572 nextToken();
573
Craig Topper2145bc02014-05-09 08:15:10 +0000574 if (!FormatTok->Tok.getIdentifierInfo()) {
Manuel Klimek591b5802013-01-31 15:58:48 +0000575 parsePPUnknown();
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000576 return;
Daniel Jasperf7935112012-12-03 18:12:45 +0000577 }
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000578
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000579 switch (FormatTok->Tok.getIdentifierInfo()->getPPKeywordID()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000580 case tok::pp_define:
581 parsePPDefine();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000582 return;
583 case tok::pp_if:
Manuel Klimek71814b42013-10-11 21:25:45 +0000584 parsePPIf(/*IfDef=*/false);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000585 break;
586 case tok::pp_ifdef:
587 case tok::pp_ifndef:
Manuel Klimek71814b42013-10-11 21:25:45 +0000588 parsePPIf(/*IfDef=*/true);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000589 break;
590 case tok::pp_else:
591 parsePPElse();
592 break;
593 case tok::pp_elif:
594 parsePPElIf();
595 break;
596 case tok::pp_endif:
597 parsePPEndIf();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000598 break;
599 default:
600 parsePPUnknown();
601 break;
602 }
603}
604
Manuel Klimek68b03042014-04-14 09:14:11 +0000605void UnwrappedLineParser::conditionalCompilationCondition(bool Unreachable) {
606 if (Unreachable || (!PPStack.empty() && PPStack.back() == PP_Unreachable))
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000607 PPStack.push_back(PP_Unreachable);
608 else
609 PPStack.push_back(PP_Conditional);
610}
611
Manuel Klimek68b03042014-04-14 09:14:11 +0000612void UnwrappedLineParser::conditionalCompilationStart(bool Unreachable) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000613 ++PPBranchLevel;
614 assert(PPBranchLevel >= 0 && PPBranchLevel <= (int)PPLevelBranchIndex.size());
615 if (PPBranchLevel == (int)PPLevelBranchIndex.size()) {
616 PPLevelBranchIndex.push_back(0);
617 PPLevelBranchCount.push_back(0);
618 }
619 PPChainBranchIndex.push(0);
Manuel Klimek68b03042014-04-14 09:14:11 +0000620 bool Skip = PPLevelBranchIndex[PPBranchLevel] > 0;
621 conditionalCompilationCondition(Unreachable || Skip);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000622}
623
Manuel Klimek68b03042014-04-14 09:14:11 +0000624void UnwrappedLineParser::conditionalCompilationAlternative() {
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000625 if (!PPStack.empty())
626 PPStack.pop_back();
Manuel Klimek71814b42013-10-11 21:25:45 +0000627 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
628 if (!PPChainBranchIndex.empty())
629 ++PPChainBranchIndex.top();
Manuel Klimek68b03042014-04-14 09:14:11 +0000630 conditionalCompilationCondition(
631 PPBranchLevel >= 0 && !PPChainBranchIndex.empty() &&
632 PPLevelBranchIndex[PPBranchLevel] != PPChainBranchIndex.top());
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000633}
634
Manuel Klimek68b03042014-04-14 09:14:11 +0000635void UnwrappedLineParser::conditionalCompilationEnd() {
Manuel Klimek71814b42013-10-11 21:25:45 +0000636 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
637 if (PPBranchLevel >= 0 && !PPChainBranchIndex.empty()) {
638 if (PPChainBranchIndex.top() + 1 > PPLevelBranchCount[PPBranchLevel]) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000639 PPLevelBranchCount[PPBranchLevel] = PPChainBranchIndex.top() + 1;
640 }
641 }
Manuel Klimek14bd9172014-01-29 08:49:02 +0000642 // Guard against #endif's without #if.
643 if (PPBranchLevel > 0)
644 --PPBranchLevel;
Manuel Klimek71814b42013-10-11 21:25:45 +0000645 if (!PPChainBranchIndex.empty())
646 PPChainBranchIndex.pop();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000647 if (!PPStack.empty())
648 PPStack.pop_back();
Manuel Klimek68b03042014-04-14 09:14:11 +0000649}
650
651void UnwrappedLineParser::parsePPIf(bool IfDef) {
Daniel Jasper62703eb2017-03-01 11:10:11 +0000652 bool IfNDef = FormatTok->is(tok::pp_ifndef);
Manuel Klimek68b03042014-04-14 09:14:11 +0000653 nextToken();
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000654 bool Unreachable = false;
655 if (!IfDef && (FormatTok->is(tok::kw_false) || FormatTok->TokenText == "0"))
656 Unreachable = true;
Daniel Jasper62703eb2017-03-01 11:10:11 +0000657 if (IfDef && !IfNDef && FormatTok->TokenText == "SWIG")
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000658 Unreachable = true;
659 conditionalCompilationStart(Unreachable);
Manuel Klimek68b03042014-04-14 09:14:11 +0000660 parsePPUnknown();
661}
662
663void UnwrappedLineParser::parsePPElse() {
664 conditionalCompilationAlternative();
665 parsePPUnknown();
666}
667
668void UnwrappedLineParser::parsePPElIf() { parsePPElse(); }
669
670void UnwrappedLineParser::parsePPEndIf() {
671 conditionalCompilationEnd();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000672 parsePPUnknown();
673}
674
Manuel Klimek1abf7892013-01-04 23:34:14 +0000675void UnwrappedLineParser::parsePPDefine() {
676 nextToken();
677
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000678 if (FormatTok->Tok.getKind() != tok::identifier) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000679 parsePPUnknown();
680 return;
681 }
682 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000683 if (FormatTok->Tok.getKind() == tok::l_paren &&
684 FormatTok->WhitespaceRange.getBegin() ==
685 FormatTok->WhitespaceRange.getEnd()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000686 parseParens();
687 }
688 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +0000689 Line->Level = 1;
Manuel Klimek1b896292013-01-07 09:34:28 +0000690
691 // Errors during a preprocessor directive can only affect the layout of the
692 // preprocessor directive, and thus we ignore them. An alternative approach
693 // would be to use the same approach we use on the file level (no
694 // re-indentation if there was a structural error) within the macro
695 // definition.
Manuel Klimek1abf7892013-01-04 23:34:14 +0000696 parseFile();
697}
698
699void UnwrappedLineParser::parsePPUnknown() {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000700 do {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000701 nextToken();
702 } while (!eof());
703 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000704}
705
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000706// Here we blacklist certain tokens that are not usually the first token in an
707// unwrapped line. This is used in attempt to distinguish macro calls without
708// trailing semicolons from other constructs split to several lines.
Benjamin Kramer8407df72015-03-09 16:47:52 +0000709static bool tokenCanStartNewLine(const clang::Token &Tok) {
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000710 // Semicolon can be a null-statement, l_square can be a start of a macro or
711 // a C++11 attribute, but this doesn't seem to be common.
712 return Tok.isNot(tok::semi) && Tok.isNot(tok::l_brace) &&
713 Tok.isNot(tok::l_square) &&
714 // Tokens that can only be used as binary operators and a part of
715 // overloaded operator names.
716 Tok.isNot(tok::period) && Tok.isNot(tok::periodstar) &&
717 Tok.isNot(tok::arrow) && Tok.isNot(tok::arrowstar) &&
718 Tok.isNot(tok::less) && Tok.isNot(tok::greater) &&
719 Tok.isNot(tok::slash) && Tok.isNot(tok::percent) &&
720 Tok.isNot(tok::lessless) && Tok.isNot(tok::greatergreater) &&
721 Tok.isNot(tok::equal) && Tok.isNot(tok::plusequal) &&
722 Tok.isNot(tok::minusequal) && Tok.isNot(tok::starequal) &&
723 Tok.isNot(tok::slashequal) && Tok.isNot(tok::percentequal) &&
724 Tok.isNot(tok::ampequal) && Tok.isNot(tok::pipeequal) &&
725 Tok.isNot(tok::caretequal) && Tok.isNot(tok::greatergreaterequal) &&
726 Tok.isNot(tok::lesslessequal) &&
727 // Colon is used in labels, base class lists, initializer lists,
728 // range-based for loops, ternary operator, but should never be the
729 // first token in an unwrapped line.
Daniel Jasper5ebb2f32014-05-21 13:08:17 +0000730 Tok.isNot(tok::colon) &&
731 // 'noexcept' is a trailing annotation.
732 Tok.isNot(tok::kw_noexcept);
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000733}
734
Martin Probst533965c2016-04-19 18:19:06 +0000735static bool mustBeJSIdent(const AdditionalKeywords &Keywords,
736 const FormatToken *FormatTok) {
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000737 // FIXME: This returns true for C/C++ keywords like 'struct'.
738 return FormatTok->is(tok::identifier) &&
739 (FormatTok->Tok.getIdentifierInfo() == nullptr ||
Martin Probst3dbbefa2016-11-10 16:21:02 +0000740 !FormatTok->isOneOf(
741 Keywords.kw_in, Keywords.kw_of, Keywords.kw_as, Keywords.kw_async,
742 Keywords.kw_await, Keywords.kw_yield, Keywords.kw_finally,
743 Keywords.kw_function, Keywords.kw_import, Keywords.kw_is,
744 Keywords.kw_let, Keywords.kw_var, tok::kw_const,
745 Keywords.kw_abstract, Keywords.kw_extends, Keywords.kw_implements,
746 Keywords.kw_instanceof, Keywords.kw_interface,
747 Keywords.kw_throws));
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000748}
749
Martin Probst533965c2016-04-19 18:19:06 +0000750static bool mustBeJSIdentOrValue(const AdditionalKeywords &Keywords,
751 const FormatToken *FormatTok) {
Martin Probstb9316ff2016-09-18 17:21:52 +0000752 return FormatTok->Tok.isLiteral() ||
753 FormatTok->isOneOf(tok::kw_true, tok::kw_false) ||
754 mustBeJSIdent(Keywords, FormatTok);
Martin Probst533965c2016-04-19 18:19:06 +0000755}
756
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000757// isJSDeclOrStmt returns true if |FormatTok| starts a declaration or statement
758// when encountered after a value (see mustBeJSIdentOrValue).
759static bool isJSDeclOrStmt(const AdditionalKeywords &Keywords,
760 const FormatToken *FormatTok) {
761 return FormatTok->isOneOf(
Martin Probst5f8445b2016-04-24 22:05:09 +0000762 tok::kw_return, Keywords.kw_yield,
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000763 // conditionals
764 tok::kw_if, tok::kw_else,
765 // loops
766 tok::kw_for, tok::kw_while, tok::kw_do, tok::kw_continue, tok::kw_break,
767 // switch/case
768 tok::kw_switch, tok::kw_case,
769 // exceptions
770 tok::kw_throw, tok::kw_try, tok::kw_catch, Keywords.kw_finally,
771 // declaration
772 tok::kw_const, tok::kw_class, Keywords.kw_var, Keywords.kw_let,
Martin Probst5f8445b2016-04-24 22:05:09 +0000773 Keywords.kw_async, Keywords.kw_function,
774 // import/export
775 Keywords.kw_import, tok::kw_export);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000776}
777
778// readTokenWithJavaScriptASI reads the next token and terminates the current
779// line if JavaScript Automatic Semicolon Insertion must
780// happen between the current token and the next token.
781//
782// This method is conservative - it cannot cover all edge cases of JavaScript,
783// but only aims to correctly handle certain well known cases. It *must not*
784// return true in speculative cases.
785void UnwrappedLineParser::readTokenWithJavaScriptASI() {
786 FormatToken *Previous = FormatTok;
787 readToken();
788 FormatToken *Next = FormatTok;
789
790 bool IsOnSameLine =
791 CommentsBeforeNextToken.empty()
792 ? Next->NewlinesBefore == 0
793 : CommentsBeforeNextToken.front()->NewlinesBefore == 0;
794 if (IsOnSameLine)
795 return;
796
797 bool PreviousMustBeValue = mustBeJSIdentOrValue(Keywords, Previous);
Martin Probst717f6dc2016-10-21 05:11:38 +0000798 bool PreviousStartsTemplateExpr =
799 Previous->is(TT_TemplateString) && Previous->TokenText.endswith("${");
Martin Probstbbffeac2016-04-11 07:35:57 +0000800 if (PreviousMustBeValue && Line && Line->Tokens.size() > 1) {
801 // If the token before the previous one is an '@', the previous token is an
802 // annotation and can precede another identifier/value.
Benjamin Kramer5ffc24e2016-04-11 12:19:19 +0000803 const FormatToken *PrePrevious = std::prev(Line->Tokens.end(), 2)->Tok;
Martin Probstbbffeac2016-04-11 07:35:57 +0000804 if (PrePrevious->is(tok::at))
805 return;
806 }
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000807 if (Next->is(tok::exclaim) && PreviousMustBeValue)
Martin Probstd40bca42017-01-09 08:56:36 +0000808 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000809 bool NextMustBeValue = mustBeJSIdentOrValue(Keywords, Next);
Martin Probst717f6dc2016-10-21 05:11:38 +0000810 bool NextEndsTemplateExpr =
811 Next->is(TT_TemplateString) && Next->TokenText.startswith("}");
812 if (NextMustBeValue && !NextEndsTemplateExpr && !PreviousStartsTemplateExpr &&
813 (PreviousMustBeValue ||
814 Previous->isOneOf(tok::r_square, tok::r_paren, tok::plusplus,
815 tok::minusminus)))
Martin Probstd40bca42017-01-09 08:56:36 +0000816 return addUnwrappedLine();
Martin Probste6b5b342017-01-16 09:52:40 +0000817 if (PreviousMustBeValue && isJSDeclOrStmt(Keywords, Next))
Martin Probstd40bca42017-01-09 08:56:36 +0000818 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000819}
820
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000821void UnwrappedLineParser::parseStructuralElement() {
Daniel Jasper498f5582015-12-25 08:53:31 +0000822 assert(!FormatTok->is(tok::l_brace));
823 if (Style.Language == FormatStyle::LK_TableGen &&
824 FormatTok->is(tok::pp_include)) {
825 nextToken();
826 if (FormatTok->is(tok::string_literal))
827 nextToken();
828 addUnwrappedLine();
829 return;
830 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000831 switch (FormatTok->Tok.getKind()) {
Nico Weber04e9f1a2013-01-07 19:05:19 +0000832 case tok::at:
833 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000834 if (FormatTok->Tok.is(tok::l_brace)) {
Nico Weber372d8dc2013-02-10 20:35:35 +0000835 parseBracedList();
836 break;
837 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000838 switch (FormatTok->Tok.getObjCKeywordID()) {
Nico Weber04e9f1a2013-01-07 19:05:19 +0000839 case tok::objc_public:
840 case tok::objc_protected:
841 case tok::objc_package:
842 case tok::objc_private:
843 return parseAccessSpecifier();
Nico Weber7eecf4b2013-01-09 20:25:35 +0000844 case tok::objc_interface:
Nico Weber2ce0ac52013-01-09 23:25:37 +0000845 case tok::objc_implementation:
846 return parseObjCInterfaceOrImplementation();
Nico Weber8696a8d2013-01-09 21:15:03 +0000847 case tok::objc_protocol:
848 return parseObjCProtocol();
Nico Weberd8ffe752013-01-09 21:42:32 +0000849 case tok::objc_end:
850 return; // Handled by the caller.
Nico Weber51306d22013-01-10 00:25:19 +0000851 case tok::objc_optional:
852 case tok::objc_required:
853 nextToken();
854 addUnwrappedLine();
855 return;
Nico Weber45c48122015-06-28 01:06:16 +0000856 case tok::objc_autoreleasepool:
857 nextToken();
858 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000859 if (Style.BraceWrapping.AfterObjCDeclaration)
Nico Weber45c48122015-06-28 01:06:16 +0000860 addUnwrappedLine();
861 parseBlock(/*MustBeDeclaration=*/false);
862 }
863 addUnwrappedLine();
864 return;
Nico Weber33381f52015-02-07 01:57:32 +0000865 case tok::objc_try:
866 // This branch isn't strictly necessary (the kw_try case below would
867 // do this too after the tok::at is parsed above). But be explicit.
868 parseTryCatch();
869 return;
Nico Weber04e9f1a2013-01-07 19:05:19 +0000870 default:
871 break;
872 }
873 break;
Daniel Jasper8f463652014-08-26 23:15:12 +0000874 case tok::kw_asm:
Daniel Jasper8f463652014-08-26 23:15:12 +0000875 nextToken();
876 if (FormatTok->is(tok::l_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000877 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper2337f282015-01-12 10:14:56 +0000878 nextToken();
Daniel Jasper4429f142014-08-27 17:16:46 +0000879 while (FormatTok && FormatTok->isNot(tok::eof)) {
Daniel Jasper8f463652014-08-26 23:15:12 +0000880 if (FormatTok->is(tok::r_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000881 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper8f463652014-08-26 23:15:12 +0000882 nextToken();
Daniel Jasper790d4f92015-05-11 11:59:46 +0000883 addUnwrappedLine();
Daniel Jasper8f463652014-08-26 23:15:12 +0000884 break;
885 }
Daniel Jasper2337f282015-01-12 10:14:56 +0000886 FormatTok->Finalized = true;
Daniel Jasper8f463652014-08-26 23:15:12 +0000887 nextToken();
888 }
889 }
890 break;
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000891 case tok::kw_namespace:
892 parseNamespace();
893 return;
Dmitri Gribenko58d64e22012-12-30 21:27:25 +0000894 case tok::kw_inline:
895 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000896 if (FormatTok->Tok.is(tok::kw_namespace)) {
Dmitri Gribenko58d64e22012-12-30 21:27:25 +0000897 parseNamespace();
898 return;
899 }
900 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000901 case tok::kw_public:
902 case tok::kw_protected:
903 case tok::kw_private:
Daniel Jasper83709082015-02-18 17:14:05 +0000904 if (Style.Language == FormatStyle::LK_Java ||
905 Style.Language == FormatStyle::LK_JavaScript)
Daniel Jasperc58c70e2014-09-15 11:21:46 +0000906 nextToken();
907 else
908 parseAccessSpecifier();
Daniel Jasperf7935112012-12-03 18:12:45 +0000909 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000910 case tok::kw_if:
911 parseIfThenElse();
Daniel Jasperf7935112012-12-03 18:12:45 +0000912 return;
Alexander Kornienko37d6c942012-12-05 15:06:06 +0000913 case tok::kw_for:
914 case tok::kw_while:
915 parseForOrWhileLoop();
916 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000917 case tok::kw_do:
918 parseDoWhile();
919 return;
920 case tok::kw_switch:
921 parseSwitch();
922 return;
923 case tok::kw_default:
924 nextToken();
925 parseLabel();
926 return;
927 case tok::kw_case:
928 parseCaseLabel();
929 return;
Daniel Jasper04a71a42014-05-08 11:58:24 +0000930 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +0000931 case tok::kw___try:
Daniel Jasper04a71a42014-05-08 11:58:24 +0000932 parseTryCatch();
933 return;
Manuel Klimekae610d12013-01-21 14:32:05 +0000934 case tok::kw_extern:
935 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000936 if (FormatTok->Tok.is(tok::string_literal)) {
Manuel Klimekae610d12013-01-21 14:32:05 +0000937 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000938 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasper65ee3472013-07-31 23:16:02 +0000939 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/false);
Manuel Klimekae610d12013-01-21 14:32:05 +0000940 addUnwrappedLine();
941 return;
942 }
943 }
Daniel Jaspere1e43192014-04-01 12:55:11 +0000944 break;
Daniel Jasperfca735c2015-02-19 16:14:18 +0000945 case tok::kw_export:
946 if (Style.Language == FormatStyle::LK_JavaScript) {
947 parseJavaScriptEs6ImportExport();
948 return;
949 }
950 break;
Daniel Jaspere1e43192014-04-01 12:55:11 +0000951 case tok::identifier:
Daniel Jasper66cb8c52015-05-04 09:22:29 +0000952 if (FormatTok->is(TT_ForEachMacro)) {
Daniel Jaspere1e43192014-04-01 12:55:11 +0000953 parseForOrWhileLoop();
954 return;
955 }
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000956 if (FormatTok->is(TT_MacroBlockBegin)) {
957 parseBlock(/*MustBeDeclaration=*/false, /*AddLevel=*/true,
958 /*MunchSemi=*/false);
959 return;
960 }
Daniel Jasper3d5a7d62016-06-20 18:20:38 +0000961 if (FormatTok->is(Keywords.kw_import)) {
962 if (Style.Language == FormatStyle::LK_JavaScript) {
963 parseJavaScriptEs6ImportExport();
964 return;
965 }
966 if (Style.Language == FormatStyle::LK_Proto) {
967 nextToken();
Daniel Jasper8b61d142016-06-20 20:39:53 +0000968 if (FormatTok->is(tok::kw_public))
969 nextToken();
Daniel Jasper3d5a7d62016-06-20 18:20:38 +0000970 if (!FormatTok->is(tok::string_literal))
971 return;
972 nextToken();
973 if (FormatTok->is(tok::semi))
974 nextToken();
975 addUnwrappedLine();
976 return;
977 }
Daniel Jasper354aa512015-02-19 16:07:32 +0000978 }
Daniel Jasper1dbc2102017-03-31 13:30:24 +0000979 if (Style.isCpp() &&
Daniel Jasper72b33572017-03-31 12:04:37 +0000980 FormatTok->isOneOf(Keywords.kw_signals, Keywords.kw_qsignals,
Daniel Jaspera00de632015-12-01 12:05:04 +0000981 Keywords.kw_slots, Keywords.kw_qslots)) {
Daniel Jasperde0d1f32015-04-24 07:50:34 +0000982 nextToken();
983 if (FormatTok->is(tok::colon)) {
984 nextToken();
985 addUnwrappedLine();
Daniel Jasper31343832016-07-27 10:13:24 +0000986 return;
Daniel Jasperde0d1f32015-04-24 07:50:34 +0000987 }
Daniel Jasper53395402015-04-07 15:04:40 +0000988 }
Manuel Klimekae610d12013-01-21 14:32:05 +0000989 // In all other cases, parse the declaration.
990 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000991 default:
992 break;
Daniel Jasperf7935112012-12-03 18:12:45 +0000993 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000994 do {
Daniel Jaspera7900ad2016-05-08 18:12:22 +0000995 const FormatToken *Previous = getPreviousToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000996 switch (FormatTok->Tok.getKind()) {
Nico Weber372d8dc2013-02-10 20:35:35 +0000997 case tok::at:
998 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000999 if (FormatTok->Tok.is(tok::l_brace))
Nico Weber372d8dc2013-02-10 20:35:35 +00001000 parseBracedList();
1001 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001002 case tok::kw_enum:
Daniel Jaspera7900ad2016-05-08 18:12:22 +00001003 // Ignore if this is part of "template <enum ...".
1004 if (Previous && Previous->is(tok::less)) {
1005 nextToken();
1006 break;
1007 }
1008
Daniel Jasper90cf3802015-06-17 09:44:02 +00001009 // parseEnum falls through and does not yet add an unwrapped line as an
1010 // enum definition can start a structural element.
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001011 if (!parseEnum())
1012 break;
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001013 // This only applies for C++.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001014 if (!Style.isCpp()) {
Daniel Jasper90cf3802015-06-17 09:44:02 +00001015 addUnwrappedLine();
1016 return;
1017 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001018 break;
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001019 case tok::kw_typedef:
1020 nextToken();
Daniel Jasper31f6c542014-12-05 10:42:21 +00001021 if (FormatTok->isOneOf(Keywords.kw_NS_ENUM, Keywords.kw_NS_OPTIONS,
1022 Keywords.kw_CF_ENUM, Keywords.kw_CF_OPTIONS))
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001023 parseEnum();
1024 break;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001025 case tok::kw_struct:
1026 case tok::kw_union:
Manuel Klimek28cacc72013-01-07 18:10:23 +00001027 case tok::kw_class:
Daniel Jasper910807d2015-06-12 04:52:02 +00001028 // parseRecord falls through and does not yet add an unwrapped line as a
1029 // record declaration or definition can start a structural element.
Manuel Klimeke01bab52013-01-15 13:38:33 +00001030 parseRecord();
Daniel Jasper910807d2015-06-12 04:52:02 +00001031 // This does not apply for Java and JavaScript.
1032 if (Style.Language == FormatStyle::LK_Java ||
1033 Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperd5ec65b2016-01-08 07:06:07 +00001034 if (FormatTok->is(tok::semi))
1035 nextToken();
Daniel Jasper910807d2015-06-12 04:52:02 +00001036 addUnwrappedLine();
1037 return;
1038 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00001039 break;
Daniel Jaspere5d74862014-11-26 08:17:08 +00001040 case tok::period:
1041 nextToken();
1042 // In Java, classes have an implicit static member "class".
1043 if (Style.Language == FormatStyle::LK_Java && FormatTok &&
1044 FormatTok->is(tok::kw_class))
1045 nextToken();
Daniel Jasperba52fcb2015-09-28 14:29:45 +00001046 if (Style.Language == FormatStyle::LK_JavaScript && FormatTok &&
1047 FormatTok->Tok.getIdentifierInfo())
1048 // JavaScript only has pseudo keywords, all keywords are allowed to
1049 // appear in "IdentifierName" positions. See http://es5.github.io/#x7.6
1050 nextToken();
Daniel Jaspere5d74862014-11-26 08:17:08 +00001051 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001052 case tok::semi:
1053 nextToken();
1054 addUnwrappedLine();
1055 return;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001056 case tok::r_brace:
1057 addUnwrappedLine();
1058 return;
Daniel Jasperf7935112012-12-03 18:12:45 +00001059 case tok::l_paren:
1060 parseParens();
1061 break;
Daniel Jasper5af04a42015-10-07 03:43:10 +00001062 case tok::kw_operator:
1063 nextToken();
1064 if (FormatTok->isBinaryOperator())
1065 nextToken();
1066 break;
Manuel Klimek516e0542013-09-04 13:25:30 +00001067 case tok::caret:
1068 nextToken();
Daniel Jasper395193c2014-03-28 07:48:59 +00001069 if (FormatTok->Tok.isAnyIdentifier() ||
1070 FormatTok->isSimpleTypeSpecifier())
1071 nextToken();
1072 if (FormatTok->is(tok::l_paren))
1073 parseParens();
1074 if (FormatTok->is(tok::l_brace))
Manuel Klimek516e0542013-09-04 13:25:30 +00001075 parseChildBlock();
Manuel Klimek516e0542013-09-04 13:25:30 +00001076 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001077 case tok::l_brace:
Manuel Klimekab419912013-05-23 09:41:43 +00001078 if (!tryToParseBracedList()) {
1079 // A block outside of parentheses must be the last part of a
1080 // structural element.
1081 // FIXME: Figure out cases where this is not true, and add projections
1082 // for them (the one we know is missing are lambdas).
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001083 if (Style.BraceWrapping.AfterFunction)
Manuel Klimekab419912013-05-23 09:41:43 +00001084 addUnwrappedLine();
Alexander Kornienko3cfa9732013-11-20 16:33:05 +00001085 FormatTok->Type = TT_FunctionLBrace;
Nico Weber9096fc02013-06-26 00:30:14 +00001086 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001087 addUnwrappedLine();
Manuel Klimekab419912013-05-23 09:41:43 +00001088 return;
1089 }
1090 // Otherwise this was a braced init list, and the structural
1091 // element continues.
1092 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001093 case tok::kw_try:
1094 // We arrive here when parsing function-try blocks.
1095 parseTryCatch();
1096 return;
Daniel Jasper40e19212013-05-29 13:16:10 +00001097 case tok::identifier: {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +00001098 if (FormatTok->is(TT_MacroBlockEnd)) {
1099 addUnwrappedLine();
1100 return;
1101 }
1102
Martin Probst973ff792017-04-27 13:07:24 +00001103 // Function declarations (as opposed to function expressions) are parsed
1104 // on their own unwrapped line by continuing this loop. Function
1105 // expressions (functions that are not on their own line) must not create
1106 // a new unwrapped line, so they are special cased below.
1107 size_t TokenCount = Line->Tokens.size();
Daniel Jasper9326f912015-05-05 08:40:32 +00001108 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst973ff792017-04-27 13:07:24 +00001109 FormatTok->is(Keywords.kw_function) &&
1110 (TokenCount > 1 || (TokenCount == 1 && !Line->Tokens.front().Tok->is(
1111 Keywords.kw_async)))) {
Daniel Jasper069e5f42014-05-20 11:14:57 +00001112 tryToParseJSFunction();
1113 break;
1114 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001115 if ((Style.Language == FormatStyle::LK_JavaScript ||
1116 Style.Language == FormatStyle::LK_Java) &&
1117 FormatTok->is(Keywords.kw_interface)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001118 if (Style.Language == FormatStyle::LK_JavaScript) {
1119 // In JavaScript/TypeScript, "interface" can be used as a standalone
1120 // identifier, e.g. in `var interface = 1;`. If "interface" is
1121 // followed by another identifier, it is very like to be an actual
1122 // interface declaration.
1123 unsigned StoredPosition = Tokens->getPosition();
1124 FormatToken *Next = Tokens->getNextToken();
1125 FormatTok = Tokens->setPosition(StoredPosition);
Martin Probst533965c2016-04-19 18:19:06 +00001126 if (Next && !mustBeJSIdent(Keywords, Next)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001127 nextToken();
1128 break;
1129 }
1130 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001131 parseRecord();
Daniel Jasper259188b2015-06-12 04:56:34 +00001132 addUnwrappedLine();
Daniel Jasper5c235c02015-07-06 14:26:04 +00001133 return;
Daniel Jasper9326f912015-05-05 08:40:32 +00001134 }
1135
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00001136 // See if the following token should start a new unwrapped line.
Daniel Jasper9326f912015-05-05 08:40:32 +00001137 StringRef Text = FormatTok->TokenText;
Daniel Jasperf7935112012-12-03 18:12:45 +00001138 nextToken();
Daniel Jasper83709082015-02-18 17:14:05 +00001139 if (Line->Tokens.size() == 1 &&
1140 // JS doesn't have macros, and within classes colons indicate fields,
1141 // not labels.
Daniel Jasper676e5162015-04-07 14:36:33 +00001142 Style.Language != FormatStyle::LK_JavaScript) {
1143 if (FormatTok->Tok.is(tok::colon) && !Line->MustBeDeclaration) {
Daniel Jasper40609472016-04-06 15:02:46 +00001144 Line->Tokens.begin()->Tok->MustBreakBefore = true;
Alexander Kornienkode644272013-04-08 22:16:06 +00001145 parseLabel();
1146 return;
1147 }
Daniel Jasper680b09b2014-11-05 10:48:04 +00001148 // Recognize function-like macro usages without trailing semicolon as
Daniel Jasper83709082015-02-18 17:14:05 +00001149 // well as free-standing macros like Q_OBJECT.
Daniel Jasper680b09b2014-11-05 10:48:04 +00001150 bool FunctionLike = FormatTok->is(tok::l_paren);
1151 if (FunctionLike)
Alexander Kornienkode644272013-04-08 22:16:06 +00001152 parseParens();
Daniel Jaspere60cba12015-05-13 11:35:53 +00001153
1154 bool FollowedByNewline =
1155 CommentsBeforeNextToken.empty()
1156 ? FormatTok->NewlinesBefore > 0
1157 : CommentsBeforeNextToken.front()->NewlinesBefore > 0;
1158
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001159 if (FollowedByNewline && (Text.size() >= 5 || FunctionLike) &&
Daniel Jasper680b09b2014-11-05 10:48:04 +00001160 tokenCanStartNewLine(FormatTok->Tok) && Text == Text.upper()) {
Daniel Jasper40e19212013-05-29 13:16:10 +00001161 addUnwrappedLine();
Daniel Jasper41a0f782013-05-29 14:09:17 +00001162 return;
Alexander Kornienkode644272013-04-08 22:16:06 +00001163 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001164 }
1165 break;
Daniel Jasper40e19212013-05-29 13:16:10 +00001166 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001167 case tok::equal:
Manuel Klimek79e06082015-05-21 12:23:34 +00001168 // Fat arrows (=>) have tok::TokenKind tok::equal but TokenType
1169 // TT_JsFatArrow. The always start an expression or a child block if
1170 // followed by a curly.
1171 if (FormatTok->is(TT_JsFatArrow)) {
1172 nextToken();
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001173 if (FormatTok->is(tok::l_brace))
Manuel Klimek79e06082015-05-21 12:23:34 +00001174 parseChildBlock();
Manuel Klimek79e06082015-05-21 12:23:34 +00001175 break;
1176 }
1177
Daniel Jaspere25509f2012-12-17 11:29:41 +00001178 nextToken();
Krasimir Georgievff747be2017-06-27 13:43:07 +00001179 if (FormatTok->Tok.is(tok::l_brace))
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001180 parseBracedList();
Krasimir Georgievff747be2017-06-27 13:43:07 +00001181 else if (Style.Language == FormatStyle::LK_Proto &&
1182 FormatTok->Tok.is(tok::less))
1183 parseBracedList(/*ClosingBraceKind=*/tok::greater);
Daniel Jaspere25509f2012-12-17 11:29:41 +00001184 break;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001185 case tok::l_square:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001186 parseSquare();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001187 break;
Daniel Jasper6acf5132015-03-12 14:44:29 +00001188 case tok::kw_new:
1189 parseNew();
1190 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001191 default:
1192 nextToken();
1193 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001194 }
1195 } while (!eof());
1196}
1197
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001198bool UnwrappedLineParser::tryToParseLambda() {
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001199 if (!Style.isCpp()) {
Daniel Jasper1feab0f2015-06-02 15:31:37 +00001200 nextToken();
1201 return false;
1202 }
Daniel Jasperb9a49902016-01-09 15:56:28 +00001203 const FormatToken* Previous = getPreviousToken();
1204 if (Previous &&
1205 (Previous->isOneOf(tok::identifier, tok::kw_operator, tok::kw_new,
1206 tok::kw_delete) ||
1207 Previous->closesScope() || Previous->isSimpleTypeSpecifier())) {
Daniel Jasperbf02b2c12013-09-05 11:49:39 +00001208 nextToken();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001209 return false;
Daniel Jasperbf02b2c12013-09-05 11:49:39 +00001210 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001211 assert(FormatTok->is(tok::l_square));
1212 FormatToken &LSquare = *FormatTok;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001213 if (!tryToParseLambdaIntroducer())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001214 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001215
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00001216 while (FormatTok->isNot(tok::l_brace)) {
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001217 if (FormatTok->isSimpleTypeSpecifier()) {
1218 nextToken();
1219 continue;
1220 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001221 switch (FormatTok->Tok.getKind()) {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001222 case tok::l_brace:
1223 break;
1224 case tok::l_paren:
1225 parseParens();
1226 break;
Daniel Jasperbcb55ee2014-11-21 14:08:38 +00001227 case tok::amp:
1228 case tok::star:
1229 case tok::kw_const:
Daniel Jasper3431b752014-12-08 13:22:37 +00001230 case tok::comma:
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001231 case tok::less:
1232 case tok::greater:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001233 case tok::identifier:
Daniel Jasper5eaa0092015-08-13 13:37:08 +00001234 case tok::numeric_constant:
Daniel Jasper1067ab02014-02-11 10:16:55 +00001235 case tok::coloncolon:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001236 case tok::kw_mutable:
Daniel Jasper81a20782014-03-10 10:02:02 +00001237 nextToken();
1238 break;
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001239 case tok::arrow:
Daniel Jasper6f2b88a2015-06-05 13:18:09 +00001240 FormatTok->Type = TT_LambdaArrow;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001241 nextToken();
1242 break;
1243 default:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001244 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001245 }
1246 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001247 LSquare.Type = TT_LambdaLSquare;
Manuel Klimek516e0542013-09-04 13:25:30 +00001248 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001249 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001250}
1251
1252bool UnwrappedLineParser::tryToParseLambdaIntroducer() {
1253 nextToken();
1254 if (FormatTok->is(tok::equal)) {
1255 nextToken();
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001256 if (FormatTok->is(tok::r_square)) {
1257 nextToken();
1258 return true;
1259 }
1260 if (FormatTok->isNot(tok::comma))
1261 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001262 nextToken();
1263 } else if (FormatTok->is(tok::amp)) {
1264 nextToken();
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001265 if (FormatTok->is(tok::r_square)) {
1266 nextToken();
1267 return true;
1268 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001269 if (!FormatTok->isOneOf(tok::comma, tok::identifier)) {
1270 return false;
1271 }
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001272 if (FormatTok->is(tok::comma))
1273 nextToken();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001274 } else if (FormatTok->is(tok::r_square)) {
1275 nextToken();
1276 return true;
1277 }
1278 do {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001279 if (FormatTok->is(tok::amp))
1280 nextToken();
1281 if (!FormatTok->isOneOf(tok::identifier, tok::kw_this))
1282 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001283 nextToken();
Daniel Jasperda18fd82014-06-10 06:39:03 +00001284 if (FormatTok->is(tok::ellipsis))
1285 nextToken();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001286 if (FormatTok->is(tok::comma)) {
1287 nextToken();
1288 } else if (FormatTok->is(tok::r_square)) {
1289 nextToken();
1290 return true;
1291 } else {
1292 return false;
1293 }
1294 } while (!eof());
1295 return false;
1296}
1297
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001298void UnwrappedLineParser::tryToParseJSFunction() {
Martin Probst409697e2016-05-29 14:41:07 +00001299 assert(FormatTok->is(Keywords.kw_function) ||
1300 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function));
Martin Probst5f8445b2016-04-24 22:05:09 +00001301 if (FormatTok->is(Keywords.kw_async))
1302 nextToken();
1303 // Consume "function".
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001304 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001305
Daniel Jasper71e50af2016-11-01 06:22:59 +00001306 // Consume * (generator function). Treat it like C++'s overloaded operators.
1307 if (FormatTok->is(tok::star)) {
1308 FormatTok->Type = TT_OverloadedOperator;
Martin Probst5f8445b2016-04-24 22:05:09 +00001309 nextToken();
Daniel Jasper71e50af2016-11-01 06:22:59 +00001310 }
Martin Probst5f8445b2016-04-24 22:05:09 +00001311
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001312 // Consume function name.
1313 if (FormatTok->is(tok::identifier))
Daniel Jasperfca735c2015-02-19 16:14:18 +00001314 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001315
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001316 if (FormatTok->isNot(tok::l_paren))
1317 return;
Manuel Klimek79e06082015-05-21 12:23:34 +00001318
1319 // Parse formal parameter list.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001320 parseParens();
Manuel Klimek79e06082015-05-21 12:23:34 +00001321
1322 if (FormatTok->is(tok::colon)) {
1323 // Parse a type definition.
1324 nextToken();
1325
1326 // Eat the type declaration. For braced inline object types, balance braces,
1327 // otherwise just parse until finding an l_brace for the function body.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001328 if (FormatTok->is(tok::l_brace))
1329 tryToParseBracedList();
1330 else
Martin Probstaf16c502017-01-04 13:36:43 +00001331 while (!FormatTok->isOneOf(tok::l_brace, tok::semi) && !eof())
Manuel Klimek79e06082015-05-21 12:23:34 +00001332 nextToken();
Manuel Klimek79e06082015-05-21 12:23:34 +00001333 }
1334
Martin Probstaf16c502017-01-04 13:36:43 +00001335 if (FormatTok->is(tok::semi))
1336 return;
1337
Manuel Klimek79e06082015-05-21 12:23:34 +00001338 parseChildBlock();
1339}
1340
Daniel Jasper3c883d12015-05-18 14:49:19 +00001341bool UnwrappedLineParser::tryToParseBracedList() {
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001342 if (FormatTok->BlockKind == BK_Unknown)
Daniel Jasper3c883d12015-05-18 14:49:19 +00001343 calculateBraceTypes();
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001344 assert(FormatTok->BlockKind != BK_Unknown);
1345 if (FormatTok->BlockKind == BK_Block)
Manuel Klimekab419912013-05-23 09:41:43 +00001346 return false;
1347 parseBracedList();
1348 return true;
1349}
1350
Krasimir Georgievff747be2017-06-27 13:43:07 +00001351bool UnwrappedLineParser::parseBracedList(bool ContinueOnSemicolons,
1352 tok::TokenKind ClosingBraceKind) {
Daniel Jasper015ed022013-09-13 09:20:45 +00001353 bool HasError = false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001354 nextToken();
1355
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001356 // FIXME: Once we have an expression parser in the UnwrappedLineParser,
1357 // replace this by using parseAssigmentExpression() inside.
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001358 do {
Manuel Klimek79e06082015-05-21 12:23:34 +00001359 if (Style.Language == FormatStyle::LK_JavaScript) {
Martin Probst409697e2016-05-29 14:41:07 +00001360 if (FormatTok->is(Keywords.kw_function) ||
1361 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001362 tryToParseJSFunction();
1363 continue;
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001364 }
1365 if (FormatTok->is(TT_JsFatArrow)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001366 nextToken();
1367 // Fat arrows can be followed by simple expressions or by child blocks
1368 // in curly braces.
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001369 if (FormatTok->is(tok::l_brace)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001370 parseChildBlock();
1371 continue;
1372 }
1373 }
Martin Probst8e3eba02017-02-07 16:33:13 +00001374 if (FormatTok->is(tok::l_brace)) {
1375 // Could be a method inside of a braced list `{a() { return 1; }}`.
1376 if (tryToParseBracedList())
1377 continue;
1378 parseChildBlock();
1379 }
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001380 }
Krasimir Georgievff747be2017-06-27 13:43:07 +00001381 if (FormatTok->Tok.getKind() == ClosingBraceKind) {
1382 nextToken();
1383 return !HasError;
1384 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001385 switch (FormatTok->Tok.getKind()) {
Manuel Klimek516e0542013-09-04 13:25:30 +00001386 case tok::caret:
1387 nextToken();
1388 if (FormatTok->is(tok::l_brace)) {
1389 parseChildBlock();
1390 }
1391 break;
1392 case tok::l_square:
1393 tryToParseLambda();
1394 break;
Daniel Jaspera87af7a2015-06-30 11:32:22 +00001395 case tok::l_paren:
1396 parseParens();
Daniel Jasperf46dec82015-03-31 14:34:15 +00001397 // JavaScript can just have free standing methods and getters/setters in
1398 // object literals. Detect them by a "{" following ")".
1399 if (Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperf46dec82015-03-31 14:34:15 +00001400 if (FormatTok->is(tok::l_brace))
1401 parseChildBlock();
1402 break;
1403 }
Daniel Jasperf46dec82015-03-31 14:34:15 +00001404 break;
Martin Probst8e3eba02017-02-07 16:33:13 +00001405 case tok::l_brace:
1406 // Assume there are no blocks inside a braced init list apart
1407 // from the ones we explicitly parse out (like lambdas).
1408 FormatTok->BlockKind = BK_BracedInit;
1409 parseBracedList();
1410 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001411 case tok::semi:
Daniel Jasperb9a49902016-01-09 15:56:28 +00001412 // JavaScript (or more precisely TypeScript) can have semicolons in braced
1413 // lists (in so-called TypeMemberLists). Thus, the semicolon cannot be
1414 // used for error recovery if we have otherwise determined that this is
1415 // a braced list.
1416 if (Style.Language == FormatStyle::LK_JavaScript) {
1417 nextToken();
1418 break;
1419 }
Daniel Jasper015ed022013-09-13 09:20:45 +00001420 HasError = true;
1421 if (!ContinueOnSemicolons)
1422 return !HasError;
1423 nextToken();
1424 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001425 case tok::comma:
1426 nextToken();
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001427 break;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001428 default:
1429 nextToken();
1430 break;
1431 }
1432 } while (!eof());
Daniel Jasper015ed022013-09-13 09:20:45 +00001433 return false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001434}
1435
Daniel Jasperf7935112012-12-03 18:12:45 +00001436void UnwrappedLineParser::parseParens() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001437 assert(FormatTok->Tok.is(tok::l_paren) && "'(' expected.");
Daniel Jasperf7935112012-12-03 18:12:45 +00001438 nextToken();
1439 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001440 switch (FormatTok->Tok.getKind()) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001441 case tok::l_paren:
1442 parseParens();
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001443 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_brace))
1444 parseChildBlock();
Daniel Jasperf7935112012-12-03 18:12:45 +00001445 break;
1446 case tok::r_paren:
1447 nextToken();
1448 return;
Daniel Jasper393564f2013-05-31 14:56:29 +00001449 case tok::r_brace:
1450 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1451 return;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001452 case tok::l_square:
1453 tryToParseLambda();
1454 break;
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001455 case tok::l_brace:
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001456 if (!tryToParseBracedList())
Manuel Klimekf017dc02013-09-04 13:34:14 +00001457 parseChildBlock();
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001458 break;
Nico Weber372d8dc2013-02-10 20:35:35 +00001459 case tok::at:
1460 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001461 if (FormatTok->Tok.is(tok::l_brace))
Nico Weber372d8dc2013-02-10 20:35:35 +00001462 parseBracedList();
1463 break;
Martin Probst1027fb82017-02-07 14:05:30 +00001464 case tok::kw_class:
1465 if (Style.Language == FormatStyle::LK_JavaScript)
1466 parseRecord(/*ParseAsExpr=*/true);
1467 else
1468 nextToken();
1469 break;
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001470 case tok::identifier:
1471 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst409697e2016-05-29 14:41:07 +00001472 (FormatTok->is(Keywords.kw_function) ||
1473 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)))
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001474 tryToParseJSFunction();
1475 else
1476 nextToken();
1477 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001478 default:
1479 nextToken();
1480 break;
1481 }
1482 } while (!eof());
1483}
1484
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001485void UnwrappedLineParser::parseSquare() {
1486 assert(FormatTok->Tok.is(tok::l_square) && "'[' expected.");
1487 if (tryToParseLambda())
1488 return;
1489 do {
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001490 switch (FormatTok->Tok.getKind()) {
1491 case tok::l_paren:
1492 parseParens();
1493 break;
1494 case tok::r_square:
1495 nextToken();
1496 return;
1497 case tok::r_brace:
1498 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1499 return;
1500 case tok::l_square:
1501 parseSquare();
1502 break;
1503 case tok::l_brace: {
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001504 if (!tryToParseBracedList())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001505 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001506 break;
1507 }
1508 case tok::at:
1509 nextToken();
1510 if (FormatTok->Tok.is(tok::l_brace))
1511 parseBracedList();
1512 break;
1513 default:
1514 nextToken();
1515 break;
1516 }
1517 } while (!eof());
1518}
1519
Daniel Jasperf7935112012-12-03 18:12:45 +00001520void UnwrappedLineParser::parseIfThenElse() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001521 assert(FormatTok->Tok.is(tok::kw_if) && "'if' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001522 nextToken();
Daniel Jasper6a7d5a72017-06-19 07:40:49 +00001523 if (FormatTok->Tok.is(tok::kw_constexpr))
1524 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001525 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimekadededf2013-01-11 18:28:36 +00001526 parseParens();
Daniel Jasperf7935112012-12-03 18:12:45 +00001527 bool NeedsUnwrappedLine = false;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001528 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001529 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001530 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001531 if (Style.BraceWrapping.BeforeElse)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001532 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001533 else
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001534 NeedsUnwrappedLine = true;
Daniel Jasperf7935112012-12-03 18:12:45 +00001535 } else {
1536 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001537 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001538 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001539 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001540 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001541 if (FormatTok->Tok.is(tok::kw_else)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001542 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001543 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001544 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001545 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001546 addUnwrappedLine();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001547 } else if (FormatTok->Tok.is(tok::kw_if)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001548 parseIfThenElse();
1549 } else {
1550 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001551 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001552 parseStructuralElement();
Daniel Jasper451544a2016-05-19 06:30:48 +00001553 if (FormatTok->is(tok::eof))
1554 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001555 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001556 }
1557 } else if (NeedsUnwrappedLine) {
1558 addUnwrappedLine();
1559 }
1560}
1561
Daniel Jasper04a71a42014-05-08 11:58:24 +00001562void UnwrappedLineParser::parseTryCatch() {
Nico Weberfac23712015-02-04 15:26:27 +00001563 assert(FormatTok->isOneOf(tok::kw_try, tok::kw___try) && "'try' expected");
Daniel Jasper04a71a42014-05-08 11:58:24 +00001564 nextToken();
1565 bool NeedsUnwrappedLine = false;
1566 if (FormatTok->is(tok::colon)) {
1567 // We are in a function try block, what comes is an initializer list.
1568 nextToken();
1569 while (FormatTok->is(tok::identifier)) {
1570 nextToken();
1571 if (FormatTok->is(tok::l_paren))
1572 parseParens();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001573 if (FormatTok->is(tok::comma))
1574 nextToken();
1575 }
1576 }
Daniel Jaspere189d462015-01-14 10:48:41 +00001577 // Parse try with resource.
1578 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_paren)) {
1579 parseParens();
1580 }
Daniel Jasper04a71a42014-05-08 11:58:24 +00001581 if (FormatTok->is(tok::l_brace)) {
1582 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1583 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001584 if (Style.BraceWrapping.BeforeCatch) {
Daniel Jasper04a71a42014-05-08 11:58:24 +00001585 addUnwrappedLine();
1586 } else {
1587 NeedsUnwrappedLine = true;
1588 }
1589 } else if (!FormatTok->is(tok::kw_catch)) {
1590 // The C++ standard requires a compound-statement after a try.
1591 // If there's none, we try to assume there's a structuralElement
1592 // and try to continue.
Daniel Jasper04a71a42014-05-08 11:58:24 +00001593 addUnwrappedLine();
1594 ++Line->Level;
1595 parseStructuralElement();
1596 --Line->Level;
1597 }
Nico Weber33381f52015-02-07 01:57:32 +00001598 while (1) {
1599 if (FormatTok->is(tok::at))
1600 nextToken();
1601 if (!(FormatTok->isOneOf(tok::kw_catch, Keywords.kw___except,
1602 tok::kw___finally) ||
1603 ((Style.Language == FormatStyle::LK_Java ||
1604 Style.Language == FormatStyle::LK_JavaScript) &&
1605 FormatTok->is(Keywords.kw_finally)) ||
1606 (FormatTok->Tok.isObjCAtKeyword(tok::objc_catch) ||
1607 FormatTok->Tok.isObjCAtKeyword(tok::objc_finally))))
1608 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001609 nextToken();
1610 while (FormatTok->isNot(tok::l_brace)) {
1611 if (FormatTok->is(tok::l_paren)) {
1612 parseParens();
1613 continue;
1614 }
Daniel Jasper2bd7a642015-01-19 10:50:51 +00001615 if (FormatTok->isOneOf(tok::semi, tok::r_brace, tok::eof))
Daniel Jasper04a71a42014-05-08 11:58:24 +00001616 return;
1617 nextToken();
1618 }
1619 NeedsUnwrappedLine = false;
1620 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1621 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001622 if (Style.BraceWrapping.BeforeCatch)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001623 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001624 else
Daniel Jasper04a71a42014-05-08 11:58:24 +00001625 NeedsUnwrappedLine = true;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001626 }
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001627 if (NeedsUnwrappedLine)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001628 addUnwrappedLine();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001629}
1630
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001631void UnwrappedLineParser::parseNamespace() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001632 assert(FormatTok->Tok.is(tok::kw_namespace) && "'namespace' expected");
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001633
1634 const FormatToken &InitialToken = *FormatTok;
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001635 nextToken();
Saleem Abdulrasool328085f2015-10-30 05:07:56 +00001636 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon))
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001637 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001638 if (FormatTok->Tok.is(tok::l_brace)) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001639 if (ShouldBreakBeforeBrace(Style, InitialToken))
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001640 addUnwrappedLine();
1641
Daniel Jasper65ee3472013-07-31 23:16:02 +00001642 bool AddLevel = Style.NamespaceIndentation == FormatStyle::NI_All ||
1643 (Style.NamespaceIndentation == FormatStyle::NI_Inner &&
1644 DeclarationScopeStack.size() > 1);
1645 parseBlock(/*MustBeDeclaration=*/true, AddLevel);
Manuel Klimek046b9302013-02-06 16:08:09 +00001646 // Munch the semicolon after a namespace. This is more common than one would
1647 // think. Puttin the semicolon into its own line is very ugly.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001648 if (FormatTok->Tok.is(tok::semi))
Manuel Klimek046b9302013-02-06 16:08:09 +00001649 nextToken();
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001650 addUnwrappedLine();
1651 }
1652 // FIXME: Add error handling.
1653}
1654
Daniel Jasper6acf5132015-03-12 14:44:29 +00001655void UnwrappedLineParser::parseNew() {
1656 assert(FormatTok->is(tok::kw_new) && "'new' expected");
1657 nextToken();
1658 if (Style.Language != FormatStyle::LK_Java)
1659 return;
1660
1661 // In Java, we can parse everything up to the parens, which aren't optional.
1662 do {
1663 // There should not be a ;, { or } before the new's open paren.
1664 if (FormatTok->isOneOf(tok::semi, tok::l_brace, tok::r_brace))
1665 return;
1666
1667 // Consume the parens.
1668 if (FormatTok->is(tok::l_paren)) {
1669 parseParens();
1670
1671 // If there is a class body of an anonymous class, consume that as child.
1672 if (FormatTok->is(tok::l_brace))
1673 parseChildBlock();
1674 return;
1675 }
1676 nextToken();
1677 } while (!eof());
1678}
1679
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001680void UnwrappedLineParser::parseForOrWhileLoop() {
Daniel Jasper66cb8c52015-05-04 09:22:29 +00001681 assert(FormatTok->isOneOf(tok::kw_for, tok::kw_while, TT_ForEachMacro) &&
Daniel Jaspere1e43192014-04-01 12:55:11 +00001682 "'for', 'while' or foreach macro expected");
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001683 nextToken();
Martin Probsta050f412017-05-18 21:19:29 +00001684 // JS' for await ( ...
Martin Probstbd49e322017-05-15 19:33:20 +00001685 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probsta050f412017-05-18 21:19:29 +00001686 FormatTok->is(Keywords.kw_await))
Martin Probstbd49e322017-05-15 19:33:20 +00001687 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001688 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001689 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001690 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001691 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001692 parseBlock(/*MustBeDeclaration=*/false);
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001693 addUnwrappedLine();
1694 } else {
1695 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001696 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001697 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001698 --Line->Level;
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001699 }
1700}
1701
Daniel Jasperf7935112012-12-03 18:12:45 +00001702void UnwrappedLineParser::parseDoWhile() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001703 assert(FormatTok->Tok.is(tok::kw_do) && "'do' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001704 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001705 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001706 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001707 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001708 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001709 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001710 } else {
1711 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001712 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001713 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001714 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001715 }
1716
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001717 // FIXME: Add error handling.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001718 if (!FormatTok->Tok.is(tok::kw_while)) {
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001719 addUnwrappedLine();
1720 return;
1721 }
1722
Daniel Jasperf7935112012-12-03 18:12:45 +00001723 nextToken();
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001724 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +00001725}
1726
1727void UnwrappedLineParser::parseLabel() {
Daniel Jasperf7935112012-12-03 18:12:45 +00001728 nextToken();
Manuel Klimek52b15152013-01-09 15:25:02 +00001729 unsigned OldLineLevel = Line->Level;
Daniel Jaspera1275122013-03-20 10:23:53 +00001730 if (Line->Level > 1 || (!Line->InPPDirective && Line->Level > 0))
Manuel Klimek52b15152013-01-09 15:25:02 +00001731 --Line->Level;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001732 if (CommentsBeforeNextToken.empty() && FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001733 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001734 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001735 if (FormatTok->Tok.is(tok::kw_break)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001736 if (Style.BraceWrapping.AfterControlStatement)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001737 addUnwrappedLine();
1738 parseStructuralElement();
1739 }
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001740 addUnwrappedLine();
1741 } else {
Daniel Jasper1fe0d5c2015-05-06 15:19:47 +00001742 if (FormatTok->is(tok::semi))
1743 nextToken();
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001744 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001745 }
Manuel Klimek52b15152013-01-09 15:25:02 +00001746 Line->Level = OldLineLevel;
Daniel Jasper2cce7b72016-04-06 16:41:39 +00001747 if (FormatTok->isNot(tok::l_brace)) {
Daniel Jasper40609472016-04-06 15:02:46 +00001748 parseStructuralElement();
Daniel Jasper2cce7b72016-04-06 16:41:39 +00001749 addUnwrappedLine();
1750 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001751}
1752
1753void UnwrappedLineParser::parseCaseLabel() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001754 assert(FormatTok->Tok.is(tok::kw_case) && "'case' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001755 // FIXME: fix handling of complex expressions here.
1756 do {
1757 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001758 } while (!eof() && !FormatTok->Tok.is(tok::colon));
Daniel Jasperf7935112012-12-03 18:12:45 +00001759 parseLabel();
1760}
1761
1762void UnwrappedLineParser::parseSwitch() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001763 assert(FormatTok->Tok.is(tok::kw_switch) && "'switch' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001764 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001765 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001766 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001767 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001768 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Daniel Jasper65ee3472013-07-31 23:16:02 +00001769 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001770 addUnwrappedLine();
1771 } else {
1772 addUnwrappedLine();
Daniel Jasper516d7972013-07-25 11:31:57 +00001773 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001774 parseStructuralElement();
Daniel Jasper516d7972013-07-25 11:31:57 +00001775 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001776 }
1777}
1778
1779void UnwrappedLineParser::parseAccessSpecifier() {
1780 nextToken();
Daniel Jasper84c47a12013-11-23 17:53:41 +00001781 // Understand Qt's slots.
Daniel Jasper53395402015-04-07 15:04:40 +00001782 if (FormatTok->isOneOf(Keywords.kw_slots, Keywords.kw_qslots))
Daniel Jasper84c47a12013-11-23 17:53:41 +00001783 nextToken();
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00001784 // Otherwise, we don't know what it is, and we'd better keep the next token.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001785 if (FormatTok->Tok.is(tok::colon))
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00001786 nextToken();
Daniel Jasperf7935112012-12-03 18:12:45 +00001787 addUnwrappedLine();
1788}
1789
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001790bool UnwrappedLineParser::parseEnum() {
Daniel Jasper6be0f552014-11-13 15:56:28 +00001791 // Won't be 'enum' for NS_ENUMs.
1792 if (FormatTok->Tok.is(tok::kw_enum))
Daniel Jasperccb68b42014-11-19 22:38:18 +00001793 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001794
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001795 // In TypeScript, "enum" can also be used as property name, e.g. in interface
1796 // declarations. An "enum" keyword followed by a colon would be a syntax
1797 // error and thus assume it is just an identifier.
Daniel Jasper87379302016-02-03 05:33:44 +00001798 if (Style.Language == FormatStyle::LK_JavaScript &&
1799 FormatTok->isOneOf(tok::colon, tok::question))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001800 return false;
1801
Daniel Jasper2b41a822013-08-20 12:42:50 +00001802 // Eat up enum class ...
Daniel Jasperb05a81d2014-05-09 13:11:16 +00001803 if (FormatTok->Tok.is(tok::kw_class) || FormatTok->Tok.is(tok::kw_struct))
1804 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001805
Daniel Jasper786a5502013-09-06 21:32:35 +00001806 while (FormatTok->Tok.getIdentifierInfo() ||
Daniel Jasperccb68b42014-11-19 22:38:18 +00001807 FormatTok->isOneOf(tok::colon, tok::coloncolon, tok::less,
1808 tok::greater, tok::comma, tok::question)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00001809 nextToken();
1810 // We can have macros or attributes in between 'enum' and the enum name.
Daniel Jasperccb68b42014-11-19 22:38:18 +00001811 if (FormatTok->is(tok::l_paren))
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001812 parseParens();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001813 if (FormatTok->is(tok::identifier)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00001814 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001815 // If there are two identifiers in a row, this is likely an elaborate
1816 // return type. In Java, this can be "implements", etc.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001817 if (Style.isCpp() && FormatTok->is(tok::identifier))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001818 return false;
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001819 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001820 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00001821
1822 // Just a declaration or something is wrong.
Daniel Jasperccb68b42014-11-19 22:38:18 +00001823 if (FormatTok->isNot(tok::l_brace))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001824 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00001825 FormatTok->BlockKind = BK_Block;
1826
1827 if (Style.Language == FormatStyle::LK_Java) {
1828 // Java enums are different.
1829 parseJavaEnumBody();
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001830 return true;
1831 }
1832 if (Style.Language == FormatStyle::LK_Proto) {
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001833 parseBlock(/*MustBeDeclaration=*/true);
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001834 return true;
Manuel Klimek2cec0192013-01-21 19:17:52 +00001835 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00001836
1837 // Parse enum body.
1838 bool HasError = !parseBracedList(/*ContinueOnSemicolons=*/true);
1839 if (HasError) {
1840 if (FormatTok->is(tok::semi))
1841 nextToken();
1842 addUnwrappedLine();
1843 }
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001844 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00001845
Daniel Jasper90cf3802015-06-17 09:44:02 +00001846 // There is no addUnwrappedLine() here so that we fall through to parsing a
1847 // structural element afterwards. Thus, in "enum A {} n, m;",
Manuel Klimek2cec0192013-01-21 19:17:52 +00001848 // "} n, m;" will end up in one unwrapped line.
Daniel Jasper6be0f552014-11-13 15:56:28 +00001849}
1850
1851void UnwrappedLineParser::parseJavaEnumBody() {
1852 // Determine whether the enum is simple, i.e. does not have a semicolon or
1853 // constants with class bodies. Simple enums can be formatted like braced
1854 // lists, contracted to a single line, etc.
1855 unsigned StoredPosition = Tokens->getPosition();
1856 bool IsSimple = true;
1857 FormatToken *Tok = Tokens->getNextToken();
1858 while (Tok) {
1859 if (Tok->is(tok::r_brace))
1860 break;
1861 if (Tok->isOneOf(tok::l_brace, tok::semi)) {
1862 IsSimple = false;
1863 break;
1864 }
1865 // FIXME: This will also mark enums with braces in the arguments to enum
1866 // constants as "not simple". This is probably fine in practice, though.
1867 Tok = Tokens->getNextToken();
1868 }
1869 FormatTok = Tokens->setPosition(StoredPosition);
1870
1871 if (IsSimple) {
1872 parseBracedList();
Daniel Jasperdf2ff002014-11-02 22:31:39 +00001873 addUnwrappedLine();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001874 return;
1875 }
1876
1877 // Parse the body of a more complex enum.
1878 // First add a line for everything up to the "{".
1879 nextToken();
1880 addUnwrappedLine();
1881 ++Line->Level;
1882
1883 // Parse the enum constants.
1884 while (FormatTok) {
1885 if (FormatTok->is(tok::l_brace)) {
1886 // Parse the constant's class body.
1887 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
1888 /*MunchSemi=*/false);
1889 } else if (FormatTok->is(tok::l_paren)) {
1890 parseParens();
1891 } else if (FormatTok->is(tok::comma)) {
1892 nextToken();
1893 addUnwrappedLine();
1894 } else if (FormatTok->is(tok::semi)) {
1895 nextToken();
1896 addUnwrappedLine();
1897 break;
1898 } else if (FormatTok->is(tok::r_brace)) {
1899 addUnwrappedLine();
1900 break;
1901 } else {
1902 nextToken();
1903 }
1904 }
1905
1906 // Parse the class body after the enum's ";" if any.
1907 parseLevel(/*HasOpeningBrace=*/true);
1908 nextToken();
1909 --Line->Level;
1910 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001911}
1912
Martin Probst1027fb82017-02-07 14:05:30 +00001913void UnwrappedLineParser::parseRecord(bool ParseAsExpr) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001914 const FormatToken &InitialToken = *FormatTok;
Manuel Klimek28cacc72013-01-07 18:10:23 +00001915 nextToken();
Daniel Jasper04785d02015-05-06 14:03:02 +00001916
Daniel Jasper04785d02015-05-06 14:03:02 +00001917 // The actual identifier can be a nested name specifier, and in macros
1918 // it is often token-pasted.
1919 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon, tok::hashhash,
1920 tok::kw___attribute, tok::kw___declspec,
1921 tok::kw_alignas) ||
1922 ((Style.Language == FormatStyle::LK_Java ||
1923 Style.Language == FormatStyle::LK_JavaScript) &&
1924 FormatTok->isOneOf(tok::period, tok::comma))) {
1925 bool IsNonMacroIdentifier =
1926 FormatTok->is(tok::identifier) &&
1927 FormatTok->TokenText != FormatTok->TokenText.upper();
Manuel Klimeke01bab52013-01-15 13:38:33 +00001928 nextToken();
1929 // We can have macros or attributes in between 'class' and the class name.
Daniel Jasper04785d02015-05-06 14:03:02 +00001930 if (!IsNonMacroIdentifier && FormatTok->Tok.is(tok::l_paren))
Manuel Klimeke01bab52013-01-15 13:38:33 +00001931 parseParens();
Daniel Jasper04785d02015-05-06 14:03:02 +00001932 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00001933
Daniel Jasper04785d02015-05-06 14:03:02 +00001934 // Note that parsing away template declarations here leads to incorrectly
1935 // accepting function declarations as record declarations.
1936 // In general, we cannot solve this problem. Consider:
1937 // class A<int> B() {}
1938 // which can be a function definition or a class definition when B() is a
1939 // macro. If we find enough real-world cases where this is a problem, we
1940 // can parse for the 'template' keyword in the beginning of the statement,
1941 // and thus rule out the record production in case there is no template
1942 // (this would still leave us with an ambiguity between template function
1943 // and class declarations).
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001944 if (FormatTok->isOneOf(tok::colon, tok::less)) {
1945 while (!eof()) {
Daniel Jasper3c883d12015-05-18 14:49:19 +00001946 if (FormatTok->is(tok::l_brace)) {
1947 calculateBraceTypes(/*ExpectClassBody=*/true);
1948 if (!tryToParseBracedList())
1949 break;
1950 }
Daniel Jasper04785d02015-05-06 14:03:02 +00001951 if (FormatTok->Tok.is(tok::semi))
1952 return;
1953 nextToken();
Manuel Klimeke01bab52013-01-15 13:38:33 +00001954 }
1955 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001956 if (FormatTok->Tok.is(tok::l_brace)) {
Martin Probst1027fb82017-02-07 14:05:30 +00001957 if (ParseAsExpr) {
1958 parseChildBlock();
1959 } else {
1960 if (ShouldBreakBeforeBrace(Style, InitialToken))
1961 addUnwrappedLine();
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001962
Martin Probst1027fb82017-02-07 14:05:30 +00001963 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
1964 /*MunchSemi=*/false);
1965 }
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001966 }
Daniel Jasper90cf3802015-06-17 09:44:02 +00001967 // There is no addUnwrappedLine() here so that we fall through to parsing a
1968 // structural element afterwards. Thus, in "class A {} n, m;",
1969 // "} n, m;" will end up in one unwrapped line.
Manuel Klimek28cacc72013-01-07 18:10:23 +00001970}
1971
Nico Weber8696a8d2013-01-09 21:15:03 +00001972void UnwrappedLineParser::parseObjCProtocolList() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001973 assert(FormatTok->Tok.is(tok::less) && "'<' expected.");
Nico Weber8696a8d2013-01-09 21:15:03 +00001974 do
1975 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001976 while (!eof() && FormatTok->Tok.isNot(tok::greater));
Nico Weber8696a8d2013-01-09 21:15:03 +00001977 nextToken(); // Skip '>'.
1978}
1979
1980void UnwrappedLineParser::parseObjCUntilAtEnd() {
1981 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001982 if (FormatTok->Tok.isObjCAtKeyword(tok::objc_end)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00001983 nextToken();
1984 addUnwrappedLine();
1985 break;
1986 }
Daniel Jaspera15da302013-08-28 08:04:23 +00001987 if (FormatTok->is(tok::l_brace)) {
1988 parseBlock(/*MustBeDeclaration=*/false);
1989 // In ObjC interfaces, nothing should be following the "}".
1990 addUnwrappedLine();
Benjamin Kramere21cb742014-01-08 15:59:42 +00001991 } else if (FormatTok->is(tok::r_brace)) {
1992 // Ignore stray "}". parseStructuralElement doesn't consume them.
1993 nextToken();
1994 addUnwrappedLine();
Daniel Jaspera15da302013-08-28 08:04:23 +00001995 } else {
1996 parseStructuralElement();
1997 }
Nico Weber8696a8d2013-01-09 21:15:03 +00001998 } while (!eof());
1999}
2000
Nico Weber2ce0ac52013-01-09 23:25:37 +00002001void UnwrappedLineParser::parseObjCInterfaceOrImplementation() {
Nico Weber7eecf4b2013-01-09 20:25:35 +00002002 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002003 nextToken(); // interface name
Nico Weber7eecf4b2013-01-09 20:25:35 +00002004
2005 // @interface can be followed by either a base class, or a category.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002006 if (FormatTok->Tok.is(tok::colon)) {
Nico Weber7eecf4b2013-01-09 20:25:35 +00002007 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002008 nextToken(); // base class name
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002009 } else if (FormatTok->Tok.is(tok::l_paren))
Nico Weber7eecf4b2013-01-09 20:25:35 +00002010 // Skip category, if present.
2011 parseParens();
2012
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002013 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002014 parseObjCProtocolList();
Nico Weber7eecf4b2013-01-09 20:25:35 +00002015
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002016 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00002017 if (Style.BraceWrapping.AfterObjCDeclaration)
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002018 addUnwrappedLine();
Nico Weber9096fc02013-06-26 00:30:14 +00002019 parseBlock(/*MustBeDeclaration=*/true);
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002020 }
Nico Weber7eecf4b2013-01-09 20:25:35 +00002021
2022 // With instance variables, this puts '}' on its own line. Without instance
2023 // variables, this ends the @interface line.
2024 addUnwrappedLine();
2025
Nico Weber8696a8d2013-01-09 21:15:03 +00002026 parseObjCUntilAtEnd();
2027}
Nico Weber7eecf4b2013-01-09 20:25:35 +00002028
Nico Weber8696a8d2013-01-09 21:15:03 +00002029void UnwrappedLineParser::parseObjCProtocol() {
2030 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002031 nextToken(); // protocol name
Nico Weber8696a8d2013-01-09 21:15:03 +00002032
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002033 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002034 parseObjCProtocolList();
2035
2036 // Check for protocol declaration.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002037 if (FormatTok->Tok.is(tok::semi)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00002038 nextToken();
2039 return addUnwrappedLine();
2040 }
2041
2042 addUnwrappedLine();
2043 parseObjCUntilAtEnd();
Nico Weber7eecf4b2013-01-09 20:25:35 +00002044}
2045
Daniel Jasperfca735c2015-02-19 16:14:18 +00002046void UnwrappedLineParser::parseJavaScriptEs6ImportExport() {
Martin Probst053f1aa2016-04-19 14:55:37 +00002047 bool IsImport = FormatTok->is(Keywords.kw_import);
2048 assert(IsImport || FormatTok->is(tok::kw_export));
Daniel Jasper354aa512015-02-19 16:07:32 +00002049 nextToken();
Daniel Jasperfca735c2015-02-19 16:14:18 +00002050
Daniel Jasperec05fc72015-05-11 09:14:50 +00002051 // Consume the "default" in "export default class/function".
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002052 if (FormatTok->is(tok::kw_default))
2053 nextToken();
Daniel Jasperec05fc72015-05-11 09:14:50 +00002054
Martin Probst5f8445b2016-04-24 22:05:09 +00002055 // Consume "async function", "function" and "default function", so that these
2056 // get parsed as free-standing JS functions, i.e. do not require a trailing
2057 // semicolon.
2058 if (FormatTok->is(Keywords.kw_async))
2059 nextToken();
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002060 if (FormatTok->is(Keywords.kw_function)) {
2061 nextToken();
2062 return;
2063 }
2064
Martin Probst053f1aa2016-04-19 14:55:37 +00002065 // For imports, `export *`, `export {...}`, consume the rest of the line up
2066 // to the terminating `;`. For everything else, just return and continue
2067 // parsing the structural element, i.e. the declaration or expression for
2068 // `export default`.
2069 if (!IsImport && !FormatTok->isOneOf(tok::l_brace, tok::star) &&
2070 !FormatTok->isStringLiteral())
2071 return;
Daniel Jasperfca735c2015-02-19 16:14:18 +00002072
Martin Probstd40bca42017-01-09 08:56:36 +00002073 while (!eof()) {
2074 if (FormatTok->is(tok::semi))
2075 return;
2076 if (Line->Tokens.size() == 0) {
2077 // Common issue: Automatic Semicolon Insertion wrapped the line, so the
2078 // import statement should terminate.
2079 return;
2080 }
Daniel Jasperefc1a832016-01-07 08:53:35 +00002081 if (FormatTok->is(tok::l_brace)) {
2082 FormatTok->BlockKind = BK_Block;
2083 parseBracedList();
2084 } else {
2085 nextToken();
2086 }
Daniel Jasper354aa512015-02-19 16:07:32 +00002087 }
2088}
2089
Daniel Jasper3b203a62013-09-05 16:05:56 +00002090LLVM_ATTRIBUTE_UNUSED static void printDebugInfo(const UnwrappedLine &Line,
2091 StringRef Prefix = "") {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002092 llvm::dbgs() << Prefix << "Line(" << Line.Level << ")"
2093 << (Line.InPPDirective ? " MACRO" : "") << ": ";
2094 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2095 E = Line.Tokens.end();
2096 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002097 llvm::dbgs() << I->Tok->Tok.getName() << "["
2098 << "T=" << I->Tok->Type
2099 << ", OC=" << I->Tok->OriginalColumn << "] ";
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002100 }
2101 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2102 E = Line.Tokens.end();
2103 I != E; ++I) {
2104 const UnwrappedLineNode &Node = *I;
2105 for (SmallVectorImpl<UnwrappedLine>::const_iterator
2106 I = Node.Children.begin(),
2107 E = Node.Children.end();
2108 I != E; ++I) {
2109 printDebugInfo(*I, "\nChild: ");
2110 }
2111 }
2112 llvm::dbgs() << "\n";
2113}
2114
Daniel Jasperf7935112012-12-03 18:12:45 +00002115void UnwrappedLineParser::addUnwrappedLine() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002116 if (Line->Tokens.empty())
Daniel Jasper7c85fde2013-01-08 14:56:18 +00002117 return;
Manuel Klimekab3dc002013-01-16 12:31:12 +00002118 DEBUG({
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002119 if (CurrentLines == &Lines)
2120 printDebugInfo(*Line);
Manuel Klimekab3dc002013-01-16 12:31:12 +00002121 });
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002122 CurrentLines->push_back(std::move(*Line));
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002123 Line->Tokens.clear();
Krasimir Georgiev85c37042017-03-01 16:38:08 +00002124 Line->MatchingOpeningBlockLineIndex = UnwrappedLine::kInvalidIndex;
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002125 if (CurrentLines == &Lines && !PreprocessorDirectives.empty()) {
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002126 CurrentLines->append(
2127 std::make_move_iterator(PreprocessorDirectives.begin()),
2128 std::make_move_iterator(PreprocessorDirectives.end()));
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002129 PreprocessorDirectives.clear();
2130 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002131}
2132
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002133bool UnwrappedLineParser::eof() const { return FormatTok->Tok.is(tok::eof); }
Daniel Jasperf7935112012-12-03 18:12:45 +00002134
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002135bool UnwrappedLineParser::isOnNewLine(const FormatToken &FormatTok) {
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002136 return (Line->InPPDirective || FormatTok.HasUnescapedNewline) &&
2137 FormatTok.NewlinesBefore > 0;
2138}
2139
Krasimir Georgiev91834222017-01-25 13:58:58 +00002140// Checks if \p FormatTok is a line comment that continues the line comment
2141// section on \p Line.
Krasimir Georgievea222a72017-05-22 10:07:56 +00002142static bool continuesLineCommentSection(const FormatToken &FormatTok,
2143 const UnwrappedLine &Line,
2144 llvm::Regex &CommentPragmasRegex) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002145 if (Line.Tokens.empty())
2146 return false;
Krasimir Georgiev84321612017-01-30 19:18:55 +00002147
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002148 StringRef IndentContent = FormatTok.TokenText;
2149 if (FormatTok.TokenText.startswith("//") ||
2150 FormatTok.TokenText.startswith("/*"))
2151 IndentContent = FormatTok.TokenText.substr(2);
2152 if (CommentPragmasRegex.match(IndentContent))
2153 return false;
2154
Krasimir Georgiev91834222017-01-25 13:58:58 +00002155 // If Line starts with a line comment, then FormatTok continues the comment
Krasimir Georgiev84321612017-01-30 19:18:55 +00002156 // section if its original column is greater or equal to the original start
Krasimir Georgiev91834222017-01-25 13:58:58 +00002157 // column of the line.
2158 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002159 // Define the min column token of a line as follows: if a line ends in '{' or
2160 // contains a '{' followed by a line comment, then the min column token is
2161 // that '{'. Otherwise, the min column token of the line is the first token of
2162 // the line.
2163 //
2164 // If Line starts with a token other than a line comment, then FormatTok
2165 // continues the comment section if its original column is greater than the
2166 // original start column of the min column token of the line.
Krasimir Georgiev91834222017-01-25 13:58:58 +00002167 //
2168 // For example, the second line comment continues the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002169 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002170 // // first line
2171 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002172 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002173 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002174 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002175 // // first line
2176 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002177 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002178 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002179 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002180 // int i; // first line
2181 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002182 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002183 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002184 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002185 // do { // first line
2186 // // second line
2187 // int i;
2188 // } while (true);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002189 //
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002190 // and:
2191 //
2192 // enum {
2193 // a, // first line
2194 // // second line
2195 // b
2196 // };
2197 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002198 // The second line comment doesn't continue the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002199 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002200 // // first line
2201 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002202 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002203 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002204 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002205 // int i; // first line
2206 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002207 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002208 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002209 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002210 // do { // first line
2211 // // second line
2212 // int i;
2213 // } while (true);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002214 //
2215 // and:
2216 //
2217 // enum {
2218 // a, // first line
2219 // // second line
2220 // };
Krasimir Georgiev84321612017-01-30 19:18:55 +00002221 const FormatToken *MinColumnToken = Line.Tokens.front().Tok;
2222
2223 // Scan for '{//'. If found, use the column of '{' as a min column for line
2224 // comment section continuation.
2225 const FormatToken *PreviousToken = nullptr;
Krasimir Georgievd86c25d2017-03-10 13:09:29 +00002226 for (const UnwrappedLineNode &Node : Line.Tokens) {
Krasimir Georgiev84321612017-01-30 19:18:55 +00002227 if (PreviousToken && PreviousToken->is(tok::l_brace) &&
2228 isLineComment(*Node.Tok)) {
2229 MinColumnToken = PreviousToken;
2230 break;
2231 }
2232 PreviousToken = Node.Tok;
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002233
2234 // Grab the last newline preceding a token in this unwrapped line.
2235 if (Node.Tok->NewlinesBefore > 0) {
2236 MinColumnToken = Node.Tok;
2237 }
Krasimir Georgiev84321612017-01-30 19:18:55 +00002238 }
2239 if (PreviousToken && PreviousToken->is(tok::l_brace)) {
2240 MinColumnToken = PreviousToken;
2241 }
2242
Krasimir Georgievea222a72017-05-22 10:07:56 +00002243 return continuesLineComment(FormatTok, /*Previous=*/Line.Tokens.back().Tok,
2244 MinColumnToken);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002245}
2246
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002247void UnwrappedLineParser::flushComments(bool NewlineBeforeNext) {
2248 bool JustComments = Line->Tokens.empty();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002249 for (SmallVectorImpl<FormatToken *>::const_iterator
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002250 I = CommentsBeforeNextToken.begin(),
2251 E = CommentsBeforeNextToken.end();
2252 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002253 // Line comments that belong to the same line comment section are put on the
2254 // same line since later we might want to reflow content between them.
Krasimir Georgiev753625b2017-01-31 13:32:38 +00002255 // Additional fine-grained breaking of line comment sections is controlled
2256 // by the class BreakableLineCommentSection in case it is desirable to keep
2257 // several line comment sections in the same unwrapped line.
2258 //
2259 // FIXME: Consider putting separate line comment sections as children to the
2260 // unwrapped line instead.
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002261 (*I)->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002262 continuesLineCommentSection(**I, *Line, CommentPragmasRegex);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002263 if (isOnNewLine(**I) && JustComments && !(*I)->ContinuesLineCommentSection)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002264 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002265 pushToken(*I);
2266 }
Daniel Jaspere60cba12015-05-13 11:35:53 +00002267 if (NewlineBeforeNext && JustComments)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002268 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002269 CommentsBeforeNextToken.clear();
2270}
2271
Daniel Jasperf7935112012-12-03 18:12:45 +00002272void UnwrappedLineParser::nextToken() {
2273 if (eof())
2274 return;
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002275 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002276 pushToken(FormatTok);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00002277 if (Style.Language != FormatStyle::LK_JavaScript)
2278 readToken();
2279 else
2280 readTokenWithJavaScriptASI();
Manuel Klimek1abf7892013-01-04 23:34:14 +00002281}
2282
Daniel Jasperb9a49902016-01-09 15:56:28 +00002283const FormatToken *UnwrappedLineParser::getPreviousToken() {
2284 // FIXME: This is a dirty way to access the previous token. Find a better
2285 // solution.
2286 if (!Line || Line->Tokens.empty())
2287 return nullptr;
2288 return Line->Tokens.back().Tok;
2289}
2290
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002291void UnwrappedLineParser::distributeComments(
2292 const SmallVectorImpl<FormatToken *> &Comments,
2293 const FormatToken *NextTok) {
2294 // Whether or not a line comment token continues a line is controlled by
Krasimir Georgievea222a72017-05-22 10:07:56 +00002295 // the method continuesLineCommentSection, with the following caveat:
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002296 //
2297 // Define a trail of Comments to be a nonempty proper postfix of Comments such
2298 // that each comment line from the trail is aligned with the next token, if
2299 // the next token exists. If a trail exists, the beginning of the maximal
2300 // trail is marked as a start of a new comment section.
2301 //
2302 // For example in this code:
2303 //
2304 // int a; // line about a
2305 // // line 1 about b
2306 // // line 2 about b
2307 // int b;
2308 //
2309 // the two lines about b form a maximal trail, so there are two sections, the
2310 // first one consisting of the single comment "// line about a" and the
2311 // second one consisting of the next two comments.
2312 if (Comments.empty())
2313 return;
2314 bool ShouldPushCommentsInCurrentLine = true;
2315 bool HasTrailAlignedWithNextToken = false;
2316 unsigned StartOfTrailAlignedWithNextToken = 0;
2317 if (NextTok) {
2318 // We are skipping the first element intentionally.
2319 for (unsigned i = Comments.size() - 1; i > 0; --i) {
2320 if (Comments[i]->OriginalColumn == NextTok->OriginalColumn) {
2321 HasTrailAlignedWithNextToken = true;
2322 StartOfTrailAlignedWithNextToken = i;
2323 }
2324 }
2325 }
2326 for (unsigned i = 0, e = Comments.size(); i < e; ++i) {
2327 FormatToken *FormatTok = Comments[i];
2328 if (HasTrailAlignedWithNextToken &&
2329 i == StartOfTrailAlignedWithNextToken) {
2330 FormatTok->ContinuesLineCommentSection = false;
2331 } else {
2332 FormatTok->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002333 continuesLineCommentSection(*FormatTok, *Line, CommentPragmasRegex);
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002334 }
2335 if (!FormatTok->ContinuesLineCommentSection &&
2336 (isOnNewLine(*FormatTok) || FormatTok->IsFirst)) {
2337 ShouldPushCommentsInCurrentLine = false;
2338 }
2339 if (ShouldPushCommentsInCurrentLine) {
2340 pushToken(FormatTok);
2341 } else {
2342 CommentsBeforeNextToken.push_back(FormatTok);
2343 }
2344 }
2345}
2346
Manuel Klimek1abf7892013-01-04 23:34:14 +00002347void UnwrappedLineParser::readToken() {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002348 SmallVector<FormatToken *, 1> Comments;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002349 do {
2350 FormatTok = Tokens->getNextToken();
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00002351 assert(FormatTok);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002352 while (!Line->InPPDirective && FormatTok->Tok.is(tok::hash) &&
2353 (FormatTok->HasUnescapedNewline || FormatTok->IsFirst)) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002354 distributeComments(Comments, FormatTok);
2355 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002356 // If there is an unfinished unwrapped line, we flush the preprocessor
2357 // directives only after that unwrapped line was finished later.
Daniel Jasper29d39d52015-02-08 09:34:49 +00002358 bool SwitchToPreprocessorLines = !Line->Tokens.empty();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002359 ScopedLineState BlockState(*this, SwitchToPreprocessorLines);
Alexander Kornienkob1be9d62013-04-03 12:38:53 +00002360 // Comments stored before the preprocessor directive need to be output
2361 // before the preprocessor directive, at the same level as the
2362 // preprocessor directive, as we consider them to apply to the directive.
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002363 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002364 parsePPDirective();
2365 }
Manuel Klimek68b03042014-04-14 09:14:11 +00002366 while (FormatTok->Type == TT_ConflictStart ||
2367 FormatTok->Type == TT_ConflictEnd ||
2368 FormatTok->Type == TT_ConflictAlternative) {
2369 if (FormatTok->Type == TT_ConflictStart) {
2370 conditionalCompilationStart(/*Unreachable=*/false);
2371 } else if (FormatTok->Type == TT_ConflictAlternative) {
2372 conditionalCompilationAlternative();
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002373 } else if (FormatTok->Type == TT_ConflictEnd) {
Manuel Klimek68b03042014-04-14 09:14:11 +00002374 conditionalCompilationEnd();
2375 }
2376 FormatTok = Tokens->getNextToken();
2377 FormatTok->MustBreakBefore = true;
2378 }
Alexander Kornienkof2e02122013-05-24 18:24:24 +00002379
2380 if (!PPStack.empty() && (PPStack.back() == PP_Unreachable) &&
2381 !Line->InPPDirective) {
2382 continue;
2383 }
2384
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002385 if (!FormatTok->Tok.is(tok::comment)) {
2386 distributeComments(Comments, FormatTok);
2387 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002388 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002389 }
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002390
2391 Comments.push_back(FormatTok);
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002392 } while (!eof());
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002393
2394 distributeComments(Comments, nullptr);
2395 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002396}
2397
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002398void UnwrappedLineParser::pushToken(FormatToken *Tok) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002399 Line->Tokens.push_back(UnwrappedLineNode(Tok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002400 if (MustBreakBeforeNextToken) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002401 Line->Tokens.back().Tok->MustBreakBefore = true;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002402 MustBreakBeforeNextToken = false;
Manuel Klimek1abf7892013-01-04 23:34:14 +00002403 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002404}
2405
Daniel Jasper8d1832e2013-01-07 13:26:07 +00002406} // end namespace format
2407} // end namespace clang