blob: ae79ea5d8a66899bd89ecf53f5807aecaf2f1b64 [file] [log] [blame]
//===--- UnwrappedLineParser.cpp - Format C++ code ------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief This file contains the implementation of the UnwrappedLineParser,
/// which turns a stream of tokens into UnwrappedLines.
///
//===----------------------------------------------------------------------===//
15
Chandler Carruth4b417452013-01-19 08:09:44 +000016#include "UnwrappedLineParser.h"
Benjamin Kramer33335df2015-03-01 21:36:40 +000017#include "llvm/ADT/STLExtras.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000018#include "llvm/Support/Debug.h"
Benjamin Kramer53f5e892015-03-23 18:05:43 +000019#include "llvm/Support/raw_ostream.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000020
Chandler Carruth10346662014-04-22 03:17:02 +000021#define DEBUG_TYPE "format-parser"
22
Daniel Jasperf7935112012-12-03 18:12:45 +000023namespace clang {
24namespace format {
25
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000026class FormatTokenSource {
27public:
Angel Garcia Gomez637d1e62015-10-20 13:23:58 +000028 virtual ~FormatTokenSource() {}
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000029 virtual FormatToken *getNextToken() = 0;
30
31 virtual unsigned getPosition() = 0;
32 virtual FormatToken *setPosition(unsigned Position) = 0;
33};
34
Craig Topper69665e12013-07-01 04:21:54 +000035namespace {
36
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000037class ScopedDeclarationState {
38public:
39 ScopedDeclarationState(UnwrappedLine &Line, std::vector<bool> &Stack,
40 bool MustBeDeclaration)
41 : Line(Line), Stack(Stack) {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000042 Line.MustBeDeclaration = MustBeDeclaration;
Manuel Klimek39080572013-01-23 11:03:04 +000043 Stack.push_back(MustBeDeclaration);
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000044 }
45 ~ScopedDeclarationState() {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000046 Stack.pop_back();
Manuel Klimekc1237a82013-01-23 14:08:21 +000047 if (!Stack.empty())
48 Line.MustBeDeclaration = Stack.back();
49 else
50 Line.MustBeDeclaration = true;
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000051 }
Daniel Jasper393564f2013-05-31 14:56:29 +000052
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000053private:
54 UnwrappedLine &Line;
55 std::vector<bool> &Stack;
56};
57
Krasimir Georgieva1c30932017-05-19 10:34:57 +000058static bool isLineComment(const FormatToken &FormatTok) {
59 return FormatTok.is(tok::comment) &&
60 FormatTok.TokenText.startswith("//");
61}
62
Krasimir Georgievea222a72017-05-22 10:07:56 +000063// Checks if \p FormatTok is a line comment that continues the line comment
64// \p Previous. The original column of \p MinColumnToken is used to determine
65// whether \p FormatTok is indented enough to the right to continue \p Previous.
66static bool continuesLineComment(const FormatToken &FormatTok,
67 const FormatToken *Previous,
68 const FormatToken *MinColumnToken) {
69 if (!Previous || !MinColumnToken)
70 return false;
71 unsigned MinContinueColumn =
72 MinColumnToken->OriginalColumn + (isLineComment(*MinColumnToken) ? 0 : 1);
73 return isLineComment(FormatTok) && FormatTok.NewlinesBefore == 1 &&
74 isLineComment(*Previous) &&
75 FormatTok.OriginalColumn >= MinContinueColumn;
76}
77
Manuel Klimek1abf7892013-01-04 23:34:14 +000078class ScopedMacroState : public FormatTokenSource {
79public:
80 ScopedMacroState(UnwrappedLine &Line, FormatTokenSource *&TokenSource,
Manuel Klimek20e0af62015-05-06 11:56:29 +000081 FormatToken *&ResetToken)
Manuel Klimek1abf7892013-01-04 23:34:14 +000082 : Line(Line), TokenSource(TokenSource), ResetToken(ResetToken),
Manuel Klimek1a18c402013-04-12 14:13:36 +000083 PreviousLineLevel(Line.Level), PreviousTokenSource(TokenSource),
Krasimir Georgieva1c30932017-05-19 10:34:57 +000084 Token(nullptr), PreviousToken(nullptr) {
Manuel Klimek1abf7892013-01-04 23:34:14 +000085 TokenSource = this;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000086 Line.Level = 0;
Manuel Klimek1abf7892013-01-04 23:34:14 +000087 Line.InPPDirective = true;
88 }
89
Alexander Kornienko34eb2072015-04-11 02:00:23 +000090 ~ScopedMacroState() override {
Manuel Klimek1abf7892013-01-04 23:34:14 +000091 TokenSource = PreviousTokenSource;
92 ResetToken = Token;
93 Line.InPPDirective = false;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000094 Line.Level = PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +000095 }
96
Craig Topperfb6b25b2014-03-15 04:29:04 +000097 FormatToken *getNextToken() override {
Manuel Klimek78725712013-01-07 10:03:37 +000098 // The \c UnwrappedLineParser guards against this by never calling
99 // \c getNextToken() after it has encountered the first eof token.
100 assert(!eof());
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000101 PreviousToken = Token;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000102 Token = PreviousTokenSource->getNextToken();
103 if (eof())
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000104 return getFakeEOF();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000105 return Token;
106 }
107
Craig Topperfb6b25b2014-03-15 04:29:04 +0000108 unsigned getPosition() override { return PreviousTokenSource->getPosition(); }
Manuel Klimekab419912013-05-23 09:41:43 +0000109
Craig Topperfb6b25b2014-03-15 04:29:04 +0000110 FormatToken *setPosition(unsigned Position) override {
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000111 PreviousToken = nullptr;
Manuel Klimekab419912013-05-23 09:41:43 +0000112 Token = PreviousTokenSource->setPosition(Position);
113 return Token;
114 }
115
Manuel Klimek1abf7892013-01-04 23:34:14 +0000116private:
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000117 bool eof() {
118 return Token && Token->HasUnescapedNewline &&
Krasimir Georgievea222a72017-05-22 10:07:56 +0000119 !continuesLineComment(*Token, PreviousToken,
120 /*MinColumnToken=*/PreviousToken);
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000121 }
Manuel Klimek1abf7892013-01-04 23:34:14 +0000122
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000123 FormatToken *getFakeEOF() {
124 static bool EOFInitialized = false;
125 static FormatToken FormatTok;
126 if (!EOFInitialized) {
127 FormatTok.Tok.startToken();
128 FormatTok.Tok.setKind(tok::eof);
129 EOFInitialized = true;
130 }
131 return &FormatTok;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000132 }
133
134 UnwrappedLine &Line;
135 FormatTokenSource *&TokenSource;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000136 FormatToken *&ResetToken;
Manuel Klimekef2cfb12013-01-05 22:14:16 +0000137 unsigned PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000138 FormatTokenSource *PreviousTokenSource;
139
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000140 FormatToken *Token;
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000141 FormatToken *PreviousToken;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000142};
143
Craig Topper69665e12013-07-01 04:21:54 +0000144} // end anonymous namespace
145
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000146class ScopedLineState {
147public:
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000148 ScopedLineState(UnwrappedLineParser &Parser,
149 bool SwitchToPreprocessorLines = false)
David Blaikieefb6eb22014-08-09 20:02:07 +0000150 : Parser(Parser), OriginalLines(Parser.CurrentLines) {
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000151 if (SwitchToPreprocessorLines)
152 Parser.CurrentLines = &Parser.PreprocessorDirectives;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000153 else if (!Parser.Line->Tokens.empty())
154 Parser.CurrentLines = &Parser.Line->Tokens.back().Children;
David Blaikieefb6eb22014-08-09 20:02:07 +0000155 PreBlockLine = std::move(Parser.Line);
156 Parser.Line = llvm::make_unique<UnwrappedLine>();
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000157 Parser.Line->Level = PreBlockLine->Level;
158 Parser.Line->InPPDirective = PreBlockLine->InPPDirective;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000159 }
160
161 ~ScopedLineState() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000162 if (!Parser.Line->Tokens.empty()) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000163 Parser.addUnwrappedLine();
164 }
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000165 assert(Parser.Line->Tokens.empty());
David Blaikieefb6eb22014-08-09 20:02:07 +0000166 Parser.Line = std::move(PreBlockLine);
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000167 if (Parser.CurrentLines == &Parser.PreprocessorDirectives)
168 Parser.MustBreakBeforeNextToken = true;
169 Parser.CurrentLines = OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000170 }
171
172private:
173 UnwrappedLineParser &Parser;
174
David Blaikieefb6eb22014-08-09 20:02:07 +0000175 std::unique_ptr<UnwrappedLine> PreBlockLine;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000176 SmallVectorImpl<UnwrappedLine> *OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000177};
178
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000179class CompoundStatementIndenter {
180public:
181 CompoundStatementIndenter(UnwrappedLineParser *Parser,
182 const FormatStyle &Style, unsigned &LineLevel)
183 : LineLevel(LineLevel), OldLineLevel(LineLevel) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000184 if (Style.BraceWrapping.AfterControlStatement)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000185 Parser->addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000186 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000187 ++LineLevel;
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000188 }
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000189 ~CompoundStatementIndenter() { LineLevel = OldLineLevel; }
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000190
191private:
192 unsigned &LineLevel;
193 unsigned OldLineLevel;
194};
195
Craig Topper69665e12013-07-01 04:21:54 +0000196namespace {
197
Manuel Klimekab419912013-05-23 09:41:43 +0000198class IndexedTokenSource : public FormatTokenSource {
199public:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000200 IndexedTokenSource(ArrayRef<FormatToken *> Tokens)
Manuel Klimekab419912013-05-23 09:41:43 +0000201 : Tokens(Tokens), Position(-1) {}
202
Craig Topperfb6b25b2014-03-15 04:29:04 +0000203 FormatToken *getNextToken() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000204 ++Position;
205 return Tokens[Position];
206 }
207
Craig Topperfb6b25b2014-03-15 04:29:04 +0000208 unsigned getPosition() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000209 assert(Position >= 0);
210 return Position;
211 }
212
Craig Topperfb6b25b2014-03-15 04:29:04 +0000213 FormatToken *setPosition(unsigned P) override {
Manuel Klimekab419912013-05-23 09:41:43 +0000214 Position = P;
215 return Tokens[Position];
216 }
217
Manuel Klimek71814b42013-10-11 21:25:45 +0000218 void reset() { Position = -1; }
219
Manuel Klimekab419912013-05-23 09:41:43 +0000220private:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000221 ArrayRef<FormatToken *> Tokens;
Manuel Klimekab419912013-05-23 09:41:43 +0000222 int Position;
223};
224
Craig Topper69665e12013-07-01 04:21:54 +0000225} // end anonymous namespace
226
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000227UnwrappedLineParser::UnwrappedLineParser(const FormatStyle &Style,
Daniel Jasperd0ec0d62014-11-04 12:41:02 +0000228 const AdditionalKeywords &Keywords,
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000229 ArrayRef<FormatToken *> Tokens,
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000230 UnwrappedLineConsumer &Callback)
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000231 : Line(new UnwrappedLine), MustBreakBeforeNextToken(false),
Krasimir Georgiev00c5c722017-02-02 15:32:19 +0000232 CurrentLines(&Lines), Style(Style), Keywords(Keywords),
233 CommentPragmasRegex(Style.CommentPragmas), Tokens(nullptr),
Manuel Klimek20e0af62015-05-06 11:56:29 +0000234 Callback(Callback), AllTokens(Tokens), PPBranchLevel(-1) {}
Manuel Klimek71814b42013-10-11 21:25:45 +0000235
236void UnwrappedLineParser::reset() {
237 PPBranchLevel = -1;
238 Line.reset(new UnwrappedLine);
239 CommentsBeforeNextToken.clear();
Craig Topper2145bc02014-05-09 08:15:10 +0000240 FormatTok = nullptr;
Manuel Klimek71814b42013-10-11 21:25:45 +0000241 MustBreakBeforeNextToken = false;
242 PreprocessorDirectives.clear();
243 CurrentLines = &Lines;
244 DeclarationScopeStack.clear();
Manuel Klimek71814b42013-10-11 21:25:45 +0000245 PPStack.clear();
246}
Daniel Jasperf7935112012-12-03 18:12:45 +0000247
Manuel Klimek20e0af62015-05-06 11:56:29 +0000248void UnwrappedLineParser::parse() {
Manuel Klimekab419912013-05-23 09:41:43 +0000249 IndexedTokenSource TokenSource(AllTokens);
Manuel Klimek71814b42013-10-11 21:25:45 +0000250 do {
251 DEBUG(llvm::dbgs() << "----\n");
252 reset();
253 Tokens = &TokenSource;
254 TokenSource.reset();
Daniel Jaspera79064a2013-03-01 18:11:39 +0000255
Manuel Klimek71814b42013-10-11 21:25:45 +0000256 readToken();
257 parseFile();
258 // Create line with eof token.
259 pushToken(FormatTok);
260 addUnwrappedLine();
261
262 for (SmallVectorImpl<UnwrappedLine>::iterator I = Lines.begin(),
263 E = Lines.end();
264 I != E; ++I) {
265 Callback.consumeUnwrappedLine(*I);
266 }
267 Callback.finishRun();
268 Lines.clear();
269 while (!PPLevelBranchIndex.empty() &&
Daniel Jasper53bd1672013-10-12 13:32:56 +0000270 PPLevelBranchIndex.back() + 1 >= PPLevelBranchCount.back()) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000271 PPLevelBranchIndex.resize(PPLevelBranchIndex.size() - 1);
272 PPLevelBranchCount.resize(PPLevelBranchCount.size() - 1);
273 }
274 if (!PPLevelBranchIndex.empty()) {
275 ++PPLevelBranchIndex.back();
276 assert(PPLevelBranchIndex.size() == PPLevelBranchCount.size());
277 assert(PPLevelBranchIndex.back() <= PPLevelBranchCount.back());
278 }
279 } while (!PPLevelBranchIndex.empty());
Manuel Klimek1abf7892013-01-04 23:34:14 +0000280}
281
Manuel Klimek1a18c402013-04-12 14:13:36 +0000282void UnwrappedLineParser::parseFile() {
Daniel Jasper9326f912015-05-05 08:40:32 +0000283 // The top-level context in a file always has declarations, except for pre-
284 // processor directives and JavaScript files.
285 bool MustBeDeclaration =
286 !Line->InPPDirective && Style.Language != FormatStyle::LK_JavaScript;
287 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
288 MustBeDeclaration);
Nico Weber9096fc02013-06-26 00:30:14 +0000289 parseLevel(/*HasOpeningBrace=*/false);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000290 // Make sure to format the remaining tokens.
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000291 flushComments(true);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000292 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000293}
294
Manuel Klimek1a18c402013-04-12 14:13:36 +0000295void UnwrappedLineParser::parseLevel(bool HasOpeningBrace) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000296 bool SwitchLabelEncountered = false;
Daniel Jasperf7935112012-12-03 18:12:45 +0000297 do {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000298 tok::TokenKind kind = FormatTok->Tok.getKind();
299 if (FormatTok->Type == TT_MacroBlockBegin) {
300 kind = tok::l_brace;
301 } else if (FormatTok->Type == TT_MacroBlockEnd) {
302 kind = tok::r_brace;
303 }
304
305 switch (kind) {
Daniel Jasperf7935112012-12-03 18:12:45 +0000306 case tok::comment:
Daniel Jaspere25509f2012-12-17 11:29:41 +0000307 nextToken();
308 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000309 break;
310 case tok::l_brace:
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000311 // FIXME: Add parameter whether this can happen - if this happens, we must
312 // be in a non-declaration context.
Daniel Jasperb86e2722015-08-24 13:23:37 +0000313 if (!FormatTok->is(TT_MacroBlockBegin) && tryToParseBracedList())
314 continue;
Nico Weber9096fc02013-06-26 00:30:14 +0000315 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +0000316 addUnwrappedLine();
317 break;
318 case tok::r_brace:
Manuel Klimek1a18c402013-04-12 14:13:36 +0000319 if (HasOpeningBrace)
320 return;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000321 nextToken();
322 addUnwrappedLine();
Manuel Klimek1058d982013-01-06 20:07:31 +0000323 break;
Daniel Jasper516d7972013-07-25 11:31:57 +0000324 case tok::kw_default:
325 case tok::kw_case:
Daniel Jasper72407622013-09-02 08:26:29 +0000326 if (!SwitchLabelEncountered &&
327 (Style.IndentCaseLabels || (Line->InPPDirective && Line->Level == 1)))
328 ++Line->Level;
Daniel Jasper516d7972013-07-25 11:31:57 +0000329 SwitchLabelEncountered = true;
330 parseStructuralElement();
331 break;
Daniel Jasperf7935112012-12-03 18:12:45 +0000332 default:
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000333 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +0000334 break;
335 }
336 } while (!eof());
337}
338
Daniel Jasperadba2aa2015-05-18 12:52:00 +0000339void UnwrappedLineParser::calculateBraceTypes(bool ExpectClassBody) {
Manuel Klimekab419912013-05-23 09:41:43 +0000340 // We'll parse forward through the tokens until we hit
341 // a closing brace or eof - note that getNextToken() will
342 // parse macros, so this will magically work inside macro
343 // definitions, too.
344 unsigned StoredPosition = Tokens->getPosition();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000345 FormatToken *Tok = FormatTok;
Daniel Jasperb9a49902016-01-09 15:56:28 +0000346 const FormatToken *PrevTok = getPreviousToken();
Manuel Klimekab419912013-05-23 09:41:43 +0000347 // Keep a stack of positions of lbrace tokens. We will
348 // update information about whether an lbrace starts a
349 // braced init list or a different block during the loop.
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000350 SmallVector<FormatToken *, 8> LBraceStack;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000351 assert(Tok->Tok.is(tok::l_brace));
Manuel Klimekab419912013-05-23 09:41:43 +0000352 do {
Daniel Jaspereb65e912015-12-21 18:31:15 +0000353 // Get next non-comment token.
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000354 FormatToken *NextTok;
Daniel Jasperca7bd722013-07-01 16:43:38 +0000355 unsigned ReadTokens = 0;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000356 do {
357 NextTok = Tokens->getNextToken();
Daniel Jasperca7bd722013-07-01 16:43:38 +0000358 ++ReadTokens;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000359 } while (NextTok->is(tok::comment));
360
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000361 switch (Tok->Tok.getKind()) {
Manuel Klimekab419912013-05-23 09:41:43 +0000362 case tok::l_brace:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000363 if (Style.Language == FormatStyle::LK_JavaScript && PrevTok &&
364 PrevTok->is(tok::colon))
Martin Probst8e3eba02017-02-07 16:33:13 +0000365 // A colon indicates this code is in a type, or a braced list following
366 // a label in an object literal ({a: {b: 1}}).
367 // The code below could be confused by semicolons between the individual
368 // members in a type member list, which would normally trigger BK_Block.
369 // In both cases, this must be parsed as an inline braced init.
Daniel Jasperb9a49902016-01-09 15:56:28 +0000370 Tok->BlockKind = BK_BracedInit;
371 else
372 Tok->BlockKind = BK_Unknown;
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000373 LBraceStack.push_back(Tok);
Manuel Klimekab419912013-05-23 09:41:43 +0000374 break;
375 case tok::r_brace:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000376 if (LBraceStack.empty())
377 break;
378 if (LBraceStack.back()->BlockKind == BK_Unknown) {
379 bool ProbablyBracedList = false;
380 if (Style.Language == FormatStyle::LK_Proto) {
381 ProbablyBracedList = NextTok->isOneOf(tok::comma, tok::r_square);
382 } else {
383 // Using OriginalColumn to distinguish between ObjC methods and
384 // binary operators is a bit hacky.
385 bool NextIsObjCMethod = NextTok->isOneOf(tok::plus, tok::minus) &&
386 NextTok->OriginalColumn == 0;
Daniel Jasper91b032a2014-05-22 12:46:38 +0000387
Daniel Jasperb9a49902016-01-09 15:56:28 +0000388 // If there is a comma, semicolon or right paren after the closing
389 // brace, we assume this is a braced initializer list. Note that
390 // regardless how we mark inner braces here, we will overwrite the
391 // BlockKind later if we parse a braced list (where all blocks
392 // inside are by default braced lists), or when we explicitly detect
393 // blocks (for example while parsing lambdas).
Daniel Jasperb9a49902016-01-09 15:56:28 +0000394 ProbablyBracedList =
Daniel Jasperacffeb82016-03-05 18:34:26 +0000395 (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probste1e12a72016-08-19 14:35:01 +0000396 NextTok->isOneOf(Keywords.kw_of, Keywords.kw_in,
397 Keywords.kw_as)) ||
Martin Probstb7fb2672017-05-10 13:53:29 +0000398 (Style.isCpp() && NextTok->is(tok::l_paren)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000399 NextTok->isOneOf(tok::comma, tok::period, tok::colon,
400 tok::r_paren, tok::r_square, tok::l_brace,
Martin Probstb7fb2672017-05-10 13:53:29 +0000401 tok::l_square, tok::ellipsis) ||
Daniel Jaspere4ada022016-12-13 10:05:03 +0000402 (NextTok->is(tok::identifier) &&
403 !PrevTok->isOneOf(tok::semi, tok::r_brace, tok::l_brace)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000404 (NextTok->is(tok::semi) &&
405 (!ExpectClassBody || LBraceStack.size() != 1)) ||
406 (NextTok->isBinaryOperator() && !NextIsObjCMethod);
Manuel Klimekab419912013-05-23 09:41:43 +0000407 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000408 if (ProbablyBracedList) {
409 Tok->BlockKind = BK_BracedInit;
410 LBraceStack.back()->BlockKind = BK_BracedInit;
411 } else {
412 Tok->BlockKind = BK_Block;
413 LBraceStack.back()->BlockKind = BK_Block;
414 }
Manuel Klimekab419912013-05-23 09:41:43 +0000415 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000416 LBraceStack.pop_back();
Manuel Klimekab419912013-05-23 09:41:43 +0000417 break;
Daniel Jasperac7e34e2014-03-13 10:11:17 +0000418 case tok::at:
Manuel Klimekab419912013-05-23 09:41:43 +0000419 case tok::semi:
420 case tok::kw_if:
421 case tok::kw_while:
422 case tok::kw_for:
423 case tok::kw_switch:
424 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +0000425 case tok::kw___try:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000426 if (!LBraceStack.empty() && LBraceStack.back()->BlockKind == BK_Unknown)
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000427 LBraceStack.back()->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000428 break;
429 default:
430 break;
431 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000432 PrevTok = Tok;
Manuel Klimekab419912013-05-23 09:41:43 +0000433 Tok = NextTok;
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000434 } while (Tok->Tok.isNot(tok::eof) && !LBraceStack.empty());
Daniel Jasperb9a49902016-01-09 15:56:28 +0000435
Manuel Klimekab419912013-05-23 09:41:43 +0000436 // Assume other blocks for all unclosed opening braces.
437 for (unsigned i = 0, e = LBraceStack.size(); i != e; ++i) {
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000438 if (LBraceStack[i]->BlockKind == BK_Unknown)
439 LBraceStack[i]->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000440 }
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000441
Manuel Klimekab419912013-05-23 09:41:43 +0000442 FormatTok = Tokens->setPosition(StoredPosition);
443}
444
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000445void UnwrappedLineParser::parseBlock(bool MustBeDeclaration, bool AddLevel,
446 bool MunchSemi) {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000447 assert(FormatTok->isOneOf(tok::l_brace, TT_MacroBlockBegin) &&
448 "'{' or macro block token expected");
449 const bool MacroBlock = FormatTok->is(TT_MacroBlockBegin);
Daniel Jaspereb65e912015-12-21 18:31:15 +0000450 FormatTok->BlockKind = BK_Block;
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000451
Daniel Jasper516d7972013-07-25 11:31:57 +0000452 unsigned InitialLevel = Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +0000453 nextToken();
454
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000455 if (MacroBlock && FormatTok->is(tok::l_paren))
456 parseParens();
457
Manuel Klimeka4fe1c12013-01-21 16:42:44 +0000458 addUnwrappedLine();
Krasimir Georgiev9f5608a2017-05-18 15:16:24 +0000459 size_t OpeningLineIndex = CurrentLines->empty()
460 ? (UnwrappedLine::kInvalidIndex)
461 : (CurrentLines->size() - 1);
Daniel Jasperf7935112012-12-03 18:12:45 +0000462
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000463 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
464 MustBeDeclaration);
Daniel Jasper65ee3472013-07-31 23:16:02 +0000465 if (AddLevel)
466 ++Line->Level;
Nico Weber9096fc02013-06-26 00:30:14 +0000467 parseLevel(/*HasOpeningBrace=*/true);
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000468
Marianne Mailhot-Sarrasin03137c62016-04-14 14:56:49 +0000469 if (eof())
470 return;
471
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000472 if (MacroBlock ? !FormatTok->is(TT_MacroBlockEnd)
473 : !FormatTok->is(tok::r_brace)) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000474 Line->Level = InitialLevel;
Daniel Jaspereb65e912015-12-21 18:31:15 +0000475 FormatTok->BlockKind = BK_Block;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000476 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000477 }
Alexander Kornienko0ea8e102012-12-04 15:40:36 +0000478
Daniel Jasperd1ae3582013-03-20 12:37:50 +0000479 nextToken(); // Munch the closing brace.
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000480
481 if (MacroBlock && FormatTok->is(tok::l_paren))
482 parseParens();
483
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000484 if (MunchSemi && FormatTok->Tok.is(tok::semi))
485 nextToken();
Daniel Jasper516d7972013-07-25 11:31:57 +0000486 Line->Level = InitialLevel;
Krasimir Georgiev7cb267a2017-02-27 13:28:36 +0000487 Line->MatchingOpeningBlockLineIndex = OpeningLineIndex;
Daniel Jasperf7935112012-12-03 18:12:45 +0000488}
489
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000490static bool isGoogScope(const UnwrappedLine &Line) {
Daniel Jasper616de8642014-11-23 16:46:28 +0000491 // FIXME: Closure-library specific stuff should not be hard-coded but be
492 // configurable.
Daniel Jasper4a39c842014-05-06 13:54:10 +0000493 if (Line.Tokens.size() < 4)
494 return false;
495 auto I = Line.Tokens.begin();
496 if (I->Tok->TokenText != "goog")
497 return false;
498 ++I;
499 if (I->Tok->isNot(tok::period))
500 return false;
501 ++I;
502 if (I->Tok->TokenText != "scope")
503 return false;
504 ++I;
505 return I->Tok->is(tok::l_paren);
506}
507
Martin Probst101ec892017-05-09 20:04:09 +0000508static bool isIIFE(const UnwrappedLine &Line,
509 const AdditionalKeywords &Keywords) {
510 // Look for the start of an immediately invoked anonymous function.
511 // https://en.wikipedia.org/wiki/Immediately-invoked_function_expression
512 // This is commonly done in JavaScript to create a new, anonymous scope.
513 // Example: (function() { ... })()
514 if (Line.Tokens.size() < 3)
515 return false;
516 auto I = Line.Tokens.begin();
517 if (I->Tok->isNot(tok::l_paren))
518 return false;
519 ++I;
520 if (I->Tok->isNot(Keywords.kw_function))
521 return false;
522 ++I;
523 return I->Tok->is(tok::l_paren);
524}
525
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000526static bool ShouldBreakBeforeBrace(const FormatStyle &Style,
527 const FormatToken &InitialToken) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000528 if (InitialToken.is(tok::kw_namespace))
529 return Style.BraceWrapping.AfterNamespace;
530 if (InitialToken.is(tok::kw_class))
531 return Style.BraceWrapping.AfterClass;
532 if (InitialToken.is(tok::kw_union))
533 return Style.BraceWrapping.AfterUnion;
534 if (InitialToken.is(tok::kw_struct))
535 return Style.BraceWrapping.AfterStruct;
536 return false;
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000537}
538
Manuel Klimek516e0542013-09-04 13:25:30 +0000539void UnwrappedLineParser::parseChildBlock() {
540 FormatTok->BlockKind = BK_Block;
541 nextToken();
542 {
Martin Probst101ec892017-05-09 20:04:09 +0000543 bool SkipIndent =
544 (Style.Language == FormatStyle::LK_JavaScript &&
545 (isGoogScope(*Line) || isIIFE(*Line, Keywords)));
Manuel Klimek516e0542013-09-04 13:25:30 +0000546 ScopedLineState LineState(*this);
547 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
548 /*MustBeDeclaration=*/false);
Martin Probst101ec892017-05-09 20:04:09 +0000549 Line->Level += SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000550 parseLevel(/*HasOpeningBrace=*/true);
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000551 flushComments(isOnNewLine(*FormatTok));
Martin Probst101ec892017-05-09 20:04:09 +0000552 Line->Level -= SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000553 }
554 nextToken();
555}
556
Daniel Jasperf7935112012-12-03 18:12:45 +0000557void UnwrappedLineParser::parsePPDirective() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000558 assert(FormatTok->Tok.is(tok::hash) && "'#' expected");
Manuel Klimek20e0af62015-05-06 11:56:29 +0000559 ScopedMacroState MacroState(*Line, Tokens, FormatTok);
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000560 nextToken();
561
Craig Topper2145bc02014-05-09 08:15:10 +0000562 if (!FormatTok->Tok.getIdentifierInfo()) {
Manuel Klimek591b5802013-01-31 15:58:48 +0000563 parsePPUnknown();
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000564 return;
Daniel Jasperf7935112012-12-03 18:12:45 +0000565 }
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000566
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000567 switch (FormatTok->Tok.getIdentifierInfo()->getPPKeywordID()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000568 case tok::pp_define:
569 parsePPDefine();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000570 return;
571 case tok::pp_if:
Manuel Klimek71814b42013-10-11 21:25:45 +0000572 parsePPIf(/*IfDef=*/false);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000573 break;
574 case tok::pp_ifdef:
575 case tok::pp_ifndef:
Manuel Klimek71814b42013-10-11 21:25:45 +0000576 parsePPIf(/*IfDef=*/true);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000577 break;
578 case tok::pp_else:
579 parsePPElse();
580 break;
581 case tok::pp_elif:
582 parsePPElIf();
583 break;
584 case tok::pp_endif:
585 parsePPEndIf();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000586 break;
587 default:
588 parsePPUnknown();
589 break;
590 }
591}
592
Manuel Klimek68b03042014-04-14 09:14:11 +0000593void UnwrappedLineParser::conditionalCompilationCondition(bool Unreachable) {
594 if (Unreachable || (!PPStack.empty() && PPStack.back() == PP_Unreachable))
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000595 PPStack.push_back(PP_Unreachable);
596 else
597 PPStack.push_back(PP_Conditional);
598}
599
Manuel Klimek68b03042014-04-14 09:14:11 +0000600void UnwrappedLineParser::conditionalCompilationStart(bool Unreachable) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000601 ++PPBranchLevel;
602 assert(PPBranchLevel >= 0 && PPBranchLevel <= (int)PPLevelBranchIndex.size());
603 if (PPBranchLevel == (int)PPLevelBranchIndex.size()) {
604 PPLevelBranchIndex.push_back(0);
605 PPLevelBranchCount.push_back(0);
606 }
607 PPChainBranchIndex.push(0);
Manuel Klimek68b03042014-04-14 09:14:11 +0000608 bool Skip = PPLevelBranchIndex[PPBranchLevel] > 0;
609 conditionalCompilationCondition(Unreachable || Skip);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000610}
611
Manuel Klimek68b03042014-04-14 09:14:11 +0000612void UnwrappedLineParser::conditionalCompilationAlternative() {
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000613 if (!PPStack.empty())
614 PPStack.pop_back();
Manuel Klimek71814b42013-10-11 21:25:45 +0000615 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
616 if (!PPChainBranchIndex.empty())
617 ++PPChainBranchIndex.top();
Manuel Klimek68b03042014-04-14 09:14:11 +0000618 conditionalCompilationCondition(
619 PPBranchLevel >= 0 && !PPChainBranchIndex.empty() &&
620 PPLevelBranchIndex[PPBranchLevel] != PPChainBranchIndex.top());
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000621}
622
Manuel Klimek68b03042014-04-14 09:14:11 +0000623void UnwrappedLineParser::conditionalCompilationEnd() {
Manuel Klimek71814b42013-10-11 21:25:45 +0000624 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
625 if (PPBranchLevel >= 0 && !PPChainBranchIndex.empty()) {
626 if (PPChainBranchIndex.top() + 1 > PPLevelBranchCount[PPBranchLevel]) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000627 PPLevelBranchCount[PPBranchLevel] = PPChainBranchIndex.top() + 1;
628 }
629 }
Manuel Klimek14bd9172014-01-29 08:49:02 +0000630 // Guard against #endif's without #if.
631 if (PPBranchLevel > 0)
632 --PPBranchLevel;
Manuel Klimek71814b42013-10-11 21:25:45 +0000633 if (!PPChainBranchIndex.empty())
634 PPChainBranchIndex.pop();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000635 if (!PPStack.empty())
636 PPStack.pop_back();
Manuel Klimek68b03042014-04-14 09:14:11 +0000637}
638
639void UnwrappedLineParser::parsePPIf(bool IfDef) {
Daniel Jasper62703eb2017-03-01 11:10:11 +0000640 bool IfNDef = FormatTok->is(tok::pp_ifndef);
Manuel Klimek68b03042014-04-14 09:14:11 +0000641 nextToken();
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000642 bool Unreachable = false;
643 if (!IfDef && (FormatTok->is(tok::kw_false) || FormatTok->TokenText == "0"))
644 Unreachable = true;
Daniel Jasper62703eb2017-03-01 11:10:11 +0000645 if (IfDef && !IfNDef && FormatTok->TokenText == "SWIG")
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000646 Unreachable = true;
647 conditionalCompilationStart(Unreachable);
Manuel Klimek68b03042014-04-14 09:14:11 +0000648 parsePPUnknown();
649}
650
651void UnwrappedLineParser::parsePPElse() {
652 conditionalCompilationAlternative();
653 parsePPUnknown();
654}
655
656void UnwrappedLineParser::parsePPElIf() { parsePPElse(); }
657
658void UnwrappedLineParser::parsePPEndIf() {
659 conditionalCompilationEnd();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000660 parsePPUnknown();
661}
662
Manuel Klimek1abf7892013-01-04 23:34:14 +0000663void UnwrappedLineParser::parsePPDefine() {
664 nextToken();
665
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000666 if (FormatTok->Tok.getKind() != tok::identifier) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000667 parsePPUnknown();
668 return;
669 }
670 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000671 if (FormatTok->Tok.getKind() == tok::l_paren &&
672 FormatTok->WhitespaceRange.getBegin() ==
673 FormatTok->WhitespaceRange.getEnd()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000674 parseParens();
675 }
676 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +0000677 Line->Level = 1;
Manuel Klimek1b896292013-01-07 09:34:28 +0000678
679 // Errors during a preprocessor directive can only affect the layout of the
680 // preprocessor directive, and thus we ignore them. An alternative approach
681 // would be to use the same approach we use on the file level (no
682 // re-indentation if there was a structural error) within the macro
683 // definition.
Manuel Klimek1abf7892013-01-04 23:34:14 +0000684 parseFile();
685}
686
687void UnwrappedLineParser::parsePPUnknown() {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000688 do {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000689 nextToken();
690 } while (!eof());
691 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000692}
693
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000694// Here we blacklist certain tokens that are not usually the first token in an
695// unwrapped line. This is used in attempt to distinguish macro calls without
696// trailing semicolons from other constructs split to several lines.
Benjamin Kramer8407df72015-03-09 16:47:52 +0000697static bool tokenCanStartNewLine(const clang::Token &Tok) {
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000698 // Semicolon can be a null-statement, l_square can be a start of a macro or
699 // a C++11 attribute, but this doesn't seem to be common.
700 return Tok.isNot(tok::semi) && Tok.isNot(tok::l_brace) &&
701 Tok.isNot(tok::l_square) &&
702 // Tokens that can only be used as binary operators and a part of
703 // overloaded operator names.
704 Tok.isNot(tok::period) && Tok.isNot(tok::periodstar) &&
705 Tok.isNot(tok::arrow) && Tok.isNot(tok::arrowstar) &&
706 Tok.isNot(tok::less) && Tok.isNot(tok::greater) &&
707 Tok.isNot(tok::slash) && Tok.isNot(tok::percent) &&
708 Tok.isNot(tok::lessless) && Tok.isNot(tok::greatergreater) &&
709 Tok.isNot(tok::equal) && Tok.isNot(tok::plusequal) &&
710 Tok.isNot(tok::minusequal) && Tok.isNot(tok::starequal) &&
711 Tok.isNot(tok::slashequal) && Tok.isNot(tok::percentequal) &&
712 Tok.isNot(tok::ampequal) && Tok.isNot(tok::pipeequal) &&
713 Tok.isNot(tok::caretequal) && Tok.isNot(tok::greatergreaterequal) &&
714 Tok.isNot(tok::lesslessequal) &&
715 // Colon is used in labels, base class lists, initializer lists,
716 // range-based for loops, ternary operator, but should never be the
717 // first token in an unwrapped line.
Daniel Jasper5ebb2f32014-05-21 13:08:17 +0000718 Tok.isNot(tok::colon) &&
719 // 'noexcept' is a trailing annotation.
720 Tok.isNot(tok::kw_noexcept);
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000721}
722
Martin Probst533965c2016-04-19 18:19:06 +0000723static bool mustBeJSIdent(const AdditionalKeywords &Keywords,
724 const FormatToken *FormatTok) {
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000725 // FIXME: This returns true for C/C++ keywords like 'struct'.
726 return FormatTok->is(tok::identifier) &&
727 (FormatTok->Tok.getIdentifierInfo() == nullptr ||
Martin Probst3dbbefa2016-11-10 16:21:02 +0000728 !FormatTok->isOneOf(
729 Keywords.kw_in, Keywords.kw_of, Keywords.kw_as, Keywords.kw_async,
730 Keywords.kw_await, Keywords.kw_yield, Keywords.kw_finally,
731 Keywords.kw_function, Keywords.kw_import, Keywords.kw_is,
732 Keywords.kw_let, Keywords.kw_var, tok::kw_const,
733 Keywords.kw_abstract, Keywords.kw_extends, Keywords.kw_implements,
734 Keywords.kw_instanceof, Keywords.kw_interface,
735 Keywords.kw_throws));
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000736}
737
Martin Probst533965c2016-04-19 18:19:06 +0000738static bool mustBeJSIdentOrValue(const AdditionalKeywords &Keywords,
739 const FormatToken *FormatTok) {
Martin Probstb9316ff2016-09-18 17:21:52 +0000740 return FormatTok->Tok.isLiteral() ||
741 FormatTok->isOneOf(tok::kw_true, tok::kw_false) ||
742 mustBeJSIdent(Keywords, FormatTok);
Martin Probst533965c2016-04-19 18:19:06 +0000743}
744
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000745// isJSDeclOrStmt returns true if |FormatTok| starts a declaration or statement
746// when encountered after a value (see mustBeJSIdentOrValue).
747static bool isJSDeclOrStmt(const AdditionalKeywords &Keywords,
748 const FormatToken *FormatTok) {
749 return FormatTok->isOneOf(
Martin Probst5f8445b2016-04-24 22:05:09 +0000750 tok::kw_return, Keywords.kw_yield,
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000751 // conditionals
752 tok::kw_if, tok::kw_else,
753 // loops
754 tok::kw_for, tok::kw_while, tok::kw_do, tok::kw_continue, tok::kw_break,
755 // switch/case
756 tok::kw_switch, tok::kw_case,
757 // exceptions
758 tok::kw_throw, tok::kw_try, tok::kw_catch, Keywords.kw_finally,
759 // declaration
760 tok::kw_const, tok::kw_class, Keywords.kw_var, Keywords.kw_let,
Martin Probst5f8445b2016-04-24 22:05:09 +0000761 Keywords.kw_async, Keywords.kw_function,
762 // import/export
763 Keywords.kw_import, tok::kw_export);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000764}
765
766// readTokenWithJavaScriptASI reads the next token and terminates the current
767// line if JavaScript Automatic Semicolon Insertion must
768// happen between the current token and the next token.
769//
770// This method is conservative - it cannot cover all edge cases of JavaScript,
771// but only aims to correctly handle certain well known cases. It *must not*
772// return true in speculative cases.
773void UnwrappedLineParser::readTokenWithJavaScriptASI() {
774 FormatToken *Previous = FormatTok;
775 readToken();
776 FormatToken *Next = FormatTok;
777
778 bool IsOnSameLine =
779 CommentsBeforeNextToken.empty()
780 ? Next->NewlinesBefore == 0
781 : CommentsBeforeNextToken.front()->NewlinesBefore == 0;
782 if (IsOnSameLine)
783 return;
784
785 bool PreviousMustBeValue = mustBeJSIdentOrValue(Keywords, Previous);
Martin Probst717f6dc2016-10-21 05:11:38 +0000786 bool PreviousStartsTemplateExpr =
787 Previous->is(TT_TemplateString) && Previous->TokenText.endswith("${");
Martin Probstbbffeac2016-04-11 07:35:57 +0000788 if (PreviousMustBeValue && Line && Line->Tokens.size() > 1) {
789 // If the token before the previous one is an '@', the previous token is an
790 // annotation and can precede another identifier/value.
Benjamin Kramer5ffc24e2016-04-11 12:19:19 +0000791 const FormatToken *PrePrevious = std::prev(Line->Tokens.end(), 2)->Tok;
Martin Probstbbffeac2016-04-11 07:35:57 +0000792 if (PrePrevious->is(tok::at))
793 return;
794 }
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000795 if (Next->is(tok::exclaim) && PreviousMustBeValue)
Martin Probstd40bca42017-01-09 08:56:36 +0000796 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000797 bool NextMustBeValue = mustBeJSIdentOrValue(Keywords, Next);
Martin Probst717f6dc2016-10-21 05:11:38 +0000798 bool NextEndsTemplateExpr =
799 Next->is(TT_TemplateString) && Next->TokenText.startswith("}");
800 if (NextMustBeValue && !NextEndsTemplateExpr && !PreviousStartsTemplateExpr &&
801 (PreviousMustBeValue ||
802 Previous->isOneOf(tok::r_square, tok::r_paren, tok::plusplus,
803 tok::minusminus)))
Martin Probstd40bca42017-01-09 08:56:36 +0000804 return addUnwrappedLine();
Martin Probste6b5b342017-01-16 09:52:40 +0000805 if (PreviousMustBeValue && isJSDeclOrStmt(Keywords, Next))
Martin Probstd40bca42017-01-09 08:56:36 +0000806 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000807}
808
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000809void UnwrappedLineParser::parseStructuralElement() {
Daniel Jasper498f5582015-12-25 08:53:31 +0000810 assert(!FormatTok->is(tok::l_brace));
811 if (Style.Language == FormatStyle::LK_TableGen &&
812 FormatTok->is(tok::pp_include)) {
813 nextToken();
814 if (FormatTok->is(tok::string_literal))
815 nextToken();
816 addUnwrappedLine();
817 return;
818 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000819 switch (FormatTok->Tok.getKind()) {
Nico Weber04e9f1a2013-01-07 19:05:19 +0000820 case tok::at:
821 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000822 if (FormatTok->Tok.is(tok::l_brace)) {
Nico Weber372d8dc2013-02-10 20:35:35 +0000823 parseBracedList();
824 break;
825 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000826 switch (FormatTok->Tok.getObjCKeywordID()) {
Nico Weber04e9f1a2013-01-07 19:05:19 +0000827 case tok::objc_public:
828 case tok::objc_protected:
829 case tok::objc_package:
830 case tok::objc_private:
831 return parseAccessSpecifier();
Nico Weber7eecf4b2013-01-09 20:25:35 +0000832 case tok::objc_interface:
Nico Weber2ce0ac52013-01-09 23:25:37 +0000833 case tok::objc_implementation:
834 return parseObjCInterfaceOrImplementation();
Nico Weber8696a8d2013-01-09 21:15:03 +0000835 case tok::objc_protocol:
836 return parseObjCProtocol();
Nico Weberd8ffe752013-01-09 21:42:32 +0000837 case tok::objc_end:
838 return; // Handled by the caller.
Nico Weber51306d22013-01-10 00:25:19 +0000839 case tok::objc_optional:
840 case tok::objc_required:
841 nextToken();
842 addUnwrappedLine();
843 return;
Nico Weber45c48122015-06-28 01:06:16 +0000844 case tok::objc_autoreleasepool:
845 nextToken();
846 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000847 if (Style.BraceWrapping.AfterObjCDeclaration)
Nico Weber45c48122015-06-28 01:06:16 +0000848 addUnwrappedLine();
849 parseBlock(/*MustBeDeclaration=*/false);
850 }
851 addUnwrappedLine();
852 return;
Nico Weber33381f52015-02-07 01:57:32 +0000853 case tok::objc_try:
854 // This branch isn't strictly necessary (the kw_try case below would
855 // do this too after the tok::at is parsed above). But be explicit.
856 parseTryCatch();
857 return;
Nico Weber04e9f1a2013-01-07 19:05:19 +0000858 default:
859 break;
860 }
861 break;
Daniel Jasper8f463652014-08-26 23:15:12 +0000862 case tok::kw_asm:
Daniel Jasper8f463652014-08-26 23:15:12 +0000863 nextToken();
864 if (FormatTok->is(tok::l_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000865 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper2337f282015-01-12 10:14:56 +0000866 nextToken();
Daniel Jasper4429f142014-08-27 17:16:46 +0000867 while (FormatTok && FormatTok->isNot(tok::eof)) {
Daniel Jasper8f463652014-08-26 23:15:12 +0000868 if (FormatTok->is(tok::r_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000869 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper8f463652014-08-26 23:15:12 +0000870 nextToken();
Daniel Jasper790d4f92015-05-11 11:59:46 +0000871 addUnwrappedLine();
Daniel Jasper8f463652014-08-26 23:15:12 +0000872 break;
873 }
Daniel Jasper2337f282015-01-12 10:14:56 +0000874 FormatTok->Finalized = true;
Daniel Jasper8f463652014-08-26 23:15:12 +0000875 nextToken();
876 }
877 }
878 break;
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000879 case tok::kw_namespace:
880 parseNamespace();
881 return;
Dmitri Gribenko58d64e22012-12-30 21:27:25 +0000882 case tok::kw_inline:
883 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000884 if (FormatTok->Tok.is(tok::kw_namespace)) {
Dmitri Gribenko58d64e22012-12-30 21:27:25 +0000885 parseNamespace();
886 return;
887 }
888 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000889 case tok::kw_public:
890 case tok::kw_protected:
891 case tok::kw_private:
Daniel Jasper83709082015-02-18 17:14:05 +0000892 if (Style.Language == FormatStyle::LK_Java ||
893 Style.Language == FormatStyle::LK_JavaScript)
Daniel Jasperc58c70e2014-09-15 11:21:46 +0000894 nextToken();
895 else
896 parseAccessSpecifier();
Daniel Jasperf7935112012-12-03 18:12:45 +0000897 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000898 case tok::kw_if:
899 parseIfThenElse();
Daniel Jasperf7935112012-12-03 18:12:45 +0000900 return;
Alexander Kornienko37d6c942012-12-05 15:06:06 +0000901 case tok::kw_for:
902 case tok::kw_while:
903 parseForOrWhileLoop();
904 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000905 case tok::kw_do:
906 parseDoWhile();
907 return;
908 case tok::kw_switch:
909 parseSwitch();
910 return;
911 case tok::kw_default:
912 nextToken();
913 parseLabel();
914 return;
915 case tok::kw_case:
916 parseCaseLabel();
917 return;
Daniel Jasper04a71a42014-05-08 11:58:24 +0000918 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +0000919 case tok::kw___try:
Daniel Jasper04a71a42014-05-08 11:58:24 +0000920 parseTryCatch();
921 return;
Manuel Klimekae610d12013-01-21 14:32:05 +0000922 case tok::kw_extern:
923 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000924 if (FormatTok->Tok.is(tok::string_literal)) {
Manuel Klimekae610d12013-01-21 14:32:05 +0000925 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000926 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasper65ee3472013-07-31 23:16:02 +0000927 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/false);
Manuel Klimekae610d12013-01-21 14:32:05 +0000928 addUnwrappedLine();
929 return;
930 }
931 }
Daniel Jaspere1e43192014-04-01 12:55:11 +0000932 break;
Daniel Jasperfca735c2015-02-19 16:14:18 +0000933 case tok::kw_export:
934 if (Style.Language == FormatStyle::LK_JavaScript) {
935 parseJavaScriptEs6ImportExport();
936 return;
937 }
938 break;
Daniel Jaspere1e43192014-04-01 12:55:11 +0000939 case tok::identifier:
Daniel Jasper66cb8c52015-05-04 09:22:29 +0000940 if (FormatTok->is(TT_ForEachMacro)) {
Daniel Jaspere1e43192014-04-01 12:55:11 +0000941 parseForOrWhileLoop();
942 return;
943 }
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000944 if (FormatTok->is(TT_MacroBlockBegin)) {
945 parseBlock(/*MustBeDeclaration=*/false, /*AddLevel=*/true,
946 /*MunchSemi=*/false);
947 return;
948 }
Daniel Jasper3d5a7d62016-06-20 18:20:38 +0000949 if (FormatTok->is(Keywords.kw_import)) {
950 if (Style.Language == FormatStyle::LK_JavaScript) {
951 parseJavaScriptEs6ImportExport();
952 return;
953 }
954 if (Style.Language == FormatStyle::LK_Proto) {
955 nextToken();
Daniel Jasper8b61d142016-06-20 20:39:53 +0000956 if (FormatTok->is(tok::kw_public))
957 nextToken();
Daniel Jasper3d5a7d62016-06-20 18:20:38 +0000958 if (!FormatTok->is(tok::string_literal))
959 return;
960 nextToken();
961 if (FormatTok->is(tok::semi))
962 nextToken();
963 addUnwrappedLine();
964 return;
965 }
Daniel Jasper354aa512015-02-19 16:07:32 +0000966 }
Daniel Jasper1dbc2102017-03-31 13:30:24 +0000967 if (Style.isCpp() &&
Daniel Jasper72b33572017-03-31 12:04:37 +0000968 FormatTok->isOneOf(Keywords.kw_signals, Keywords.kw_qsignals,
Daniel Jaspera00de632015-12-01 12:05:04 +0000969 Keywords.kw_slots, Keywords.kw_qslots)) {
Daniel Jasperde0d1f32015-04-24 07:50:34 +0000970 nextToken();
971 if (FormatTok->is(tok::colon)) {
972 nextToken();
973 addUnwrappedLine();
Daniel Jasper31343832016-07-27 10:13:24 +0000974 return;
Daniel Jasperde0d1f32015-04-24 07:50:34 +0000975 }
Daniel Jasper53395402015-04-07 15:04:40 +0000976 }
Manuel Klimekae610d12013-01-21 14:32:05 +0000977 // In all other cases, parse the declaration.
978 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000979 default:
980 break;
Daniel Jasperf7935112012-12-03 18:12:45 +0000981 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000982 do {
Daniel Jaspera7900ad2016-05-08 18:12:22 +0000983 const FormatToken *Previous = getPreviousToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000984 switch (FormatTok->Tok.getKind()) {
Nico Weber372d8dc2013-02-10 20:35:35 +0000985 case tok::at:
986 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000987 if (FormatTok->Tok.is(tok::l_brace))
Nico Weber372d8dc2013-02-10 20:35:35 +0000988 parseBracedList();
989 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000990 case tok::kw_enum:
Daniel Jaspera7900ad2016-05-08 18:12:22 +0000991 // Ignore if this is part of "template <enum ...".
992 if (Previous && Previous->is(tok::less)) {
993 nextToken();
994 break;
995 }
996
Daniel Jasper90cf3802015-06-17 09:44:02 +0000997 // parseEnum falls through and does not yet add an unwrapped line as an
998 // enum definition can start a structural element.
Daniel Jasper6f5a1932015-12-29 08:54:23 +0000999 if (!parseEnum())
1000 break;
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001001 // This only applies for C++.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001002 if (!Style.isCpp()) {
Daniel Jasper90cf3802015-06-17 09:44:02 +00001003 addUnwrappedLine();
1004 return;
1005 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001006 break;
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001007 case tok::kw_typedef:
1008 nextToken();
Daniel Jasper31f6c542014-12-05 10:42:21 +00001009 if (FormatTok->isOneOf(Keywords.kw_NS_ENUM, Keywords.kw_NS_OPTIONS,
1010 Keywords.kw_CF_ENUM, Keywords.kw_CF_OPTIONS))
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001011 parseEnum();
1012 break;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001013 case tok::kw_struct:
1014 case tok::kw_union:
Manuel Klimek28cacc72013-01-07 18:10:23 +00001015 case tok::kw_class:
Daniel Jasper910807d2015-06-12 04:52:02 +00001016 // parseRecord falls through and does not yet add an unwrapped line as a
1017 // record declaration or definition can start a structural element.
Manuel Klimeke01bab52013-01-15 13:38:33 +00001018 parseRecord();
Daniel Jasper910807d2015-06-12 04:52:02 +00001019 // This does not apply for Java and JavaScript.
1020 if (Style.Language == FormatStyle::LK_Java ||
1021 Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperd5ec65b2016-01-08 07:06:07 +00001022 if (FormatTok->is(tok::semi))
1023 nextToken();
Daniel Jasper910807d2015-06-12 04:52:02 +00001024 addUnwrappedLine();
1025 return;
1026 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00001027 break;
Daniel Jaspere5d74862014-11-26 08:17:08 +00001028 case tok::period:
1029 nextToken();
1030 // In Java, classes have an implicit static member "class".
1031 if (Style.Language == FormatStyle::LK_Java && FormatTok &&
1032 FormatTok->is(tok::kw_class))
1033 nextToken();
Daniel Jasperba52fcb2015-09-28 14:29:45 +00001034 if (Style.Language == FormatStyle::LK_JavaScript && FormatTok &&
1035 FormatTok->Tok.getIdentifierInfo())
1036 // JavaScript only has pseudo keywords, all keywords are allowed to
1037 // appear in "IdentifierName" positions. See http://es5.github.io/#x7.6
1038 nextToken();
Daniel Jaspere5d74862014-11-26 08:17:08 +00001039 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001040 case tok::semi:
1041 nextToken();
1042 addUnwrappedLine();
1043 return;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001044 case tok::r_brace:
1045 addUnwrappedLine();
1046 return;
Daniel Jasperf7935112012-12-03 18:12:45 +00001047 case tok::l_paren:
1048 parseParens();
1049 break;
Daniel Jasper5af04a42015-10-07 03:43:10 +00001050 case tok::kw_operator:
1051 nextToken();
1052 if (FormatTok->isBinaryOperator())
1053 nextToken();
1054 break;
Manuel Klimek516e0542013-09-04 13:25:30 +00001055 case tok::caret:
1056 nextToken();
Daniel Jasper395193c2014-03-28 07:48:59 +00001057 if (FormatTok->Tok.isAnyIdentifier() ||
1058 FormatTok->isSimpleTypeSpecifier())
1059 nextToken();
1060 if (FormatTok->is(tok::l_paren))
1061 parseParens();
1062 if (FormatTok->is(tok::l_brace))
Manuel Klimek516e0542013-09-04 13:25:30 +00001063 parseChildBlock();
Manuel Klimek516e0542013-09-04 13:25:30 +00001064 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001065 case tok::l_brace:
Manuel Klimekab419912013-05-23 09:41:43 +00001066 if (!tryToParseBracedList()) {
1067 // A block outside of parentheses must be the last part of a
1068 // structural element.
1069 // FIXME: Figure out cases where this is not true, and add projections
1070 // for them (the one we know is missing are lambdas).
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001071 if (Style.BraceWrapping.AfterFunction)
Manuel Klimekab419912013-05-23 09:41:43 +00001072 addUnwrappedLine();
Alexander Kornienko3cfa9732013-11-20 16:33:05 +00001073 FormatTok->Type = TT_FunctionLBrace;
Nico Weber9096fc02013-06-26 00:30:14 +00001074 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001075 addUnwrappedLine();
Manuel Klimekab419912013-05-23 09:41:43 +00001076 return;
1077 }
1078 // Otherwise this was a braced init list, and the structural
1079 // element continues.
1080 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001081 case tok::kw_try:
1082 // We arrive here when parsing function-try blocks.
1083 parseTryCatch();
1084 return;
Daniel Jasper40e19212013-05-29 13:16:10 +00001085 case tok::identifier: {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +00001086 if (FormatTok->is(TT_MacroBlockEnd)) {
1087 addUnwrappedLine();
1088 return;
1089 }
1090
Martin Probst973ff792017-04-27 13:07:24 +00001091 // Function declarations (as opposed to function expressions) are parsed
1092 // on their own unwrapped line by continuing this loop. Function
1093 // expressions (functions that are not on their own line) must not create
1094 // a new unwrapped line, so they are special cased below.
1095 size_t TokenCount = Line->Tokens.size();
Daniel Jasper9326f912015-05-05 08:40:32 +00001096 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst973ff792017-04-27 13:07:24 +00001097 FormatTok->is(Keywords.kw_function) &&
1098 (TokenCount > 1 || (TokenCount == 1 && !Line->Tokens.front().Tok->is(
1099 Keywords.kw_async)))) {
Daniel Jasper069e5f42014-05-20 11:14:57 +00001100 tryToParseJSFunction();
1101 break;
1102 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001103 if ((Style.Language == FormatStyle::LK_JavaScript ||
1104 Style.Language == FormatStyle::LK_Java) &&
1105 FormatTok->is(Keywords.kw_interface)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001106 if (Style.Language == FormatStyle::LK_JavaScript) {
1107 // In JavaScript/TypeScript, "interface" can be used as a standalone
1108 // identifier, e.g. in `var interface = 1;`. If "interface" is
1109 // followed by another identifier, it is very like to be an actual
1110 // interface declaration.
1111 unsigned StoredPosition = Tokens->getPosition();
1112 FormatToken *Next = Tokens->getNextToken();
1113 FormatTok = Tokens->setPosition(StoredPosition);
Martin Probst533965c2016-04-19 18:19:06 +00001114 if (Next && !mustBeJSIdent(Keywords, Next)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001115 nextToken();
1116 break;
1117 }
1118 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001119 parseRecord();
Daniel Jasper259188b2015-06-12 04:56:34 +00001120 addUnwrappedLine();
Daniel Jasper5c235c02015-07-06 14:26:04 +00001121 return;
Daniel Jasper9326f912015-05-05 08:40:32 +00001122 }
1123
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00001124 // See if the following token should start a new unwrapped line.
Daniel Jasper9326f912015-05-05 08:40:32 +00001125 StringRef Text = FormatTok->TokenText;
Daniel Jasperf7935112012-12-03 18:12:45 +00001126 nextToken();
Daniel Jasper83709082015-02-18 17:14:05 +00001127 if (Line->Tokens.size() == 1 &&
1128 // JS doesn't have macros, and within classes colons indicate fields,
1129 // not labels.
Daniel Jasper676e5162015-04-07 14:36:33 +00001130 Style.Language != FormatStyle::LK_JavaScript) {
1131 if (FormatTok->Tok.is(tok::colon) && !Line->MustBeDeclaration) {
Daniel Jasper40609472016-04-06 15:02:46 +00001132 Line->Tokens.begin()->Tok->MustBreakBefore = true;
Alexander Kornienkode644272013-04-08 22:16:06 +00001133 parseLabel();
1134 return;
1135 }
Daniel Jasper680b09b2014-11-05 10:48:04 +00001136 // Recognize function-like macro usages without trailing semicolon as
Daniel Jasper83709082015-02-18 17:14:05 +00001137 // well as free-standing macros like Q_OBJECT.
Daniel Jasper680b09b2014-11-05 10:48:04 +00001138 bool FunctionLike = FormatTok->is(tok::l_paren);
1139 if (FunctionLike)
Alexander Kornienkode644272013-04-08 22:16:06 +00001140 parseParens();
Daniel Jaspere60cba12015-05-13 11:35:53 +00001141
1142 bool FollowedByNewline =
1143 CommentsBeforeNextToken.empty()
1144 ? FormatTok->NewlinesBefore > 0
1145 : CommentsBeforeNextToken.front()->NewlinesBefore > 0;
1146
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001147 if (FollowedByNewline && (Text.size() >= 5 || FunctionLike) &&
Daniel Jasper680b09b2014-11-05 10:48:04 +00001148 tokenCanStartNewLine(FormatTok->Tok) && Text == Text.upper()) {
Daniel Jasper40e19212013-05-29 13:16:10 +00001149 addUnwrappedLine();
Daniel Jasper41a0f782013-05-29 14:09:17 +00001150 return;
Alexander Kornienkode644272013-04-08 22:16:06 +00001151 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001152 }
1153 break;
Daniel Jasper40e19212013-05-29 13:16:10 +00001154 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001155 case tok::equal:
Manuel Klimek79e06082015-05-21 12:23:34 +00001156 // Fat arrows (=>) have tok::TokenKind tok::equal but TokenType
1157 // TT_JsFatArrow. The always start an expression or a child block if
1158 // followed by a curly.
1159 if (FormatTok->is(TT_JsFatArrow)) {
1160 nextToken();
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001161 if (FormatTok->is(tok::l_brace))
Manuel Klimek79e06082015-05-21 12:23:34 +00001162 parseChildBlock();
Manuel Klimek79e06082015-05-21 12:23:34 +00001163 break;
1164 }
1165
Daniel Jaspere25509f2012-12-17 11:29:41 +00001166 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001167 if (FormatTok->Tok.is(tok::l_brace)) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001168 parseBracedList();
1169 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001170 break;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001171 case tok::l_square:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001172 parseSquare();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001173 break;
Daniel Jasper6acf5132015-03-12 14:44:29 +00001174 case tok::kw_new:
1175 parseNew();
1176 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001177 default:
1178 nextToken();
1179 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001180 }
1181 } while (!eof());
1182}
1183
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001184bool UnwrappedLineParser::tryToParseLambda() {
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001185 if (!Style.isCpp()) {
Daniel Jasper1feab0f2015-06-02 15:31:37 +00001186 nextToken();
1187 return false;
1188 }
Daniel Jasperb9a49902016-01-09 15:56:28 +00001189 const FormatToken* Previous = getPreviousToken();
1190 if (Previous &&
1191 (Previous->isOneOf(tok::identifier, tok::kw_operator, tok::kw_new,
1192 tok::kw_delete) ||
1193 Previous->closesScope() || Previous->isSimpleTypeSpecifier())) {
Daniel Jasperbf02b2c12013-09-05 11:49:39 +00001194 nextToken();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001195 return false;
Daniel Jasperbf02b2c12013-09-05 11:49:39 +00001196 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001197 assert(FormatTok->is(tok::l_square));
1198 FormatToken &LSquare = *FormatTok;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001199 if (!tryToParseLambdaIntroducer())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001200 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001201
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00001202 while (FormatTok->isNot(tok::l_brace)) {
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001203 if (FormatTok->isSimpleTypeSpecifier()) {
1204 nextToken();
1205 continue;
1206 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001207 switch (FormatTok->Tok.getKind()) {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001208 case tok::l_brace:
1209 break;
1210 case tok::l_paren:
1211 parseParens();
1212 break;
Daniel Jasperbcb55ee2014-11-21 14:08:38 +00001213 case tok::amp:
1214 case tok::star:
1215 case tok::kw_const:
Daniel Jasper3431b752014-12-08 13:22:37 +00001216 case tok::comma:
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001217 case tok::less:
1218 case tok::greater:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001219 case tok::identifier:
Daniel Jasper5eaa0092015-08-13 13:37:08 +00001220 case tok::numeric_constant:
Daniel Jasper1067ab02014-02-11 10:16:55 +00001221 case tok::coloncolon:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001222 case tok::kw_mutable:
Daniel Jasper81a20782014-03-10 10:02:02 +00001223 nextToken();
1224 break;
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001225 case tok::arrow:
Daniel Jasper6f2b88a2015-06-05 13:18:09 +00001226 FormatTok->Type = TT_LambdaArrow;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001227 nextToken();
1228 break;
1229 default:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001230 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001231 }
1232 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001233 LSquare.Type = TT_LambdaLSquare;
Manuel Klimek516e0542013-09-04 13:25:30 +00001234 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001235 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001236}
1237
1238bool UnwrappedLineParser::tryToParseLambdaIntroducer() {
1239 nextToken();
1240 if (FormatTok->is(tok::equal)) {
1241 nextToken();
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001242 if (FormatTok->is(tok::r_square)) {
1243 nextToken();
1244 return true;
1245 }
1246 if (FormatTok->isNot(tok::comma))
1247 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001248 nextToken();
1249 } else if (FormatTok->is(tok::amp)) {
1250 nextToken();
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001251 if (FormatTok->is(tok::r_square)) {
1252 nextToken();
1253 return true;
1254 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001255 if (!FormatTok->isOneOf(tok::comma, tok::identifier)) {
1256 return false;
1257 }
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001258 if (FormatTok->is(tok::comma))
1259 nextToken();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001260 } else if (FormatTok->is(tok::r_square)) {
1261 nextToken();
1262 return true;
1263 }
1264 do {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001265 if (FormatTok->is(tok::amp))
1266 nextToken();
1267 if (!FormatTok->isOneOf(tok::identifier, tok::kw_this))
1268 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001269 nextToken();
Daniel Jasperda18fd82014-06-10 06:39:03 +00001270 if (FormatTok->is(tok::ellipsis))
1271 nextToken();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001272 if (FormatTok->is(tok::comma)) {
1273 nextToken();
1274 } else if (FormatTok->is(tok::r_square)) {
1275 nextToken();
1276 return true;
1277 } else {
1278 return false;
1279 }
1280 } while (!eof());
1281 return false;
1282}
1283
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001284void UnwrappedLineParser::tryToParseJSFunction() {
Martin Probst409697e2016-05-29 14:41:07 +00001285 assert(FormatTok->is(Keywords.kw_function) ||
1286 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function));
Martin Probst5f8445b2016-04-24 22:05:09 +00001287 if (FormatTok->is(Keywords.kw_async))
1288 nextToken();
1289 // Consume "function".
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001290 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001291
Daniel Jasper71e50af2016-11-01 06:22:59 +00001292 // Consume * (generator function). Treat it like C++'s overloaded operators.
1293 if (FormatTok->is(tok::star)) {
1294 FormatTok->Type = TT_OverloadedOperator;
Martin Probst5f8445b2016-04-24 22:05:09 +00001295 nextToken();
Daniel Jasper71e50af2016-11-01 06:22:59 +00001296 }
Martin Probst5f8445b2016-04-24 22:05:09 +00001297
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001298 // Consume function name.
1299 if (FormatTok->is(tok::identifier))
Daniel Jasperfca735c2015-02-19 16:14:18 +00001300 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001301
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001302 if (FormatTok->isNot(tok::l_paren))
1303 return;
Manuel Klimek79e06082015-05-21 12:23:34 +00001304
1305 // Parse formal parameter list.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001306 parseParens();
Manuel Klimek79e06082015-05-21 12:23:34 +00001307
1308 if (FormatTok->is(tok::colon)) {
1309 // Parse a type definition.
1310 nextToken();
1311
1312 // Eat the type declaration. For braced inline object types, balance braces,
1313 // otherwise just parse until finding an l_brace for the function body.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001314 if (FormatTok->is(tok::l_brace))
1315 tryToParseBracedList();
1316 else
Martin Probstaf16c502017-01-04 13:36:43 +00001317 while (!FormatTok->isOneOf(tok::l_brace, tok::semi) && !eof())
Manuel Klimek79e06082015-05-21 12:23:34 +00001318 nextToken();
Manuel Klimek79e06082015-05-21 12:23:34 +00001319 }
1320
Martin Probstaf16c502017-01-04 13:36:43 +00001321 if (FormatTok->is(tok::semi))
1322 return;
1323
Manuel Klimek79e06082015-05-21 12:23:34 +00001324 parseChildBlock();
1325}
1326
Daniel Jasper3c883d12015-05-18 14:49:19 +00001327bool UnwrappedLineParser::tryToParseBracedList() {
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001328 if (FormatTok->BlockKind == BK_Unknown)
Daniel Jasper3c883d12015-05-18 14:49:19 +00001329 calculateBraceTypes();
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001330 assert(FormatTok->BlockKind != BK_Unknown);
1331 if (FormatTok->BlockKind == BK_Block)
Manuel Klimekab419912013-05-23 09:41:43 +00001332 return false;
1333 parseBracedList();
1334 return true;
1335}
1336
Daniel Jasper015ed022013-09-13 09:20:45 +00001337bool UnwrappedLineParser::parseBracedList(bool ContinueOnSemicolons) {
1338 bool HasError = false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001339 nextToken();
1340
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001341 // FIXME: Once we have an expression parser in the UnwrappedLineParser,
1342 // replace this by using parseAssigmentExpression() inside.
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001343 do {
Manuel Klimek79e06082015-05-21 12:23:34 +00001344 if (Style.Language == FormatStyle::LK_JavaScript) {
Martin Probst409697e2016-05-29 14:41:07 +00001345 if (FormatTok->is(Keywords.kw_function) ||
1346 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001347 tryToParseJSFunction();
1348 continue;
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001349 }
1350 if (FormatTok->is(TT_JsFatArrow)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001351 nextToken();
1352 // Fat arrows can be followed by simple expressions or by child blocks
1353 // in curly braces.
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001354 if (FormatTok->is(tok::l_brace)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001355 parseChildBlock();
1356 continue;
1357 }
1358 }
Martin Probst8e3eba02017-02-07 16:33:13 +00001359 if (FormatTok->is(tok::l_brace)) {
1360 // Could be a method inside of a braced list `{a() { return 1; }}`.
1361 if (tryToParseBracedList())
1362 continue;
1363 parseChildBlock();
1364 }
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001365 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001366 switch (FormatTok->Tok.getKind()) {
Manuel Klimek516e0542013-09-04 13:25:30 +00001367 case tok::caret:
1368 nextToken();
1369 if (FormatTok->is(tok::l_brace)) {
1370 parseChildBlock();
1371 }
1372 break;
1373 case tok::l_square:
1374 tryToParseLambda();
1375 break;
Daniel Jaspera87af7a2015-06-30 11:32:22 +00001376 case tok::l_paren:
1377 parseParens();
Daniel Jasperf46dec82015-03-31 14:34:15 +00001378 // JavaScript can just have free standing methods and getters/setters in
1379 // object literals. Detect them by a "{" following ")".
1380 if (Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperf46dec82015-03-31 14:34:15 +00001381 if (FormatTok->is(tok::l_brace))
1382 parseChildBlock();
1383 break;
1384 }
Daniel Jasperf46dec82015-03-31 14:34:15 +00001385 break;
Martin Probst8e3eba02017-02-07 16:33:13 +00001386 case tok::l_brace:
1387 // Assume there are no blocks inside a braced init list apart
1388 // from the ones we explicitly parse out (like lambdas).
1389 FormatTok->BlockKind = BK_BracedInit;
1390 parseBracedList();
1391 break;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001392 case tok::r_brace:
1393 nextToken();
Daniel Jasper015ed022013-09-13 09:20:45 +00001394 return !HasError;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001395 case tok::semi:
Daniel Jasperb9a49902016-01-09 15:56:28 +00001396 // JavaScript (or more precisely TypeScript) can have semicolons in braced
1397 // lists (in so-called TypeMemberLists). Thus, the semicolon cannot be
1398 // used for error recovery if we have otherwise determined that this is
1399 // a braced list.
1400 if (Style.Language == FormatStyle::LK_JavaScript) {
1401 nextToken();
1402 break;
1403 }
Daniel Jasper015ed022013-09-13 09:20:45 +00001404 HasError = true;
1405 if (!ContinueOnSemicolons)
1406 return !HasError;
1407 nextToken();
1408 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001409 case tok::comma:
1410 nextToken();
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001411 break;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001412 default:
1413 nextToken();
1414 break;
1415 }
1416 } while (!eof());
Daniel Jasper015ed022013-09-13 09:20:45 +00001417 return false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001418}
1419
Daniel Jasperf7935112012-12-03 18:12:45 +00001420void UnwrappedLineParser::parseParens() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001421 assert(FormatTok->Tok.is(tok::l_paren) && "'(' expected.");
Daniel Jasperf7935112012-12-03 18:12:45 +00001422 nextToken();
1423 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001424 switch (FormatTok->Tok.getKind()) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001425 case tok::l_paren:
1426 parseParens();
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001427 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_brace))
1428 parseChildBlock();
Daniel Jasperf7935112012-12-03 18:12:45 +00001429 break;
1430 case tok::r_paren:
1431 nextToken();
1432 return;
Daniel Jasper393564f2013-05-31 14:56:29 +00001433 case tok::r_brace:
1434 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1435 return;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001436 case tok::l_square:
1437 tryToParseLambda();
1438 break;
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001439 case tok::l_brace:
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001440 if (!tryToParseBracedList())
Manuel Klimekf017dc02013-09-04 13:34:14 +00001441 parseChildBlock();
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001442 break;
Nico Weber372d8dc2013-02-10 20:35:35 +00001443 case tok::at:
1444 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001445 if (FormatTok->Tok.is(tok::l_brace))
Nico Weber372d8dc2013-02-10 20:35:35 +00001446 parseBracedList();
1447 break;
Martin Probst1027fb82017-02-07 14:05:30 +00001448 case tok::kw_class:
1449 if (Style.Language == FormatStyle::LK_JavaScript)
1450 parseRecord(/*ParseAsExpr=*/true);
1451 else
1452 nextToken();
1453 break;
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001454 case tok::identifier:
1455 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst409697e2016-05-29 14:41:07 +00001456 (FormatTok->is(Keywords.kw_function) ||
1457 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)))
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001458 tryToParseJSFunction();
1459 else
1460 nextToken();
1461 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001462 default:
1463 nextToken();
1464 break;
1465 }
1466 } while (!eof());
1467}
1468
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001469void UnwrappedLineParser::parseSquare() {
1470 assert(FormatTok->Tok.is(tok::l_square) && "'[' expected.");
1471 if (tryToParseLambda())
1472 return;
1473 do {
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001474 switch (FormatTok->Tok.getKind()) {
1475 case tok::l_paren:
1476 parseParens();
1477 break;
1478 case tok::r_square:
1479 nextToken();
1480 return;
1481 case tok::r_brace:
1482 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1483 return;
1484 case tok::l_square:
1485 parseSquare();
1486 break;
1487 case tok::l_brace: {
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001488 if (!tryToParseBracedList())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001489 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001490 break;
1491 }
1492 case tok::at:
1493 nextToken();
1494 if (FormatTok->Tok.is(tok::l_brace))
1495 parseBracedList();
1496 break;
1497 default:
1498 nextToken();
1499 break;
1500 }
1501 } while (!eof());
1502}
1503
Daniel Jasperf7935112012-12-03 18:12:45 +00001504void UnwrappedLineParser::parseIfThenElse() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001505 assert(FormatTok->Tok.is(tok::kw_if) && "'if' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001506 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001507 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimekadededf2013-01-11 18:28:36 +00001508 parseParens();
Daniel Jasperf7935112012-12-03 18:12:45 +00001509 bool NeedsUnwrappedLine = false;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001510 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001511 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001512 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001513 if (Style.BraceWrapping.BeforeElse)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001514 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001515 else
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001516 NeedsUnwrappedLine = true;
Daniel Jasperf7935112012-12-03 18:12:45 +00001517 } else {
1518 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001519 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001520 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001521 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001522 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001523 if (FormatTok->Tok.is(tok::kw_else)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001524 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001525 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001526 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001527 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001528 addUnwrappedLine();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001529 } else if (FormatTok->Tok.is(tok::kw_if)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001530 parseIfThenElse();
1531 } else {
1532 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001533 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001534 parseStructuralElement();
Daniel Jasper451544a2016-05-19 06:30:48 +00001535 if (FormatTok->is(tok::eof))
1536 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001537 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001538 }
1539 } else if (NeedsUnwrappedLine) {
1540 addUnwrappedLine();
1541 }
1542}
1543
Daniel Jasper04a71a42014-05-08 11:58:24 +00001544void UnwrappedLineParser::parseTryCatch() {
Nico Weberfac23712015-02-04 15:26:27 +00001545 assert(FormatTok->isOneOf(tok::kw_try, tok::kw___try) && "'try' expected");
Daniel Jasper04a71a42014-05-08 11:58:24 +00001546 nextToken();
1547 bool NeedsUnwrappedLine = false;
1548 if (FormatTok->is(tok::colon)) {
1549 // We are in a function try block, what comes is an initializer list.
1550 nextToken();
1551 while (FormatTok->is(tok::identifier)) {
1552 nextToken();
1553 if (FormatTok->is(tok::l_paren))
1554 parseParens();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001555 if (FormatTok->is(tok::comma))
1556 nextToken();
1557 }
1558 }
Daniel Jaspere189d462015-01-14 10:48:41 +00001559 // Parse try with resource.
1560 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_paren)) {
1561 parseParens();
1562 }
Daniel Jasper04a71a42014-05-08 11:58:24 +00001563 if (FormatTok->is(tok::l_brace)) {
1564 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1565 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001566 if (Style.BraceWrapping.BeforeCatch) {
Daniel Jasper04a71a42014-05-08 11:58:24 +00001567 addUnwrappedLine();
1568 } else {
1569 NeedsUnwrappedLine = true;
1570 }
1571 } else if (!FormatTok->is(tok::kw_catch)) {
1572 // The C++ standard requires a compound-statement after a try.
1573 // If there's none, we try to assume there's a structuralElement
1574 // and try to continue.
Daniel Jasper04a71a42014-05-08 11:58:24 +00001575 addUnwrappedLine();
1576 ++Line->Level;
1577 parseStructuralElement();
1578 --Line->Level;
1579 }
Nico Weber33381f52015-02-07 01:57:32 +00001580 while (1) {
1581 if (FormatTok->is(tok::at))
1582 nextToken();
1583 if (!(FormatTok->isOneOf(tok::kw_catch, Keywords.kw___except,
1584 tok::kw___finally) ||
1585 ((Style.Language == FormatStyle::LK_Java ||
1586 Style.Language == FormatStyle::LK_JavaScript) &&
1587 FormatTok->is(Keywords.kw_finally)) ||
1588 (FormatTok->Tok.isObjCAtKeyword(tok::objc_catch) ||
1589 FormatTok->Tok.isObjCAtKeyword(tok::objc_finally))))
1590 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001591 nextToken();
1592 while (FormatTok->isNot(tok::l_brace)) {
1593 if (FormatTok->is(tok::l_paren)) {
1594 parseParens();
1595 continue;
1596 }
Daniel Jasper2bd7a642015-01-19 10:50:51 +00001597 if (FormatTok->isOneOf(tok::semi, tok::r_brace, tok::eof))
Daniel Jasper04a71a42014-05-08 11:58:24 +00001598 return;
1599 nextToken();
1600 }
1601 NeedsUnwrappedLine = false;
1602 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1603 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001604 if (Style.BraceWrapping.BeforeCatch)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001605 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001606 else
Daniel Jasper04a71a42014-05-08 11:58:24 +00001607 NeedsUnwrappedLine = true;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001608 }
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001609 if (NeedsUnwrappedLine)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001610 addUnwrappedLine();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001611}
1612
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001613void UnwrappedLineParser::parseNamespace() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001614 assert(FormatTok->Tok.is(tok::kw_namespace) && "'namespace' expected");
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001615
1616 const FormatToken &InitialToken = *FormatTok;
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001617 nextToken();
Saleem Abdulrasool328085f2015-10-30 05:07:56 +00001618 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon))
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001619 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001620 if (FormatTok->Tok.is(tok::l_brace)) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001621 if (ShouldBreakBeforeBrace(Style, InitialToken))
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001622 addUnwrappedLine();
1623
Daniel Jasper65ee3472013-07-31 23:16:02 +00001624 bool AddLevel = Style.NamespaceIndentation == FormatStyle::NI_All ||
1625 (Style.NamespaceIndentation == FormatStyle::NI_Inner &&
1626 DeclarationScopeStack.size() > 1);
1627 parseBlock(/*MustBeDeclaration=*/true, AddLevel);
Manuel Klimek046b9302013-02-06 16:08:09 +00001628 // Munch the semicolon after a namespace. This is more common than one would
1629 // think. Puttin the semicolon into its own line is very ugly.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001630 if (FormatTok->Tok.is(tok::semi))
Manuel Klimek046b9302013-02-06 16:08:09 +00001631 nextToken();
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001632 addUnwrappedLine();
1633 }
1634 // FIXME: Add error handling.
1635}
1636
Daniel Jasper6acf5132015-03-12 14:44:29 +00001637void UnwrappedLineParser::parseNew() {
1638 assert(FormatTok->is(tok::kw_new) && "'new' expected");
1639 nextToken();
1640 if (Style.Language != FormatStyle::LK_Java)
1641 return;
1642
1643 // In Java, we can parse everything up to the parens, which aren't optional.
1644 do {
1645 // There should not be a ;, { or } before the new's open paren.
1646 if (FormatTok->isOneOf(tok::semi, tok::l_brace, tok::r_brace))
1647 return;
1648
1649 // Consume the parens.
1650 if (FormatTok->is(tok::l_paren)) {
1651 parseParens();
1652
1653 // If there is a class body of an anonymous class, consume that as child.
1654 if (FormatTok->is(tok::l_brace))
1655 parseChildBlock();
1656 return;
1657 }
1658 nextToken();
1659 } while (!eof());
1660}
1661
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001662void UnwrappedLineParser::parseForOrWhileLoop() {
Daniel Jasper66cb8c52015-05-04 09:22:29 +00001663 assert(FormatTok->isOneOf(tok::kw_for, tok::kw_while, TT_ForEachMacro) &&
Daniel Jaspere1e43192014-04-01 12:55:11 +00001664 "'for', 'while' or foreach macro expected");
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001665 nextToken();
Martin Probsta050f412017-05-18 21:19:29 +00001666 // JS' for await ( ...
Martin Probstbd49e322017-05-15 19:33:20 +00001667 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probsta050f412017-05-18 21:19:29 +00001668 FormatTok->is(Keywords.kw_await))
Martin Probstbd49e322017-05-15 19:33:20 +00001669 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001670 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001671 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001672 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001673 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001674 parseBlock(/*MustBeDeclaration=*/false);
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001675 addUnwrappedLine();
1676 } else {
1677 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001678 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001679 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001680 --Line->Level;
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001681 }
1682}
1683
Daniel Jasperf7935112012-12-03 18:12:45 +00001684void UnwrappedLineParser::parseDoWhile() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001685 assert(FormatTok->Tok.is(tok::kw_do) && "'do' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001686 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001687 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001688 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001689 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001690 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001691 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001692 } else {
1693 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001694 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001695 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001696 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001697 }
1698
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001699 // FIXME: Add error handling.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001700 if (!FormatTok->Tok.is(tok::kw_while)) {
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001701 addUnwrappedLine();
1702 return;
1703 }
1704
Daniel Jasperf7935112012-12-03 18:12:45 +00001705 nextToken();
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001706 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +00001707}
1708
1709void UnwrappedLineParser::parseLabel() {
Daniel Jasperf7935112012-12-03 18:12:45 +00001710 nextToken();
Manuel Klimek52b15152013-01-09 15:25:02 +00001711 unsigned OldLineLevel = Line->Level;
Daniel Jaspera1275122013-03-20 10:23:53 +00001712 if (Line->Level > 1 || (!Line->InPPDirective && Line->Level > 0))
Manuel Klimek52b15152013-01-09 15:25:02 +00001713 --Line->Level;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001714 if (CommentsBeforeNextToken.empty() && FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001715 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001716 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001717 if (FormatTok->Tok.is(tok::kw_break)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001718 if (Style.BraceWrapping.AfterControlStatement)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001719 addUnwrappedLine();
1720 parseStructuralElement();
1721 }
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001722 addUnwrappedLine();
1723 } else {
Daniel Jasper1fe0d5c2015-05-06 15:19:47 +00001724 if (FormatTok->is(tok::semi))
1725 nextToken();
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001726 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001727 }
Manuel Klimek52b15152013-01-09 15:25:02 +00001728 Line->Level = OldLineLevel;
Daniel Jasper2cce7b72016-04-06 16:41:39 +00001729 if (FormatTok->isNot(tok::l_brace)) {
Daniel Jasper40609472016-04-06 15:02:46 +00001730 parseStructuralElement();
Daniel Jasper2cce7b72016-04-06 16:41:39 +00001731 addUnwrappedLine();
1732 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001733}
1734
1735void UnwrappedLineParser::parseCaseLabel() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001736 assert(FormatTok->Tok.is(tok::kw_case) && "'case' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001737 // FIXME: fix handling of complex expressions here.
1738 do {
1739 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001740 } while (!eof() && !FormatTok->Tok.is(tok::colon));
Daniel Jasperf7935112012-12-03 18:12:45 +00001741 parseLabel();
1742}
1743
1744void UnwrappedLineParser::parseSwitch() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001745 assert(FormatTok->Tok.is(tok::kw_switch) && "'switch' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001746 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001747 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001748 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001749 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001750 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Daniel Jasper65ee3472013-07-31 23:16:02 +00001751 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001752 addUnwrappedLine();
1753 } else {
1754 addUnwrappedLine();
Daniel Jasper516d7972013-07-25 11:31:57 +00001755 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001756 parseStructuralElement();
Daniel Jasper516d7972013-07-25 11:31:57 +00001757 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001758 }
1759}
1760
1761void UnwrappedLineParser::parseAccessSpecifier() {
1762 nextToken();
Daniel Jasper84c47a12013-11-23 17:53:41 +00001763 // Understand Qt's slots.
Daniel Jasper53395402015-04-07 15:04:40 +00001764 if (FormatTok->isOneOf(Keywords.kw_slots, Keywords.kw_qslots))
Daniel Jasper84c47a12013-11-23 17:53:41 +00001765 nextToken();
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00001766 // Otherwise, we don't know what it is, and we'd better keep the next token.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001767 if (FormatTok->Tok.is(tok::colon))
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00001768 nextToken();
Daniel Jasperf7935112012-12-03 18:12:45 +00001769 addUnwrappedLine();
1770}
1771
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001772bool UnwrappedLineParser::parseEnum() {
Daniel Jasper6be0f552014-11-13 15:56:28 +00001773 // Won't be 'enum' for NS_ENUMs.
1774 if (FormatTok->Tok.is(tok::kw_enum))
Daniel Jasperccb68b42014-11-19 22:38:18 +00001775 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001776
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001777 // In TypeScript, "enum" can also be used as property name, e.g. in interface
1778 // declarations. An "enum" keyword followed by a colon would be a syntax
1779 // error and thus assume it is just an identifier.
Daniel Jasper87379302016-02-03 05:33:44 +00001780 if (Style.Language == FormatStyle::LK_JavaScript &&
1781 FormatTok->isOneOf(tok::colon, tok::question))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001782 return false;
1783
Daniel Jasper2b41a822013-08-20 12:42:50 +00001784 // Eat up enum class ...
Daniel Jasperb05a81d2014-05-09 13:11:16 +00001785 if (FormatTok->Tok.is(tok::kw_class) || FormatTok->Tok.is(tok::kw_struct))
1786 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001787
Daniel Jasper786a5502013-09-06 21:32:35 +00001788 while (FormatTok->Tok.getIdentifierInfo() ||
Daniel Jasperccb68b42014-11-19 22:38:18 +00001789 FormatTok->isOneOf(tok::colon, tok::coloncolon, tok::less,
1790 tok::greater, tok::comma, tok::question)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00001791 nextToken();
1792 // We can have macros or attributes in between 'enum' and the enum name.
Daniel Jasperccb68b42014-11-19 22:38:18 +00001793 if (FormatTok->is(tok::l_paren))
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001794 parseParens();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001795 if (FormatTok->is(tok::identifier)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00001796 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001797 // If there are two identifiers in a row, this is likely an elaborate
1798 // return type. In Java, this can be "implements", etc.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001799 if (Style.isCpp() && FormatTok->is(tok::identifier))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001800 return false;
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001801 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001802 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00001803
1804 // Just a declaration or something is wrong.
Daniel Jasperccb68b42014-11-19 22:38:18 +00001805 if (FormatTok->isNot(tok::l_brace))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001806 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00001807 FormatTok->BlockKind = BK_Block;
1808
1809 if (Style.Language == FormatStyle::LK_Java) {
1810 // Java enums are different.
1811 parseJavaEnumBody();
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001812 return true;
1813 }
1814 if (Style.Language == FormatStyle::LK_Proto) {
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001815 parseBlock(/*MustBeDeclaration=*/true);
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001816 return true;
Manuel Klimek2cec0192013-01-21 19:17:52 +00001817 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00001818
1819 // Parse enum body.
1820 bool HasError = !parseBracedList(/*ContinueOnSemicolons=*/true);
1821 if (HasError) {
1822 if (FormatTok->is(tok::semi))
1823 nextToken();
1824 addUnwrappedLine();
1825 }
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001826 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00001827
Daniel Jasper90cf3802015-06-17 09:44:02 +00001828 // There is no addUnwrappedLine() here so that we fall through to parsing a
1829 // structural element afterwards. Thus, in "enum A {} n, m;",
Manuel Klimek2cec0192013-01-21 19:17:52 +00001830 // "} n, m;" will end up in one unwrapped line.
Daniel Jasper6be0f552014-11-13 15:56:28 +00001831}
1832
1833void UnwrappedLineParser::parseJavaEnumBody() {
1834 // Determine whether the enum is simple, i.e. does not have a semicolon or
1835 // constants with class bodies. Simple enums can be formatted like braced
1836 // lists, contracted to a single line, etc.
1837 unsigned StoredPosition = Tokens->getPosition();
1838 bool IsSimple = true;
1839 FormatToken *Tok = Tokens->getNextToken();
1840 while (Tok) {
1841 if (Tok->is(tok::r_brace))
1842 break;
1843 if (Tok->isOneOf(tok::l_brace, tok::semi)) {
1844 IsSimple = false;
1845 break;
1846 }
1847 // FIXME: This will also mark enums with braces in the arguments to enum
1848 // constants as "not simple". This is probably fine in practice, though.
1849 Tok = Tokens->getNextToken();
1850 }
1851 FormatTok = Tokens->setPosition(StoredPosition);
1852
1853 if (IsSimple) {
1854 parseBracedList();
Daniel Jasperdf2ff002014-11-02 22:31:39 +00001855 addUnwrappedLine();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001856 return;
1857 }
1858
1859 // Parse the body of a more complex enum.
1860 // First add a line for everything up to the "{".
1861 nextToken();
1862 addUnwrappedLine();
1863 ++Line->Level;
1864
1865 // Parse the enum constants.
1866 while (FormatTok) {
1867 if (FormatTok->is(tok::l_brace)) {
1868 // Parse the constant's class body.
1869 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
1870 /*MunchSemi=*/false);
1871 } else if (FormatTok->is(tok::l_paren)) {
1872 parseParens();
1873 } else if (FormatTok->is(tok::comma)) {
1874 nextToken();
1875 addUnwrappedLine();
1876 } else if (FormatTok->is(tok::semi)) {
1877 nextToken();
1878 addUnwrappedLine();
1879 break;
1880 } else if (FormatTok->is(tok::r_brace)) {
1881 addUnwrappedLine();
1882 break;
1883 } else {
1884 nextToken();
1885 }
1886 }
1887
1888 // Parse the class body after the enum's ";" if any.
1889 parseLevel(/*HasOpeningBrace=*/true);
1890 nextToken();
1891 --Line->Level;
1892 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001893}
1894
Martin Probst1027fb82017-02-07 14:05:30 +00001895void UnwrappedLineParser::parseRecord(bool ParseAsExpr) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001896 const FormatToken &InitialToken = *FormatTok;
Manuel Klimek28cacc72013-01-07 18:10:23 +00001897 nextToken();
Daniel Jasper04785d02015-05-06 14:03:02 +00001898
Daniel Jasper04785d02015-05-06 14:03:02 +00001899 // The actual identifier can be a nested name specifier, and in macros
1900 // it is often token-pasted.
1901 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon, tok::hashhash,
1902 tok::kw___attribute, tok::kw___declspec,
1903 tok::kw_alignas) ||
1904 ((Style.Language == FormatStyle::LK_Java ||
1905 Style.Language == FormatStyle::LK_JavaScript) &&
1906 FormatTok->isOneOf(tok::period, tok::comma))) {
1907 bool IsNonMacroIdentifier =
1908 FormatTok->is(tok::identifier) &&
1909 FormatTok->TokenText != FormatTok->TokenText.upper();
Manuel Klimeke01bab52013-01-15 13:38:33 +00001910 nextToken();
1911 // We can have macros or attributes in between 'class' and the class name.
Daniel Jasper04785d02015-05-06 14:03:02 +00001912 if (!IsNonMacroIdentifier && FormatTok->Tok.is(tok::l_paren))
Manuel Klimeke01bab52013-01-15 13:38:33 +00001913 parseParens();
Daniel Jasper04785d02015-05-06 14:03:02 +00001914 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00001915
Daniel Jasper04785d02015-05-06 14:03:02 +00001916 // Note that parsing away template declarations here leads to incorrectly
1917 // accepting function declarations as record declarations.
1918 // In general, we cannot solve this problem. Consider:
1919 // class A<int> B() {}
1920 // which can be a function definition or a class definition when B() is a
1921 // macro. If we find enough real-world cases where this is a problem, we
1922 // can parse for the 'template' keyword in the beginning of the statement,
1923 // and thus rule out the record production in case there is no template
1924 // (this would still leave us with an ambiguity between template function
1925 // and class declarations).
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001926 if (FormatTok->isOneOf(tok::colon, tok::less)) {
1927 while (!eof()) {
Daniel Jasper3c883d12015-05-18 14:49:19 +00001928 if (FormatTok->is(tok::l_brace)) {
1929 calculateBraceTypes(/*ExpectClassBody=*/true);
1930 if (!tryToParseBracedList())
1931 break;
1932 }
Daniel Jasper04785d02015-05-06 14:03:02 +00001933 if (FormatTok->Tok.is(tok::semi))
1934 return;
1935 nextToken();
Manuel Klimeke01bab52013-01-15 13:38:33 +00001936 }
1937 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001938 if (FormatTok->Tok.is(tok::l_brace)) {
Martin Probst1027fb82017-02-07 14:05:30 +00001939 if (ParseAsExpr) {
1940 parseChildBlock();
1941 } else {
1942 if (ShouldBreakBeforeBrace(Style, InitialToken))
1943 addUnwrappedLine();
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001944
Martin Probst1027fb82017-02-07 14:05:30 +00001945 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
1946 /*MunchSemi=*/false);
1947 }
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001948 }
Daniel Jasper90cf3802015-06-17 09:44:02 +00001949 // There is no addUnwrappedLine() here so that we fall through to parsing a
1950 // structural element afterwards. Thus, in "class A {} n, m;",
1951 // "} n, m;" will end up in one unwrapped line.
Manuel Klimek28cacc72013-01-07 18:10:23 +00001952}
1953
Nico Weber8696a8d2013-01-09 21:15:03 +00001954void UnwrappedLineParser::parseObjCProtocolList() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001955 assert(FormatTok->Tok.is(tok::less) && "'<' expected.");
Nico Weber8696a8d2013-01-09 21:15:03 +00001956 do
1957 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001958 while (!eof() && FormatTok->Tok.isNot(tok::greater));
Nico Weber8696a8d2013-01-09 21:15:03 +00001959 nextToken(); // Skip '>'.
1960}
1961
1962void UnwrappedLineParser::parseObjCUntilAtEnd() {
1963 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001964 if (FormatTok->Tok.isObjCAtKeyword(tok::objc_end)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00001965 nextToken();
1966 addUnwrappedLine();
1967 break;
1968 }
Daniel Jaspera15da302013-08-28 08:04:23 +00001969 if (FormatTok->is(tok::l_brace)) {
1970 parseBlock(/*MustBeDeclaration=*/false);
1971 // In ObjC interfaces, nothing should be following the "}".
1972 addUnwrappedLine();
Benjamin Kramere21cb742014-01-08 15:59:42 +00001973 } else if (FormatTok->is(tok::r_brace)) {
1974 // Ignore stray "}". parseStructuralElement doesn't consume them.
1975 nextToken();
1976 addUnwrappedLine();
Daniel Jaspera15da302013-08-28 08:04:23 +00001977 } else {
1978 parseStructuralElement();
1979 }
Nico Weber8696a8d2013-01-09 21:15:03 +00001980 } while (!eof());
1981}
1982
Nico Weber2ce0ac52013-01-09 23:25:37 +00001983void UnwrappedLineParser::parseObjCInterfaceOrImplementation() {
Nico Weber7eecf4b2013-01-09 20:25:35 +00001984 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00001985 nextToken(); // interface name
Nico Weber7eecf4b2013-01-09 20:25:35 +00001986
1987 // @interface can be followed by either a base class, or a category.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001988 if (FormatTok->Tok.is(tok::colon)) {
Nico Weber7eecf4b2013-01-09 20:25:35 +00001989 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00001990 nextToken(); // base class name
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001991 } else if (FormatTok->Tok.is(tok::l_paren))
Nico Weber7eecf4b2013-01-09 20:25:35 +00001992 // Skip category, if present.
1993 parseParens();
1994
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001995 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00001996 parseObjCProtocolList();
Nico Weber7eecf4b2013-01-09 20:25:35 +00001997
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00001998 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001999 if (Style.BraceWrapping.AfterObjCDeclaration)
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002000 addUnwrappedLine();
Nico Weber9096fc02013-06-26 00:30:14 +00002001 parseBlock(/*MustBeDeclaration=*/true);
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002002 }
Nico Weber7eecf4b2013-01-09 20:25:35 +00002003
2004 // With instance variables, this puts '}' on its own line. Without instance
2005 // variables, this ends the @interface line.
2006 addUnwrappedLine();
2007
Nico Weber8696a8d2013-01-09 21:15:03 +00002008 parseObjCUntilAtEnd();
2009}
Nico Weber7eecf4b2013-01-09 20:25:35 +00002010
Nico Weber8696a8d2013-01-09 21:15:03 +00002011void UnwrappedLineParser::parseObjCProtocol() {
2012 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002013 nextToken(); // protocol name
Nico Weber8696a8d2013-01-09 21:15:03 +00002014
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002015 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002016 parseObjCProtocolList();
2017
2018 // Check for protocol declaration.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002019 if (FormatTok->Tok.is(tok::semi)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00002020 nextToken();
2021 return addUnwrappedLine();
2022 }
2023
2024 addUnwrappedLine();
2025 parseObjCUntilAtEnd();
Nico Weber7eecf4b2013-01-09 20:25:35 +00002026}
2027
Daniel Jasperfca735c2015-02-19 16:14:18 +00002028void UnwrappedLineParser::parseJavaScriptEs6ImportExport() {
Martin Probst053f1aa2016-04-19 14:55:37 +00002029 bool IsImport = FormatTok->is(Keywords.kw_import);
2030 assert(IsImport || FormatTok->is(tok::kw_export));
Daniel Jasper354aa512015-02-19 16:07:32 +00002031 nextToken();
Daniel Jasperfca735c2015-02-19 16:14:18 +00002032
Daniel Jasperec05fc72015-05-11 09:14:50 +00002033 // Consume the "default" in "export default class/function".
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002034 if (FormatTok->is(tok::kw_default))
2035 nextToken();
Daniel Jasperec05fc72015-05-11 09:14:50 +00002036
Martin Probst5f8445b2016-04-24 22:05:09 +00002037 // Consume "async function", "function" and "default function", so that these
2038 // get parsed as free-standing JS functions, i.e. do not require a trailing
2039 // semicolon.
2040 if (FormatTok->is(Keywords.kw_async))
2041 nextToken();
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002042 if (FormatTok->is(Keywords.kw_function)) {
2043 nextToken();
2044 return;
2045 }
2046
Martin Probst053f1aa2016-04-19 14:55:37 +00002047 // For imports, `export *`, `export {...}`, consume the rest of the line up
2048 // to the terminating `;`. For everything else, just return and continue
2049 // parsing the structural element, i.e. the declaration or expression for
2050 // `export default`.
2051 if (!IsImport && !FormatTok->isOneOf(tok::l_brace, tok::star) &&
2052 !FormatTok->isStringLiteral())
2053 return;
Daniel Jasperfca735c2015-02-19 16:14:18 +00002054
Martin Probstd40bca42017-01-09 08:56:36 +00002055 while (!eof()) {
2056 if (FormatTok->is(tok::semi))
2057 return;
2058 if (Line->Tokens.size() == 0) {
2059 // Common issue: Automatic Semicolon Insertion wrapped the line, so the
2060 // import statement should terminate.
2061 return;
2062 }
Daniel Jasperefc1a832016-01-07 08:53:35 +00002063 if (FormatTok->is(tok::l_brace)) {
2064 FormatTok->BlockKind = BK_Block;
2065 parseBracedList();
2066 } else {
2067 nextToken();
2068 }
Daniel Jasper354aa512015-02-19 16:07:32 +00002069 }
2070}
2071
Daniel Jasper3b203a62013-09-05 16:05:56 +00002072LLVM_ATTRIBUTE_UNUSED static void printDebugInfo(const UnwrappedLine &Line,
2073 StringRef Prefix = "") {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002074 llvm::dbgs() << Prefix << "Line(" << Line.Level << ")"
2075 << (Line.InPPDirective ? " MACRO" : "") << ": ";
2076 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2077 E = Line.Tokens.end();
2078 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002079 llvm::dbgs() << I->Tok->Tok.getName() << "["
2080 << "T=" << I->Tok->Type
2081 << ", OC=" << I->Tok->OriginalColumn << "] ";
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002082 }
2083 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2084 E = Line.Tokens.end();
2085 I != E; ++I) {
2086 const UnwrappedLineNode &Node = *I;
2087 for (SmallVectorImpl<UnwrappedLine>::const_iterator
2088 I = Node.Children.begin(),
2089 E = Node.Children.end();
2090 I != E; ++I) {
2091 printDebugInfo(*I, "\nChild: ");
2092 }
2093 }
2094 llvm::dbgs() << "\n";
2095}
2096
Daniel Jasperf7935112012-12-03 18:12:45 +00002097void UnwrappedLineParser::addUnwrappedLine() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002098 if (Line->Tokens.empty())
Daniel Jasper7c85fde2013-01-08 14:56:18 +00002099 return;
Manuel Klimekab3dc002013-01-16 12:31:12 +00002100 DEBUG({
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002101 if (CurrentLines == &Lines)
2102 printDebugInfo(*Line);
Manuel Klimekab3dc002013-01-16 12:31:12 +00002103 });
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002104 CurrentLines->push_back(std::move(*Line));
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002105 Line->Tokens.clear();
Krasimir Georgiev85c37042017-03-01 16:38:08 +00002106 Line->MatchingOpeningBlockLineIndex = UnwrappedLine::kInvalidIndex;
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002107 if (CurrentLines == &Lines && !PreprocessorDirectives.empty()) {
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002108 CurrentLines->append(
2109 std::make_move_iterator(PreprocessorDirectives.begin()),
2110 std::make_move_iterator(PreprocessorDirectives.end()));
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002111 PreprocessorDirectives.clear();
2112 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002113}
2114
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002115bool UnwrappedLineParser::eof() const { return FormatTok->Tok.is(tok::eof); }
Daniel Jasperf7935112012-12-03 18:12:45 +00002116
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002117bool UnwrappedLineParser::isOnNewLine(const FormatToken &FormatTok) {
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002118 return (Line->InPPDirective || FormatTok.HasUnescapedNewline) &&
2119 FormatTok.NewlinesBefore > 0;
2120}
2121
Krasimir Georgiev91834222017-01-25 13:58:58 +00002122// Checks if \p FormatTok is a line comment that continues the line comment
2123// section on \p Line.
Krasimir Georgievea222a72017-05-22 10:07:56 +00002124static bool continuesLineCommentSection(const FormatToken &FormatTok,
2125 const UnwrappedLine &Line,
2126 llvm::Regex &CommentPragmasRegex) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002127 if (Line.Tokens.empty())
2128 return false;
Krasimir Georgiev84321612017-01-30 19:18:55 +00002129
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002130 StringRef IndentContent = FormatTok.TokenText;
2131 if (FormatTok.TokenText.startswith("//") ||
2132 FormatTok.TokenText.startswith("/*"))
2133 IndentContent = FormatTok.TokenText.substr(2);
2134 if (CommentPragmasRegex.match(IndentContent))
2135 return false;
2136
Krasimir Georgiev91834222017-01-25 13:58:58 +00002137 // If Line starts with a line comment, then FormatTok continues the comment
Krasimir Georgiev84321612017-01-30 19:18:55 +00002138 // section if its original column is greater or equal to the original start
Krasimir Georgiev91834222017-01-25 13:58:58 +00002139 // column of the line.
2140 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002141 // Define the min column token of a line as follows: if a line ends in '{' or
2142 // contains a '{' followed by a line comment, then the min column token is
2143 // that '{'. Otherwise, the min column token of the line is the first token of
2144 // the line.
2145 //
2146 // If Line starts with a token other than a line comment, then FormatTok
2147 // continues the comment section if its original column is greater than the
2148 // original start column of the min column token of the line.
Krasimir Georgiev91834222017-01-25 13:58:58 +00002149 //
2150 // For example, the second line comment continues the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002151 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002152 // // first line
2153 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002154 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002155 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002156 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002157 // // first line
2158 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002159 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002160 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002161 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002162 // int i; // first line
2163 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002164 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002165 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002166 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002167 // do { // first line
2168 // // second line
2169 // int i;
2170 // } while (true);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002171 //
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002172 // and:
2173 //
2174 // enum {
2175 // a, // first line
2176 // // second line
2177 // b
2178 // };
2179 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002180 // The second line comment doesn't continue the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002181 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002182 // // first line
2183 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002184 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002185 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002186 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002187 // int i; // first line
2188 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002189 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002190 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002191 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002192 // do { // first line
2193 // // second line
2194 // int i;
2195 // } while (true);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002196 //
2197 // and:
2198 //
2199 // enum {
2200 // a, // first line
2201 // // second line
2202 // };
Krasimir Georgiev84321612017-01-30 19:18:55 +00002203 const FormatToken *MinColumnToken = Line.Tokens.front().Tok;
2204
2205 // Scan for '{//'. If found, use the column of '{' as a min column for line
2206 // comment section continuation.
2207 const FormatToken *PreviousToken = nullptr;
Krasimir Georgievd86c25d2017-03-10 13:09:29 +00002208 for (const UnwrappedLineNode &Node : Line.Tokens) {
Krasimir Georgiev84321612017-01-30 19:18:55 +00002209 if (PreviousToken && PreviousToken->is(tok::l_brace) &&
2210 isLineComment(*Node.Tok)) {
2211 MinColumnToken = PreviousToken;
2212 break;
2213 }
2214 PreviousToken = Node.Tok;
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002215
2216 // Grab the last newline preceding a token in this unwrapped line.
2217 if (Node.Tok->NewlinesBefore > 0) {
2218 MinColumnToken = Node.Tok;
2219 }
Krasimir Georgiev84321612017-01-30 19:18:55 +00002220 }
2221 if (PreviousToken && PreviousToken->is(tok::l_brace)) {
2222 MinColumnToken = PreviousToken;
2223 }
2224
Krasimir Georgievea222a72017-05-22 10:07:56 +00002225 return continuesLineComment(FormatTok, /*Previous=*/Line.Tokens.back().Tok,
2226 MinColumnToken);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002227}
2228
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002229void UnwrappedLineParser::flushComments(bool NewlineBeforeNext) {
2230 bool JustComments = Line->Tokens.empty();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002231 for (SmallVectorImpl<FormatToken *>::const_iterator
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002232 I = CommentsBeforeNextToken.begin(),
2233 E = CommentsBeforeNextToken.end();
2234 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002235 // Line comments that belong to the same line comment section are put on the
2236 // same line since later we might want to reflow content between them.
Krasimir Georgiev753625b2017-01-31 13:32:38 +00002237 // Additional fine-grained breaking of line comment sections is controlled
2238 // by the class BreakableLineCommentSection in case it is desirable to keep
2239 // several line comment sections in the same unwrapped line.
2240 //
2241 // FIXME: Consider putting separate line comment sections as children to the
2242 // unwrapped line instead.
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002243 (*I)->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002244 continuesLineCommentSection(**I, *Line, CommentPragmasRegex);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002245 if (isOnNewLine(**I) && JustComments && !(*I)->ContinuesLineCommentSection)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002246 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002247 pushToken(*I);
2248 }
Daniel Jaspere60cba12015-05-13 11:35:53 +00002249 if (NewlineBeforeNext && JustComments)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002250 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002251 CommentsBeforeNextToken.clear();
2252}
2253
Daniel Jasperf7935112012-12-03 18:12:45 +00002254void UnwrappedLineParser::nextToken() {
2255 if (eof())
2256 return;
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002257 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002258 pushToken(FormatTok);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00002259 if (Style.Language != FormatStyle::LK_JavaScript)
2260 readToken();
2261 else
2262 readTokenWithJavaScriptASI();
Manuel Klimek1abf7892013-01-04 23:34:14 +00002263}
2264
Daniel Jasperb9a49902016-01-09 15:56:28 +00002265const FormatToken *UnwrappedLineParser::getPreviousToken() {
2266 // FIXME: This is a dirty way to access the previous token. Find a better
2267 // solution.
2268 if (!Line || Line->Tokens.empty())
2269 return nullptr;
2270 return Line->Tokens.back().Tok;
2271}
2272
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002273void UnwrappedLineParser::distributeComments(
2274 const SmallVectorImpl<FormatToken *> &Comments,
2275 const FormatToken *NextTok) {
2276 // Whether or not a line comment token continues a line is controlled by
Krasimir Georgievea222a72017-05-22 10:07:56 +00002277 // the method continuesLineCommentSection, with the following caveat:
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002278 //
2279 // Define a trail of Comments to be a nonempty proper postfix of Comments such
2280 // that each comment line from the trail is aligned with the next token, if
2281 // the next token exists. If a trail exists, the beginning of the maximal
2282 // trail is marked as a start of a new comment section.
2283 //
2284 // For example in this code:
2285 //
2286 // int a; // line about a
2287 // // line 1 about b
2288 // // line 2 about b
2289 // int b;
2290 //
2291 // the two lines about b form a maximal trail, so there are two sections, the
2292 // first one consisting of the single comment "// line about a" and the
2293 // second one consisting of the next two comments.
2294 if (Comments.empty())
2295 return;
2296 bool ShouldPushCommentsInCurrentLine = true;
2297 bool HasTrailAlignedWithNextToken = false;
2298 unsigned StartOfTrailAlignedWithNextToken = 0;
2299 if (NextTok) {
2300 // We are skipping the first element intentionally.
2301 for (unsigned i = Comments.size() - 1; i > 0; --i) {
2302 if (Comments[i]->OriginalColumn == NextTok->OriginalColumn) {
2303 HasTrailAlignedWithNextToken = true;
2304 StartOfTrailAlignedWithNextToken = i;
2305 }
2306 }
2307 }
2308 for (unsigned i = 0, e = Comments.size(); i < e; ++i) {
2309 FormatToken *FormatTok = Comments[i];
2310 if (HasTrailAlignedWithNextToken &&
2311 i == StartOfTrailAlignedWithNextToken) {
2312 FormatTok->ContinuesLineCommentSection = false;
2313 } else {
2314 FormatTok->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002315 continuesLineCommentSection(*FormatTok, *Line, CommentPragmasRegex);
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002316 }
2317 if (!FormatTok->ContinuesLineCommentSection &&
2318 (isOnNewLine(*FormatTok) || FormatTok->IsFirst)) {
2319 ShouldPushCommentsInCurrentLine = false;
2320 }
2321 if (ShouldPushCommentsInCurrentLine) {
2322 pushToken(FormatTok);
2323 } else {
2324 CommentsBeforeNextToken.push_back(FormatTok);
2325 }
2326 }
2327}
2328
Manuel Klimek1abf7892013-01-04 23:34:14 +00002329void UnwrappedLineParser::readToken() {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002330 SmallVector<FormatToken *, 1> Comments;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002331 do {
2332 FormatTok = Tokens->getNextToken();
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00002333 assert(FormatTok);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002334 while (!Line->InPPDirective && FormatTok->Tok.is(tok::hash) &&
2335 (FormatTok->HasUnescapedNewline || FormatTok->IsFirst)) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002336 distributeComments(Comments, FormatTok);
2337 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002338 // If there is an unfinished unwrapped line, we flush the preprocessor
2339 // directives only after that unwrapped line was finished later.
Daniel Jasper29d39d52015-02-08 09:34:49 +00002340 bool SwitchToPreprocessorLines = !Line->Tokens.empty();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002341 ScopedLineState BlockState(*this, SwitchToPreprocessorLines);
Alexander Kornienkob1be9d62013-04-03 12:38:53 +00002342 // Comments stored before the preprocessor directive need to be output
2343 // before the preprocessor directive, at the same level as the
2344 // preprocessor directive, as we consider them to apply to the directive.
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002345 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002346 parsePPDirective();
2347 }
Manuel Klimek68b03042014-04-14 09:14:11 +00002348 while (FormatTok->Type == TT_ConflictStart ||
2349 FormatTok->Type == TT_ConflictEnd ||
2350 FormatTok->Type == TT_ConflictAlternative) {
2351 if (FormatTok->Type == TT_ConflictStart) {
2352 conditionalCompilationStart(/*Unreachable=*/false);
2353 } else if (FormatTok->Type == TT_ConflictAlternative) {
2354 conditionalCompilationAlternative();
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002355 } else if (FormatTok->Type == TT_ConflictEnd) {
Manuel Klimek68b03042014-04-14 09:14:11 +00002356 conditionalCompilationEnd();
2357 }
2358 FormatTok = Tokens->getNextToken();
2359 FormatTok->MustBreakBefore = true;
2360 }
Alexander Kornienkof2e02122013-05-24 18:24:24 +00002361
2362 if (!PPStack.empty() && (PPStack.back() == PP_Unreachable) &&
2363 !Line->InPPDirective) {
2364 continue;
2365 }
2366
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002367 if (!FormatTok->Tok.is(tok::comment)) {
2368 distributeComments(Comments, FormatTok);
2369 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002370 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002371 }
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002372
2373 Comments.push_back(FormatTok);
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002374 } while (!eof());
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002375
2376 distributeComments(Comments, nullptr);
2377 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002378}
2379
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002380void UnwrappedLineParser::pushToken(FormatToken *Tok) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002381 Line->Tokens.push_back(UnwrappedLineNode(Tok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002382 if (MustBreakBeforeNextToken) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002383 Line->Tokens.back().Tok->MustBreakBefore = true;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002384 MustBreakBeforeNextToken = false;
Manuel Klimek1abf7892013-01-04 23:34:14 +00002385 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002386}
2387
Daniel Jasper8d1832e2013-01-07 13:26:07 +00002388} // end namespace format
2389} // end namespace clang