blob: b15e52aeb2cd3845dfe76dfed04f2352b91151b1 [file] [log] [blame]
//===--- UnwrappedLineParser.cpp - Format C++ code ------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief This file contains the implementation of the UnwrappedLineParser,
/// which turns a stream of tokens into UnwrappedLines.
///
//===----------------------------------------------------------------------===//
15
Chandler Carruth4b417452013-01-19 08:09:44 +000016#include "UnwrappedLineParser.h"
Benjamin Kramer33335df2015-03-01 21:36:40 +000017#include "llvm/ADT/STLExtras.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000018#include "llvm/Support/Debug.h"
Benjamin Kramer53f5e892015-03-23 18:05:43 +000019#include "llvm/Support/raw_ostream.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000020
Chandler Carruth10346662014-04-22 03:17:02 +000021#define DEBUG_TYPE "format-parser"
22
Daniel Jasperf7935112012-12-03 18:12:45 +000023namespace clang {
24namespace format {
25
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000026class FormatTokenSource {
27public:
Angel Garcia Gomez637d1e62015-10-20 13:23:58 +000028 virtual ~FormatTokenSource() {}
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000029 virtual FormatToken *getNextToken() = 0;
30
31 virtual unsigned getPosition() = 0;
32 virtual FormatToken *setPosition(unsigned Position) = 0;
33};
34
Craig Topper69665e12013-07-01 04:21:54 +000035namespace {
36
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000037class ScopedDeclarationState {
38public:
39 ScopedDeclarationState(UnwrappedLine &Line, std::vector<bool> &Stack,
40 bool MustBeDeclaration)
41 : Line(Line), Stack(Stack) {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000042 Line.MustBeDeclaration = MustBeDeclaration;
Manuel Klimek39080572013-01-23 11:03:04 +000043 Stack.push_back(MustBeDeclaration);
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000044 }
45 ~ScopedDeclarationState() {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000046 Stack.pop_back();
Manuel Klimekc1237a82013-01-23 14:08:21 +000047 if (!Stack.empty())
48 Line.MustBeDeclaration = Stack.back();
49 else
50 Line.MustBeDeclaration = true;
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000051 }
Daniel Jasper393564f2013-05-31 14:56:29 +000052
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000053private:
54 UnwrappedLine &Line;
55 std::vector<bool> &Stack;
56};
57
Krasimir Georgieva1c30932017-05-19 10:34:57 +000058static bool isLineComment(const FormatToken &FormatTok) {
59 return FormatTok.is(tok::comment) &&
60 FormatTok.TokenText.startswith("//");
61}
62
Krasimir Georgievea222a72017-05-22 10:07:56 +000063// Checks if \p FormatTok is a line comment that continues the line comment
64// \p Previous. The original column of \p MinColumnToken is used to determine
65// whether \p FormatTok is indented enough to the right to continue \p Previous.
66static bool continuesLineComment(const FormatToken &FormatTok,
67 const FormatToken *Previous,
68 const FormatToken *MinColumnToken) {
69 if (!Previous || !MinColumnToken)
70 return false;
71 unsigned MinContinueColumn =
72 MinColumnToken->OriginalColumn + (isLineComment(*MinColumnToken) ? 0 : 1);
73 return isLineComment(FormatTok) && FormatTok.NewlinesBefore == 1 &&
74 isLineComment(*Previous) &&
75 FormatTok.OriginalColumn >= MinContinueColumn;
76}
77
Manuel Klimek1abf7892013-01-04 23:34:14 +000078class ScopedMacroState : public FormatTokenSource {
79public:
80 ScopedMacroState(UnwrappedLine &Line, FormatTokenSource *&TokenSource,
Manuel Klimek20e0af62015-05-06 11:56:29 +000081 FormatToken *&ResetToken)
Manuel Klimek1abf7892013-01-04 23:34:14 +000082 : Line(Line), TokenSource(TokenSource), ResetToken(ResetToken),
Manuel Klimek1a18c402013-04-12 14:13:36 +000083 PreviousLineLevel(Line.Level), PreviousTokenSource(TokenSource),
Krasimir Georgieva1c30932017-05-19 10:34:57 +000084 Token(nullptr), PreviousToken(nullptr) {
Manuel Klimek1abf7892013-01-04 23:34:14 +000085 TokenSource = this;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000086 Line.Level = 0;
Manuel Klimek1abf7892013-01-04 23:34:14 +000087 Line.InPPDirective = true;
88 }
89
Alexander Kornienko34eb2072015-04-11 02:00:23 +000090 ~ScopedMacroState() override {
Manuel Klimek1abf7892013-01-04 23:34:14 +000091 TokenSource = PreviousTokenSource;
92 ResetToken = Token;
93 Line.InPPDirective = false;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000094 Line.Level = PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +000095 }
96
Craig Topperfb6b25b2014-03-15 04:29:04 +000097 FormatToken *getNextToken() override {
Manuel Klimek78725712013-01-07 10:03:37 +000098 // The \c UnwrappedLineParser guards against this by never calling
99 // \c getNextToken() after it has encountered the first eof token.
100 assert(!eof());
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000101 PreviousToken = Token;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000102 Token = PreviousTokenSource->getNextToken();
103 if (eof())
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000104 return getFakeEOF();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000105 return Token;
106 }
107
Craig Topperfb6b25b2014-03-15 04:29:04 +0000108 unsigned getPosition() override { return PreviousTokenSource->getPosition(); }
Manuel Klimekab419912013-05-23 09:41:43 +0000109
Craig Topperfb6b25b2014-03-15 04:29:04 +0000110 FormatToken *setPosition(unsigned Position) override {
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000111 PreviousToken = nullptr;
Manuel Klimekab419912013-05-23 09:41:43 +0000112 Token = PreviousTokenSource->setPosition(Position);
113 return Token;
114 }
115
Manuel Klimek1abf7892013-01-04 23:34:14 +0000116private:
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000117 bool eof() {
118 return Token && Token->HasUnescapedNewline &&
Krasimir Georgievea222a72017-05-22 10:07:56 +0000119 !continuesLineComment(*Token, PreviousToken,
120 /*MinColumnToken=*/PreviousToken);
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000121 }
Manuel Klimek1abf7892013-01-04 23:34:14 +0000122
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000123 FormatToken *getFakeEOF() {
124 static bool EOFInitialized = false;
125 static FormatToken FormatTok;
126 if (!EOFInitialized) {
127 FormatTok.Tok.startToken();
128 FormatTok.Tok.setKind(tok::eof);
129 EOFInitialized = true;
130 }
131 return &FormatTok;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000132 }
133
134 UnwrappedLine &Line;
135 FormatTokenSource *&TokenSource;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000136 FormatToken *&ResetToken;
Manuel Klimekef2cfb12013-01-05 22:14:16 +0000137 unsigned PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000138 FormatTokenSource *PreviousTokenSource;
139
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000140 FormatToken *Token;
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000141 FormatToken *PreviousToken;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000142};
143
Craig Topper69665e12013-07-01 04:21:54 +0000144} // end anonymous namespace
145
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000146class ScopedLineState {
147public:
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000148 ScopedLineState(UnwrappedLineParser &Parser,
149 bool SwitchToPreprocessorLines = false)
David Blaikieefb6eb22014-08-09 20:02:07 +0000150 : Parser(Parser), OriginalLines(Parser.CurrentLines) {
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000151 if (SwitchToPreprocessorLines)
152 Parser.CurrentLines = &Parser.PreprocessorDirectives;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000153 else if (!Parser.Line->Tokens.empty())
154 Parser.CurrentLines = &Parser.Line->Tokens.back().Children;
David Blaikieefb6eb22014-08-09 20:02:07 +0000155 PreBlockLine = std::move(Parser.Line);
156 Parser.Line = llvm::make_unique<UnwrappedLine>();
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000157 Parser.Line->Level = PreBlockLine->Level;
158 Parser.Line->InPPDirective = PreBlockLine->InPPDirective;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000159 }
160
161 ~ScopedLineState() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000162 if (!Parser.Line->Tokens.empty()) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000163 Parser.addUnwrappedLine();
164 }
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000165 assert(Parser.Line->Tokens.empty());
David Blaikieefb6eb22014-08-09 20:02:07 +0000166 Parser.Line = std::move(PreBlockLine);
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000167 if (Parser.CurrentLines == &Parser.PreprocessorDirectives)
168 Parser.MustBreakBeforeNextToken = true;
169 Parser.CurrentLines = OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000170 }
171
172private:
173 UnwrappedLineParser &Parser;
174
David Blaikieefb6eb22014-08-09 20:02:07 +0000175 std::unique_ptr<UnwrappedLine> PreBlockLine;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000176 SmallVectorImpl<UnwrappedLine> *OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000177};
178
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000179class CompoundStatementIndenter {
180public:
181 CompoundStatementIndenter(UnwrappedLineParser *Parser,
182 const FormatStyle &Style, unsigned &LineLevel)
183 : LineLevel(LineLevel), OldLineLevel(LineLevel) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000184 if (Style.BraceWrapping.AfterControlStatement)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000185 Parser->addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000186 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000187 ++LineLevel;
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000188 }
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000189 ~CompoundStatementIndenter() { LineLevel = OldLineLevel; }
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000190
191private:
192 unsigned &LineLevel;
193 unsigned OldLineLevel;
194};
195
Craig Topper69665e12013-07-01 04:21:54 +0000196namespace {
197
Manuel Klimekab419912013-05-23 09:41:43 +0000198class IndexedTokenSource : public FormatTokenSource {
199public:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000200 IndexedTokenSource(ArrayRef<FormatToken *> Tokens)
Manuel Klimekab419912013-05-23 09:41:43 +0000201 : Tokens(Tokens), Position(-1) {}
202
Craig Topperfb6b25b2014-03-15 04:29:04 +0000203 FormatToken *getNextToken() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000204 ++Position;
205 return Tokens[Position];
206 }
207
Craig Topperfb6b25b2014-03-15 04:29:04 +0000208 unsigned getPosition() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000209 assert(Position >= 0);
210 return Position;
211 }
212
Craig Topperfb6b25b2014-03-15 04:29:04 +0000213 FormatToken *setPosition(unsigned P) override {
Manuel Klimekab419912013-05-23 09:41:43 +0000214 Position = P;
215 return Tokens[Position];
216 }
217
Manuel Klimek71814b42013-10-11 21:25:45 +0000218 void reset() { Position = -1; }
219
Manuel Klimekab419912013-05-23 09:41:43 +0000220private:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000221 ArrayRef<FormatToken *> Tokens;
Manuel Klimekab419912013-05-23 09:41:43 +0000222 int Position;
223};
224
Craig Topper69665e12013-07-01 04:21:54 +0000225} // end anonymous namespace
226
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000227UnwrappedLineParser::UnwrappedLineParser(const FormatStyle &Style,
Daniel Jasperd0ec0d62014-11-04 12:41:02 +0000228 const AdditionalKeywords &Keywords,
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000229 ArrayRef<FormatToken *> Tokens,
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000230 UnwrappedLineConsumer &Callback)
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000231 : Line(new UnwrappedLine), MustBreakBeforeNextToken(false),
Krasimir Georgiev00c5c722017-02-02 15:32:19 +0000232 CurrentLines(&Lines), Style(Style), Keywords(Keywords),
233 CommentPragmasRegex(Style.CommentPragmas), Tokens(nullptr),
Krasimir Georgievad47c902017-08-30 14:34:57 +0000234 Callback(Callback), AllTokens(Tokens), PPBranchLevel(-1),
235 IfNdefCondition(nullptr), FoundIncludeGuardStart(false),
236 IncludeGuardRejected(false) {}
Manuel Klimek71814b42013-10-11 21:25:45 +0000237
238void UnwrappedLineParser::reset() {
239 PPBranchLevel = -1;
Krasimir Georgievad47c902017-08-30 14:34:57 +0000240 IfNdefCondition = nullptr;
241 FoundIncludeGuardStart = false;
242 IncludeGuardRejected = false;
Manuel Klimek71814b42013-10-11 21:25:45 +0000243 Line.reset(new UnwrappedLine);
244 CommentsBeforeNextToken.clear();
Craig Topper2145bc02014-05-09 08:15:10 +0000245 FormatTok = nullptr;
Manuel Klimek71814b42013-10-11 21:25:45 +0000246 MustBreakBeforeNextToken = false;
247 PreprocessorDirectives.clear();
248 CurrentLines = &Lines;
249 DeclarationScopeStack.clear();
Manuel Klimek71814b42013-10-11 21:25:45 +0000250 PPStack.clear();
251}
Daniel Jasperf7935112012-12-03 18:12:45 +0000252
Manuel Klimek20e0af62015-05-06 11:56:29 +0000253void UnwrappedLineParser::parse() {
Manuel Klimekab419912013-05-23 09:41:43 +0000254 IndexedTokenSource TokenSource(AllTokens);
Manuel Klimek71814b42013-10-11 21:25:45 +0000255 do {
256 DEBUG(llvm::dbgs() << "----\n");
257 reset();
258 Tokens = &TokenSource;
259 TokenSource.reset();
Daniel Jaspera79064a2013-03-01 18:11:39 +0000260
Manuel Klimek71814b42013-10-11 21:25:45 +0000261 readToken();
262 parseFile();
263 // Create line with eof token.
264 pushToken(FormatTok);
265 addUnwrappedLine();
266
267 for (SmallVectorImpl<UnwrappedLine>::iterator I = Lines.begin(),
268 E = Lines.end();
269 I != E; ++I) {
270 Callback.consumeUnwrappedLine(*I);
271 }
272 Callback.finishRun();
273 Lines.clear();
274 while (!PPLevelBranchIndex.empty() &&
Daniel Jasper53bd1672013-10-12 13:32:56 +0000275 PPLevelBranchIndex.back() + 1 >= PPLevelBranchCount.back()) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000276 PPLevelBranchIndex.resize(PPLevelBranchIndex.size() - 1);
277 PPLevelBranchCount.resize(PPLevelBranchCount.size() - 1);
278 }
279 if (!PPLevelBranchIndex.empty()) {
280 ++PPLevelBranchIndex.back();
281 assert(PPLevelBranchIndex.size() == PPLevelBranchCount.size());
282 assert(PPLevelBranchIndex.back() <= PPLevelBranchCount.back());
283 }
284 } while (!PPLevelBranchIndex.empty());
Manuel Klimek1abf7892013-01-04 23:34:14 +0000285}
286
Manuel Klimek1a18c402013-04-12 14:13:36 +0000287void UnwrappedLineParser::parseFile() {
Daniel Jasper9326f912015-05-05 08:40:32 +0000288 // The top-level context in a file always has declarations, except for pre-
289 // processor directives and JavaScript files.
290 bool MustBeDeclaration =
291 !Line->InPPDirective && Style.Language != FormatStyle::LK_JavaScript;
292 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
293 MustBeDeclaration);
Krasimir Georgiev26b144c2017-07-03 15:05:14 +0000294 if (Style.Language == FormatStyle::LK_TextProto)
295 parseBracedList();
296 else
297 parseLevel(/*HasOpeningBrace=*/false);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000298 // Make sure to format the remaining tokens.
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000299 flushComments(true);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000300 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000301}
302
Manuel Klimek1a18c402013-04-12 14:13:36 +0000303void UnwrappedLineParser::parseLevel(bool HasOpeningBrace) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000304 bool SwitchLabelEncountered = false;
Daniel Jasperf7935112012-12-03 18:12:45 +0000305 do {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000306 tok::TokenKind kind = FormatTok->Tok.getKind();
307 if (FormatTok->Type == TT_MacroBlockBegin) {
308 kind = tok::l_brace;
309 } else if (FormatTok->Type == TT_MacroBlockEnd) {
310 kind = tok::r_brace;
311 }
312
313 switch (kind) {
Daniel Jasperf7935112012-12-03 18:12:45 +0000314 case tok::comment:
Daniel Jaspere25509f2012-12-17 11:29:41 +0000315 nextToken();
316 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000317 break;
318 case tok::l_brace:
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000319 // FIXME: Add parameter whether this can happen - if this happens, we must
320 // be in a non-declaration context.
Daniel Jasperb86e2722015-08-24 13:23:37 +0000321 if (!FormatTok->is(TT_MacroBlockBegin) && tryToParseBracedList())
322 continue;
Nico Weber9096fc02013-06-26 00:30:14 +0000323 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +0000324 addUnwrappedLine();
325 break;
326 case tok::r_brace:
Manuel Klimek1a18c402013-04-12 14:13:36 +0000327 if (HasOpeningBrace)
328 return;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000329 nextToken();
330 addUnwrappedLine();
Manuel Klimek1058d982013-01-06 20:07:31 +0000331 break;
Daniel Jasper516d7972013-07-25 11:31:57 +0000332 case tok::kw_default:
333 case tok::kw_case:
Martin Probstf785fd92017-08-04 17:07:15 +0000334 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration) {
335 // A 'case: string' style field declaration.
336 parseStructuralElement();
337 break;
338 }
Daniel Jasper72407622013-09-02 08:26:29 +0000339 if (!SwitchLabelEncountered &&
340 (Style.IndentCaseLabels || (Line->InPPDirective && Line->Level == 1)))
341 ++Line->Level;
Daniel Jasper516d7972013-07-25 11:31:57 +0000342 SwitchLabelEncountered = true;
343 parseStructuralElement();
344 break;
Daniel Jasperf7935112012-12-03 18:12:45 +0000345 default:
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000346 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +0000347 break;
348 }
349 } while (!eof());
350}
351
Daniel Jasperadba2aa2015-05-18 12:52:00 +0000352void UnwrappedLineParser::calculateBraceTypes(bool ExpectClassBody) {
Manuel Klimekab419912013-05-23 09:41:43 +0000353 // We'll parse forward through the tokens until we hit
354 // a closing brace or eof - note that getNextToken() will
355 // parse macros, so this will magically work inside macro
356 // definitions, too.
357 unsigned StoredPosition = Tokens->getPosition();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000358 FormatToken *Tok = FormatTok;
Daniel Jasperb9a49902016-01-09 15:56:28 +0000359 const FormatToken *PrevTok = getPreviousToken();
Manuel Klimekab419912013-05-23 09:41:43 +0000360 // Keep a stack of positions of lbrace tokens. We will
361 // update information about whether an lbrace starts a
362 // braced init list or a different block during the loop.
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000363 SmallVector<FormatToken *, 8> LBraceStack;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000364 assert(Tok->Tok.is(tok::l_brace));
Manuel Klimekab419912013-05-23 09:41:43 +0000365 do {
Daniel Jaspereb65e912015-12-21 18:31:15 +0000366 // Get next non-comment token.
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000367 FormatToken *NextTok;
Daniel Jasperca7bd722013-07-01 16:43:38 +0000368 unsigned ReadTokens = 0;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000369 do {
370 NextTok = Tokens->getNextToken();
Daniel Jasperca7bd722013-07-01 16:43:38 +0000371 ++ReadTokens;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000372 } while (NextTok->is(tok::comment));
373
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000374 switch (Tok->Tok.getKind()) {
Manuel Klimekab419912013-05-23 09:41:43 +0000375 case tok::l_brace:
Martin Probst95ed8e72017-05-31 09:29:40 +0000376 if (Style.Language == FormatStyle::LK_JavaScript && PrevTok) {
377 if (PrevTok->is(tok::colon))
378 // A colon indicates this code is in a type, or a braced list
379 // following a label in an object literal ({a: {b: 1}}). The code
380 // below could be confused by semicolons between the individual
381 // members in a type member list, which would normally trigger
382 // BK_Block. In both cases, this must be parsed as an inline braced
383 // init.
384 Tok->BlockKind = BK_BracedInit;
385 else if (PrevTok->is(tok::r_paren))
386 // `) { }` can only occur in function or method declarations in JS.
387 Tok->BlockKind = BK_Block;
388 } else {
Daniel Jasperb9a49902016-01-09 15:56:28 +0000389 Tok->BlockKind = BK_Unknown;
Martin Probst95ed8e72017-05-31 09:29:40 +0000390 }
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000391 LBraceStack.push_back(Tok);
Manuel Klimekab419912013-05-23 09:41:43 +0000392 break;
393 case tok::r_brace:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000394 if (LBraceStack.empty())
395 break;
396 if (LBraceStack.back()->BlockKind == BK_Unknown) {
397 bool ProbablyBracedList = false;
398 if (Style.Language == FormatStyle::LK_Proto) {
399 ProbablyBracedList = NextTok->isOneOf(tok::comma, tok::r_square);
400 } else {
401 // Using OriginalColumn to distinguish between ObjC methods and
402 // binary operators is a bit hacky.
403 bool NextIsObjCMethod = NextTok->isOneOf(tok::plus, tok::minus) &&
404 NextTok->OriginalColumn == 0;
Daniel Jasper91b032a2014-05-22 12:46:38 +0000405
Daniel Jasperb9a49902016-01-09 15:56:28 +0000406 // If there is a comma, semicolon or right paren after the closing
407 // brace, we assume this is a braced initializer list. Note that
408 // regardless how we mark inner braces here, we will overwrite the
409 // BlockKind later if we parse a braced list (where all blocks
410 // inside are by default braced lists), or when we explicitly detect
411 // blocks (for example while parsing lambdas).
Martin Probst95ed8e72017-05-31 09:29:40 +0000412 // FIXME: Some of these do not apply to JS, e.g. "} {" can never be a
413 // braced list in JS.
Daniel Jasperb9a49902016-01-09 15:56:28 +0000414 ProbablyBracedList =
Daniel Jasperacffeb82016-03-05 18:34:26 +0000415 (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probste1e12a72016-08-19 14:35:01 +0000416 NextTok->isOneOf(Keywords.kw_of, Keywords.kw_in,
417 Keywords.kw_as)) ||
Martin Probstb7fb2672017-05-10 13:53:29 +0000418 (Style.isCpp() && NextTok->is(tok::l_paren)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000419 NextTok->isOneOf(tok::comma, tok::period, tok::colon,
420 tok::r_paren, tok::r_square, tok::l_brace,
Martin Probstb7fb2672017-05-10 13:53:29 +0000421 tok::l_square, tok::ellipsis) ||
Daniel Jaspere4ada022016-12-13 10:05:03 +0000422 (NextTok->is(tok::identifier) &&
423 !PrevTok->isOneOf(tok::semi, tok::r_brace, tok::l_brace)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000424 (NextTok->is(tok::semi) &&
425 (!ExpectClassBody || LBraceStack.size() != 1)) ||
426 (NextTok->isBinaryOperator() && !NextIsObjCMethod);
Manuel Klimekab419912013-05-23 09:41:43 +0000427 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000428 if (ProbablyBracedList) {
429 Tok->BlockKind = BK_BracedInit;
430 LBraceStack.back()->BlockKind = BK_BracedInit;
431 } else {
432 Tok->BlockKind = BK_Block;
433 LBraceStack.back()->BlockKind = BK_Block;
434 }
Manuel Klimekab419912013-05-23 09:41:43 +0000435 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000436 LBraceStack.pop_back();
Manuel Klimekab419912013-05-23 09:41:43 +0000437 break;
Daniel Jasperac7e34e2014-03-13 10:11:17 +0000438 case tok::at:
Manuel Klimekab419912013-05-23 09:41:43 +0000439 case tok::semi:
440 case tok::kw_if:
441 case tok::kw_while:
442 case tok::kw_for:
443 case tok::kw_switch:
444 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +0000445 case tok::kw___try:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000446 if (!LBraceStack.empty() && LBraceStack.back()->BlockKind == BK_Unknown)
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000447 LBraceStack.back()->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000448 break;
449 default:
450 break;
451 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000452 PrevTok = Tok;
Manuel Klimekab419912013-05-23 09:41:43 +0000453 Tok = NextTok;
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000454 } while (Tok->Tok.isNot(tok::eof) && !LBraceStack.empty());
Daniel Jasperb9a49902016-01-09 15:56:28 +0000455
Manuel Klimekab419912013-05-23 09:41:43 +0000456 // Assume other blocks for all unclosed opening braces.
457 for (unsigned i = 0, e = LBraceStack.size(); i != e; ++i) {
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000458 if (LBraceStack[i]->BlockKind == BK_Unknown)
459 LBraceStack[i]->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000460 }
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000461
Manuel Klimekab419912013-05-23 09:41:43 +0000462 FormatTok = Tokens->setPosition(StoredPosition);
463}
464
/// Mixes the \c std::hash of \p v into the running hash value \p seed.
template <class T>
static inline void hash_combine(std::size_t &seed, const T &v) {
  const std::size_t ValueHash = std::hash<T>()(v);
  const std::size_t Mixed = ValueHash + 0x9e3779b9 + (seed << 6) + (seed >> 2);
  seed ^= Mixed;
}
470
471size_t UnwrappedLineParser::computePPHash() const {
472 size_t h = 0;
473 for (const auto &i : PPStack) {
474 hash_combine(h, size_t(i.Kind));
475 hash_combine(h, i.Line);
476 }
477 return h;
478}
479
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000480void UnwrappedLineParser::parseBlock(bool MustBeDeclaration, bool AddLevel,
481 bool MunchSemi) {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000482 assert(FormatTok->isOneOf(tok::l_brace, TT_MacroBlockBegin) &&
483 "'{' or macro block token expected");
484 const bool MacroBlock = FormatTok->is(TT_MacroBlockBegin);
Daniel Jaspereb65e912015-12-21 18:31:15 +0000485 FormatTok->BlockKind = BK_Block;
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000486
Francois Ferranda98a95c2017-07-28 07:56:14 +0000487 size_t PPStartHash = computePPHash();
488
Daniel Jasper516d7972013-07-25 11:31:57 +0000489 unsigned InitialLevel = Line->Level;
Krasimir Georgiev3e051052017-07-24 14:51:59 +0000490 nextToken(/*LevelDifference=*/AddLevel ? 1 : 0);
Daniel Jasperf7935112012-12-03 18:12:45 +0000491
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000492 if (MacroBlock && FormatTok->is(tok::l_paren))
493 parseParens();
494
Francois Ferranda98a95c2017-07-28 07:56:14 +0000495 size_t NbPreprocessorDirectives =
496 CurrentLines == &Lines ? PreprocessorDirectives.size() : 0;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +0000497 addUnwrappedLine();
Francois Ferranda98a95c2017-07-28 07:56:14 +0000498 size_t OpeningLineIndex =
499 CurrentLines->empty()
500 ? (UnwrappedLine::kInvalidIndex)
501 : (CurrentLines->size() - 1 - NbPreprocessorDirectives);
Daniel Jasperf7935112012-12-03 18:12:45 +0000502
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000503 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
504 MustBeDeclaration);
Daniel Jasper65ee3472013-07-31 23:16:02 +0000505 if (AddLevel)
506 ++Line->Level;
Nico Weber9096fc02013-06-26 00:30:14 +0000507 parseLevel(/*HasOpeningBrace=*/true);
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000508
Marianne Mailhot-Sarrasin03137c62016-04-14 14:56:49 +0000509 if (eof())
510 return;
511
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000512 if (MacroBlock ? !FormatTok->is(TT_MacroBlockEnd)
513 : !FormatTok->is(tok::r_brace)) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000514 Line->Level = InitialLevel;
Daniel Jaspereb65e912015-12-21 18:31:15 +0000515 FormatTok->BlockKind = BK_Block;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000516 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000517 }
Alexander Kornienko0ea8e102012-12-04 15:40:36 +0000518
Francois Ferranda98a95c2017-07-28 07:56:14 +0000519 size_t PPEndHash = computePPHash();
520
Krasimir Georgiev3e051052017-07-24 14:51:59 +0000521 // Munch the closing brace.
522 nextToken(/*LevelDifference=*/AddLevel ? -1 : 0);
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000523
524 if (MacroBlock && FormatTok->is(tok::l_paren))
525 parseParens();
526
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000527 if (MunchSemi && FormatTok->Tok.is(tok::semi))
528 nextToken();
Krasimir Georgiev3e051052017-07-24 14:51:59 +0000529 Line->Level = InitialLevel;
Francois Ferranda98a95c2017-07-28 07:56:14 +0000530
531 if (PPStartHash == PPEndHash) {
532 Line->MatchingOpeningBlockLineIndex = OpeningLineIndex;
533 if (OpeningLineIndex != UnwrappedLine::kInvalidIndex) {
534 // Update the opening line to add the forward reference as well
535 (*CurrentLines)[OpeningLineIndex].MatchingOpeningBlockLineIndex =
536 CurrentLines->size() - 1;
537 }
Francois Ferrande56a8292017-06-14 12:29:47 +0000538 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000539}
540
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000541static bool isGoogScope(const UnwrappedLine &Line) {
Daniel Jasper616de8642014-11-23 16:46:28 +0000542 // FIXME: Closure-library specific stuff should not be hard-coded but be
543 // configurable.
Daniel Jasper4a39c842014-05-06 13:54:10 +0000544 if (Line.Tokens.size() < 4)
545 return false;
546 auto I = Line.Tokens.begin();
547 if (I->Tok->TokenText != "goog")
548 return false;
549 ++I;
550 if (I->Tok->isNot(tok::period))
551 return false;
552 ++I;
553 if (I->Tok->TokenText != "scope")
554 return false;
555 ++I;
556 return I->Tok->is(tok::l_paren);
557}
558
Martin Probst101ec892017-05-09 20:04:09 +0000559static bool isIIFE(const UnwrappedLine &Line,
560 const AdditionalKeywords &Keywords) {
561 // Look for the start of an immediately invoked anonymous function.
562 // https://en.wikipedia.org/wiki/Immediately-invoked_function_expression
563 // This is commonly done in JavaScript to create a new, anonymous scope.
564 // Example: (function() { ... })()
565 if (Line.Tokens.size() < 3)
566 return false;
567 auto I = Line.Tokens.begin();
568 if (I->Tok->isNot(tok::l_paren))
569 return false;
570 ++I;
571 if (I->Tok->isNot(Keywords.kw_function))
572 return false;
573 ++I;
574 return I->Tok->is(tok::l_paren);
575}
576
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000577static bool ShouldBreakBeforeBrace(const FormatStyle &Style,
578 const FormatToken &InitialToken) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000579 if (InitialToken.is(tok::kw_namespace))
580 return Style.BraceWrapping.AfterNamespace;
581 if (InitialToken.is(tok::kw_class))
582 return Style.BraceWrapping.AfterClass;
583 if (InitialToken.is(tok::kw_union))
584 return Style.BraceWrapping.AfterUnion;
585 if (InitialToken.is(tok::kw_struct))
586 return Style.BraceWrapping.AfterStruct;
587 return false;
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000588}
589
Manuel Klimek516e0542013-09-04 13:25:30 +0000590void UnwrappedLineParser::parseChildBlock() {
591 FormatTok->BlockKind = BK_Block;
592 nextToken();
593 {
Martin Probst101ec892017-05-09 20:04:09 +0000594 bool SkipIndent =
595 (Style.Language == FormatStyle::LK_JavaScript &&
596 (isGoogScope(*Line) || isIIFE(*Line, Keywords)));
Manuel Klimek516e0542013-09-04 13:25:30 +0000597 ScopedLineState LineState(*this);
598 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
599 /*MustBeDeclaration=*/false);
Martin Probst101ec892017-05-09 20:04:09 +0000600 Line->Level += SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000601 parseLevel(/*HasOpeningBrace=*/true);
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000602 flushComments(isOnNewLine(*FormatTok));
Martin Probst101ec892017-05-09 20:04:09 +0000603 Line->Level -= SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000604 }
605 nextToken();
606}
607
Daniel Jasperf7935112012-12-03 18:12:45 +0000608void UnwrappedLineParser::parsePPDirective() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000609 assert(FormatTok->Tok.is(tok::hash) && "'#' expected");
Manuel Klimek20e0af62015-05-06 11:56:29 +0000610 ScopedMacroState MacroState(*Line, Tokens, FormatTok);
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000611 nextToken();
612
Craig Topper2145bc02014-05-09 08:15:10 +0000613 if (!FormatTok->Tok.getIdentifierInfo()) {
Manuel Klimek591b5802013-01-31 15:58:48 +0000614 parsePPUnknown();
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000615 return;
Daniel Jasperf7935112012-12-03 18:12:45 +0000616 }
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000617
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000618 switch (FormatTok->Tok.getIdentifierInfo()->getPPKeywordID()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000619 case tok::pp_define:
620 parsePPDefine();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000621 return;
622 case tok::pp_if:
Manuel Klimek71814b42013-10-11 21:25:45 +0000623 parsePPIf(/*IfDef=*/false);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000624 break;
625 case tok::pp_ifdef:
626 case tok::pp_ifndef:
Manuel Klimek71814b42013-10-11 21:25:45 +0000627 parsePPIf(/*IfDef=*/true);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000628 break;
629 case tok::pp_else:
630 parsePPElse();
631 break;
632 case tok::pp_elif:
633 parsePPElIf();
634 break;
635 case tok::pp_endif:
636 parsePPEndIf();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000637 break;
638 default:
639 parsePPUnknown();
640 break;
641 }
642}
643
Manuel Klimek68b03042014-04-14 09:14:11 +0000644void UnwrappedLineParser::conditionalCompilationCondition(bool Unreachable) {
Francois Ferranda98a95c2017-07-28 07:56:14 +0000645 size_t Line = CurrentLines->size();
646 if (CurrentLines == &PreprocessorDirectives)
647 Line += Lines.size();
648
649 if (Unreachable ||
650 (!PPStack.empty() && PPStack.back().Kind == PP_Unreachable))
651 PPStack.push_back({PP_Unreachable, Line});
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000652 else
Francois Ferranda98a95c2017-07-28 07:56:14 +0000653 PPStack.push_back({PP_Conditional, Line});
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000654}
655
Manuel Klimek68b03042014-04-14 09:14:11 +0000656void UnwrappedLineParser::conditionalCompilationStart(bool Unreachable) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000657 ++PPBranchLevel;
658 assert(PPBranchLevel >= 0 && PPBranchLevel <= (int)PPLevelBranchIndex.size());
659 if (PPBranchLevel == (int)PPLevelBranchIndex.size()) {
660 PPLevelBranchIndex.push_back(0);
661 PPLevelBranchCount.push_back(0);
662 }
663 PPChainBranchIndex.push(0);
Manuel Klimek68b03042014-04-14 09:14:11 +0000664 bool Skip = PPLevelBranchIndex[PPBranchLevel] > 0;
665 conditionalCompilationCondition(Unreachable || Skip);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000666}
667
Manuel Klimek68b03042014-04-14 09:14:11 +0000668void UnwrappedLineParser::conditionalCompilationAlternative() {
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000669 if (!PPStack.empty())
670 PPStack.pop_back();
Manuel Klimek71814b42013-10-11 21:25:45 +0000671 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
672 if (!PPChainBranchIndex.empty())
673 ++PPChainBranchIndex.top();
Manuel Klimek68b03042014-04-14 09:14:11 +0000674 conditionalCompilationCondition(
675 PPBranchLevel >= 0 && !PPChainBranchIndex.empty() &&
676 PPLevelBranchIndex[PPBranchLevel] != PPChainBranchIndex.top());
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000677}
678
Manuel Klimek68b03042014-04-14 09:14:11 +0000679void UnwrappedLineParser::conditionalCompilationEnd() {
Manuel Klimek71814b42013-10-11 21:25:45 +0000680 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
681 if (PPBranchLevel >= 0 && !PPChainBranchIndex.empty()) {
682 if (PPChainBranchIndex.top() + 1 > PPLevelBranchCount[PPBranchLevel]) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000683 PPLevelBranchCount[PPBranchLevel] = PPChainBranchIndex.top() + 1;
684 }
685 }
Manuel Klimek14bd9172014-01-29 08:49:02 +0000686 // Guard against #endif's without #if.
Krasimir Georgievad47c902017-08-30 14:34:57 +0000687 if (PPBranchLevel > -1)
Manuel Klimek14bd9172014-01-29 08:49:02 +0000688 --PPBranchLevel;
Manuel Klimek71814b42013-10-11 21:25:45 +0000689 if (!PPChainBranchIndex.empty())
690 PPChainBranchIndex.pop();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000691 if (!PPStack.empty())
692 PPStack.pop_back();
Manuel Klimek68b03042014-04-14 09:14:11 +0000693}
694
695void UnwrappedLineParser::parsePPIf(bool IfDef) {
Daniel Jasper62703eb2017-03-01 11:10:11 +0000696 bool IfNDef = FormatTok->is(tok::pp_ifndef);
Manuel Klimek68b03042014-04-14 09:14:11 +0000697 nextToken();
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000698 bool Unreachable = false;
699 if (!IfDef && (FormatTok->is(tok::kw_false) || FormatTok->TokenText == "0"))
700 Unreachable = true;
Daniel Jasper62703eb2017-03-01 11:10:11 +0000701 if (IfDef && !IfNDef && FormatTok->TokenText == "SWIG")
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000702 Unreachable = true;
703 conditionalCompilationStart(Unreachable);
Krasimir Georgievad47c902017-08-30 14:34:57 +0000704 FormatToken *IfCondition = FormatTok;
705 // If there's a #ifndef on the first line, and the only lines before it are
706 // comments, it could be an include guard.
707 bool MaybeIncludeGuard = IfNDef;
708 if (!IncludeGuardRejected && !FoundIncludeGuardStart && MaybeIncludeGuard) {
709 for (auto &Line : Lines) {
710 if (!Line.Tokens.front().Tok->is(tok::comment)) {
711 MaybeIncludeGuard = false;
712 IncludeGuardRejected = true;
713 break;
714 }
715 }
716 }
717 --PPBranchLevel;
Manuel Klimek68b03042014-04-14 09:14:11 +0000718 parsePPUnknown();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000719 ++PPBranchLevel;
720 if (!IncludeGuardRejected && !FoundIncludeGuardStart && MaybeIncludeGuard)
721 IfNdefCondition = IfCondition;
Manuel Klimek68b03042014-04-14 09:14:11 +0000722}
723
724void UnwrappedLineParser::parsePPElse() {
Krasimir Georgievad47c902017-08-30 14:34:57 +0000725 // If a potential include guard has an #else, it's not an include guard.
726 if (FoundIncludeGuardStart && PPBranchLevel == 0)
727 FoundIncludeGuardStart = false;
Manuel Klimek68b03042014-04-14 09:14:11 +0000728 conditionalCompilationAlternative();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000729 if (PPBranchLevel > -1)
730 --PPBranchLevel;
Manuel Klimek68b03042014-04-14 09:14:11 +0000731 parsePPUnknown();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000732 ++PPBranchLevel;
Manuel Klimek68b03042014-04-14 09:14:11 +0000733}
734
735void UnwrappedLineParser::parsePPElIf() { parsePPElse(); }
736
737void UnwrappedLineParser::parsePPEndIf() {
738 conditionalCompilationEnd();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000739 parsePPUnknown();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000740 // If the #endif of a potential include guard is the last thing in the file,
741 // then we count it as a real include guard and subtract one from every
742 // preprocessor indent.
743 unsigned TokenPosition = Tokens->getPosition();
744 FormatToken *PeekNext = AllTokens[TokenPosition];
Daniel Jasper4df130f2017-09-04 13:33:52 +0000745 if (FoundIncludeGuardStart && PPBranchLevel == -1 && PeekNext->is(tok::eof) &&
746 Style.IndentPPDirectives != FormatStyle::PPDIS_None)
747 for (auto &Line : Lines)
Krasimir Georgievad47c902017-08-30 14:34:57 +0000748 if (Line.InPPDirective && Line.Level > 0)
749 --Line.Level;
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000750}
751
Manuel Klimek1abf7892013-01-04 23:34:14 +0000752void UnwrappedLineParser::parsePPDefine() {
753 nextToken();
754
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000755 if (FormatTok->Tok.getKind() != tok::identifier) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000756 parsePPUnknown();
757 return;
758 }
Krasimir Georgievad47c902017-08-30 14:34:57 +0000759 if (IfNdefCondition && IfNdefCondition->TokenText == FormatTok->TokenText) {
760 FoundIncludeGuardStart = true;
761 for (auto &Line : Lines) {
762 if (!Line.Tokens.front().Tok->isOneOf(tok::comment, tok::hash)) {
763 FoundIncludeGuardStart = false;
764 break;
765 }
766 }
767 }
768 IfNdefCondition = nullptr;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000769 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000770 if (FormatTok->Tok.getKind() == tok::l_paren &&
771 FormatTok->WhitespaceRange.getBegin() ==
772 FormatTok->WhitespaceRange.getEnd()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000773 parseParens();
774 }
Krasimir Georgievad47c902017-08-30 14:34:57 +0000775 if (Style.IndentPPDirectives == FormatStyle::PPDIS_AfterHash)
776 Line->Level += PPBranchLevel + 1;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000777 addUnwrappedLine();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000778 ++Line->Level;
Manuel Klimek1b896292013-01-07 09:34:28 +0000779
780 // Errors during a preprocessor directive can only affect the layout of the
781 // preprocessor directive, and thus we ignore them. An alternative approach
782 // would be to use the same approach we use on the file level (no
783 // re-indentation if there was a structural error) within the macro
784 // definition.
Manuel Klimek1abf7892013-01-04 23:34:14 +0000785 parseFile();
786}
787
788void UnwrappedLineParser::parsePPUnknown() {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000789 do {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000790 nextToken();
791 } while (!eof());
Krasimir Georgievad47c902017-08-30 14:34:57 +0000792 if (Style.IndentPPDirectives == FormatStyle::PPDIS_AfterHash)
793 Line->Level += PPBranchLevel + 1;
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000794 addUnwrappedLine();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000795 IfNdefCondition = nullptr;
Daniel Jasperf7935112012-12-03 18:12:45 +0000796}
797
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000798// Here we blacklist certain tokens that are not usually the first token in an
799// unwrapped line. This is used in attempt to distinguish macro calls without
800// trailing semicolons from other constructs split to several lines.
Benjamin Kramer8407df72015-03-09 16:47:52 +0000801static bool tokenCanStartNewLine(const clang::Token &Tok) {
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000802 // Semicolon can be a null-statement, l_square can be a start of a macro or
803 // a C++11 attribute, but this doesn't seem to be common.
804 return Tok.isNot(tok::semi) && Tok.isNot(tok::l_brace) &&
805 Tok.isNot(tok::l_square) &&
806 // Tokens that can only be used as binary operators and a part of
807 // overloaded operator names.
808 Tok.isNot(tok::period) && Tok.isNot(tok::periodstar) &&
809 Tok.isNot(tok::arrow) && Tok.isNot(tok::arrowstar) &&
810 Tok.isNot(tok::less) && Tok.isNot(tok::greater) &&
811 Tok.isNot(tok::slash) && Tok.isNot(tok::percent) &&
812 Tok.isNot(tok::lessless) && Tok.isNot(tok::greatergreater) &&
813 Tok.isNot(tok::equal) && Tok.isNot(tok::plusequal) &&
814 Tok.isNot(tok::minusequal) && Tok.isNot(tok::starequal) &&
815 Tok.isNot(tok::slashequal) && Tok.isNot(tok::percentequal) &&
816 Tok.isNot(tok::ampequal) && Tok.isNot(tok::pipeequal) &&
817 Tok.isNot(tok::caretequal) && Tok.isNot(tok::greatergreaterequal) &&
818 Tok.isNot(tok::lesslessequal) &&
819 // Colon is used in labels, base class lists, initializer lists,
820 // range-based for loops, ternary operator, but should never be the
821 // first token in an unwrapped line.
Daniel Jasper5ebb2f32014-05-21 13:08:17 +0000822 Tok.isNot(tok::colon) &&
823 // 'noexcept' is a trailing annotation.
824 Tok.isNot(tok::kw_noexcept);
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000825}
826
Martin Probst533965c2016-04-19 18:19:06 +0000827static bool mustBeJSIdent(const AdditionalKeywords &Keywords,
828 const FormatToken *FormatTok) {
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000829 // FIXME: This returns true for C/C++ keywords like 'struct'.
830 return FormatTok->is(tok::identifier) &&
831 (FormatTok->Tok.getIdentifierInfo() == nullptr ||
Martin Probst3dbbefa2016-11-10 16:21:02 +0000832 !FormatTok->isOneOf(
833 Keywords.kw_in, Keywords.kw_of, Keywords.kw_as, Keywords.kw_async,
834 Keywords.kw_await, Keywords.kw_yield, Keywords.kw_finally,
835 Keywords.kw_function, Keywords.kw_import, Keywords.kw_is,
836 Keywords.kw_let, Keywords.kw_var, tok::kw_const,
837 Keywords.kw_abstract, Keywords.kw_extends, Keywords.kw_implements,
838 Keywords.kw_instanceof, Keywords.kw_interface,
Martin Probst93008f02017-07-18 14:00:19 +0000839 Keywords.kw_throws, Keywords.kw_from));
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000840}
841
Martin Probst533965c2016-04-19 18:19:06 +0000842static bool mustBeJSIdentOrValue(const AdditionalKeywords &Keywords,
843 const FormatToken *FormatTok) {
Martin Probstb9316ff2016-09-18 17:21:52 +0000844 return FormatTok->Tok.isLiteral() ||
845 FormatTok->isOneOf(tok::kw_true, tok::kw_false) ||
846 mustBeJSIdent(Keywords, FormatTok);
Martin Probst533965c2016-04-19 18:19:06 +0000847}
848
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000849// isJSDeclOrStmt returns true if |FormatTok| starts a declaration or statement
850// when encountered after a value (see mustBeJSIdentOrValue).
851static bool isJSDeclOrStmt(const AdditionalKeywords &Keywords,
852 const FormatToken *FormatTok) {
853 return FormatTok->isOneOf(
Martin Probst5f8445b2016-04-24 22:05:09 +0000854 tok::kw_return, Keywords.kw_yield,
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000855 // conditionals
856 tok::kw_if, tok::kw_else,
857 // loops
858 tok::kw_for, tok::kw_while, tok::kw_do, tok::kw_continue, tok::kw_break,
859 // switch/case
860 tok::kw_switch, tok::kw_case,
861 // exceptions
862 tok::kw_throw, tok::kw_try, tok::kw_catch, Keywords.kw_finally,
863 // declaration
864 tok::kw_const, tok::kw_class, Keywords.kw_var, Keywords.kw_let,
Martin Probst5f8445b2016-04-24 22:05:09 +0000865 Keywords.kw_async, Keywords.kw_function,
866 // import/export
867 Keywords.kw_import, tok::kw_export);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000868}
869
870// readTokenWithJavaScriptASI reads the next token and terminates the current
871// line if JavaScript Automatic Semicolon Insertion must
872// happen between the current token and the next token.
873//
874// This method is conservative - it cannot cover all edge cases of JavaScript,
875// but only aims to correctly handle certain well known cases. It *must not*
876// return true in speculative cases.
877void UnwrappedLineParser::readTokenWithJavaScriptASI() {
878 FormatToken *Previous = FormatTok;
879 readToken();
880 FormatToken *Next = FormatTok;
881
882 bool IsOnSameLine =
883 CommentsBeforeNextToken.empty()
884 ? Next->NewlinesBefore == 0
885 : CommentsBeforeNextToken.front()->NewlinesBefore == 0;
886 if (IsOnSameLine)
887 return;
888
889 bool PreviousMustBeValue = mustBeJSIdentOrValue(Keywords, Previous);
Martin Probst717f6dc2016-10-21 05:11:38 +0000890 bool PreviousStartsTemplateExpr =
891 Previous->is(TT_TemplateString) && Previous->TokenText.endswith("${");
Martin Probstbbffeac2016-04-11 07:35:57 +0000892 if (PreviousMustBeValue && Line && Line->Tokens.size() > 1) {
893 // If the token before the previous one is an '@', the previous token is an
894 // annotation and can precede another identifier/value.
Benjamin Kramer5ffc24e2016-04-11 12:19:19 +0000895 const FormatToken *PrePrevious = std::prev(Line->Tokens.end(), 2)->Tok;
Martin Probstbbffeac2016-04-11 07:35:57 +0000896 if (PrePrevious->is(tok::at))
897 return;
898 }
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000899 if (Next->is(tok::exclaim) && PreviousMustBeValue)
Martin Probstd40bca42017-01-09 08:56:36 +0000900 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000901 bool NextMustBeValue = mustBeJSIdentOrValue(Keywords, Next);
Martin Probst717f6dc2016-10-21 05:11:38 +0000902 bool NextEndsTemplateExpr =
903 Next->is(TT_TemplateString) && Next->TokenText.startswith("}");
904 if (NextMustBeValue && !NextEndsTemplateExpr && !PreviousStartsTemplateExpr &&
905 (PreviousMustBeValue ||
906 Previous->isOneOf(tok::r_square, tok::r_paren, tok::plusplus,
907 tok::minusminus)))
Martin Probstd40bca42017-01-09 08:56:36 +0000908 return addUnwrappedLine();
Martin Probst0a19d432017-08-09 15:19:16 +0000909 if ((PreviousMustBeValue || Previous->is(tok::r_paren)) &&
910 isJSDeclOrStmt(Keywords, Next))
Martin Probstd40bca42017-01-09 08:56:36 +0000911 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000912}
913
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000914void UnwrappedLineParser::parseStructuralElement() {
Daniel Jasper498f5582015-12-25 08:53:31 +0000915 assert(!FormatTok->is(tok::l_brace));
916 if (Style.Language == FormatStyle::LK_TableGen &&
917 FormatTok->is(tok::pp_include)) {
918 nextToken();
919 if (FormatTok->is(tok::string_literal))
920 nextToken();
921 addUnwrappedLine();
922 return;
923 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000924 switch (FormatTok->Tok.getKind()) {
Nico Weber04e9f1a2013-01-07 19:05:19 +0000925 case tok::at:
926 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000927 if (FormatTok->Tok.is(tok::l_brace)) {
Krasimir Georgiev26b144c2017-07-03 15:05:14 +0000928 nextToken();
Nico Weber372d8dc2013-02-10 20:35:35 +0000929 parseBracedList();
930 break;
931 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000932 switch (FormatTok->Tok.getObjCKeywordID()) {
Nico Weber04e9f1a2013-01-07 19:05:19 +0000933 case tok::objc_public:
934 case tok::objc_protected:
935 case tok::objc_package:
936 case tok::objc_private:
937 return parseAccessSpecifier();
Nico Weber7eecf4b2013-01-09 20:25:35 +0000938 case tok::objc_interface:
Nico Weber2ce0ac52013-01-09 23:25:37 +0000939 case tok::objc_implementation:
940 return parseObjCInterfaceOrImplementation();
Nico Weber8696a8d2013-01-09 21:15:03 +0000941 case tok::objc_protocol:
942 return parseObjCProtocol();
Nico Weberd8ffe752013-01-09 21:42:32 +0000943 case tok::objc_end:
944 return; // Handled by the caller.
Nico Weber51306d22013-01-10 00:25:19 +0000945 case tok::objc_optional:
946 case tok::objc_required:
947 nextToken();
948 addUnwrappedLine();
949 return;
Nico Weber45c48122015-06-28 01:06:16 +0000950 case tok::objc_autoreleasepool:
951 nextToken();
952 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000953 if (Style.BraceWrapping.AfterObjCDeclaration)
Nico Weber45c48122015-06-28 01:06:16 +0000954 addUnwrappedLine();
955 parseBlock(/*MustBeDeclaration=*/false);
956 }
957 addUnwrappedLine();
958 return;
Nico Weber33381f52015-02-07 01:57:32 +0000959 case tok::objc_try:
960 // This branch isn't strictly necessary (the kw_try case below would
961 // do this too after the tok::at is parsed above). But be explicit.
962 parseTryCatch();
963 return;
Nico Weber04e9f1a2013-01-07 19:05:19 +0000964 default:
965 break;
966 }
967 break;
Daniel Jasper8f463652014-08-26 23:15:12 +0000968 case tok::kw_asm:
Daniel Jasper8f463652014-08-26 23:15:12 +0000969 nextToken();
970 if (FormatTok->is(tok::l_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000971 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper2337f282015-01-12 10:14:56 +0000972 nextToken();
Daniel Jasper4429f142014-08-27 17:16:46 +0000973 while (FormatTok && FormatTok->isNot(tok::eof)) {
Daniel Jasper8f463652014-08-26 23:15:12 +0000974 if (FormatTok->is(tok::r_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000975 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper8f463652014-08-26 23:15:12 +0000976 nextToken();
Daniel Jasper790d4f92015-05-11 11:59:46 +0000977 addUnwrappedLine();
Daniel Jasper8f463652014-08-26 23:15:12 +0000978 break;
979 }
Daniel Jasper2337f282015-01-12 10:14:56 +0000980 FormatTok->Finalized = true;
Daniel Jasper8f463652014-08-26 23:15:12 +0000981 nextToken();
982 }
983 }
984 break;
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000985 case tok::kw_namespace:
986 parseNamespace();
987 return;
Dmitri Gribenko58d64e22012-12-30 21:27:25 +0000988 case tok::kw_inline:
989 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000990 if (FormatTok->Tok.is(tok::kw_namespace)) {
Dmitri Gribenko58d64e22012-12-30 21:27:25 +0000991 parseNamespace();
992 return;
993 }
994 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +0000995 case tok::kw_public:
996 case tok::kw_protected:
997 case tok::kw_private:
Daniel Jasper83709082015-02-18 17:14:05 +0000998 if (Style.Language == FormatStyle::LK_Java ||
999 Style.Language == FormatStyle::LK_JavaScript)
Daniel Jasperc58c70e2014-09-15 11:21:46 +00001000 nextToken();
1001 else
1002 parseAccessSpecifier();
Daniel Jasperf7935112012-12-03 18:12:45 +00001003 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001004 case tok::kw_if:
1005 parseIfThenElse();
Daniel Jasperf7935112012-12-03 18:12:45 +00001006 return;
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001007 case tok::kw_for:
1008 case tok::kw_while:
1009 parseForOrWhileLoop();
1010 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001011 case tok::kw_do:
1012 parseDoWhile();
1013 return;
1014 case tok::kw_switch:
Martin Probstf785fd92017-08-04 17:07:15 +00001015 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration)
1016 // 'switch: string' field declaration.
1017 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001018 parseSwitch();
1019 return;
1020 case tok::kw_default:
Martin Probstf785fd92017-08-04 17:07:15 +00001021 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration)
1022 // 'default: string' field declaration.
1023 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001024 nextToken();
1025 parseLabel();
1026 return;
1027 case tok::kw_case:
Martin Probstf785fd92017-08-04 17:07:15 +00001028 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration)
1029 // 'case: string' field declaration.
1030 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001031 parseCaseLabel();
1032 return;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001033 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +00001034 case tok::kw___try:
Daniel Jasper04a71a42014-05-08 11:58:24 +00001035 parseTryCatch();
1036 return;
Manuel Klimekae610d12013-01-21 14:32:05 +00001037 case tok::kw_extern:
1038 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001039 if (FormatTok->Tok.is(tok::string_literal)) {
Manuel Klimekae610d12013-01-21 14:32:05 +00001040 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001041 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasper65ee3472013-07-31 23:16:02 +00001042 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/false);
Manuel Klimekae610d12013-01-21 14:32:05 +00001043 addUnwrappedLine();
1044 return;
1045 }
1046 }
Daniel Jaspere1e43192014-04-01 12:55:11 +00001047 break;
Daniel Jasperfca735c2015-02-19 16:14:18 +00001048 case tok::kw_export:
1049 if (Style.Language == FormatStyle::LK_JavaScript) {
1050 parseJavaScriptEs6ImportExport();
1051 return;
1052 }
1053 break;
Daniel Jaspere1e43192014-04-01 12:55:11 +00001054 case tok::identifier:
Daniel Jasper66cb8c52015-05-04 09:22:29 +00001055 if (FormatTok->is(TT_ForEachMacro)) {
Daniel Jaspere1e43192014-04-01 12:55:11 +00001056 parseForOrWhileLoop();
1057 return;
1058 }
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +00001059 if (FormatTok->is(TT_MacroBlockBegin)) {
1060 parseBlock(/*MustBeDeclaration=*/false, /*AddLevel=*/true,
1061 /*MunchSemi=*/false);
1062 return;
1063 }
Daniel Jasper3d5a7d62016-06-20 18:20:38 +00001064 if (FormatTok->is(Keywords.kw_import)) {
1065 if (Style.Language == FormatStyle::LK_JavaScript) {
1066 parseJavaScriptEs6ImportExport();
1067 return;
1068 }
1069 if (Style.Language == FormatStyle::LK_Proto) {
1070 nextToken();
Daniel Jasper8b61d142016-06-20 20:39:53 +00001071 if (FormatTok->is(tok::kw_public))
1072 nextToken();
Daniel Jasper3d5a7d62016-06-20 18:20:38 +00001073 if (!FormatTok->is(tok::string_literal))
1074 return;
1075 nextToken();
1076 if (FormatTok->is(tok::semi))
1077 nextToken();
1078 addUnwrappedLine();
1079 return;
1080 }
Daniel Jasper354aa512015-02-19 16:07:32 +00001081 }
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001082 if (Style.isCpp() &&
Daniel Jasper72b33572017-03-31 12:04:37 +00001083 FormatTok->isOneOf(Keywords.kw_signals, Keywords.kw_qsignals,
Daniel Jaspera00de632015-12-01 12:05:04 +00001084 Keywords.kw_slots, Keywords.kw_qslots)) {
Daniel Jasperde0d1f32015-04-24 07:50:34 +00001085 nextToken();
1086 if (FormatTok->is(tok::colon)) {
1087 nextToken();
1088 addUnwrappedLine();
Daniel Jasper31343832016-07-27 10:13:24 +00001089 return;
Daniel Jasperde0d1f32015-04-24 07:50:34 +00001090 }
Daniel Jasper53395402015-04-07 15:04:40 +00001091 }
Manuel Klimekae610d12013-01-21 14:32:05 +00001092 // In all other cases, parse the declaration.
1093 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001094 default:
1095 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001096 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001097 do {
Daniel Jaspera7900ad2016-05-08 18:12:22 +00001098 const FormatToken *Previous = getPreviousToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001099 switch (FormatTok->Tok.getKind()) {
Nico Weber372d8dc2013-02-10 20:35:35 +00001100 case tok::at:
1101 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001102 if (FormatTok->Tok.is(tok::l_brace)) {
1103 nextToken();
Nico Weber372d8dc2013-02-10 20:35:35 +00001104 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001105 }
Nico Weber372d8dc2013-02-10 20:35:35 +00001106 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001107 case tok::kw_enum:
Daniel Jaspera7900ad2016-05-08 18:12:22 +00001108 // Ignore if this is part of "template <enum ...".
1109 if (Previous && Previous->is(tok::less)) {
1110 nextToken();
1111 break;
1112 }
1113
Daniel Jasper90cf3802015-06-17 09:44:02 +00001114 // parseEnum falls through and does not yet add an unwrapped line as an
1115 // enum definition can start a structural element.
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001116 if (!parseEnum())
1117 break;
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001118 // This only applies for C++.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001119 if (!Style.isCpp()) {
Daniel Jasper90cf3802015-06-17 09:44:02 +00001120 addUnwrappedLine();
1121 return;
1122 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001123 break;
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001124 case tok::kw_typedef:
1125 nextToken();
Daniel Jasper31f6c542014-12-05 10:42:21 +00001126 if (FormatTok->isOneOf(Keywords.kw_NS_ENUM, Keywords.kw_NS_OPTIONS,
1127 Keywords.kw_CF_ENUM, Keywords.kw_CF_OPTIONS))
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001128 parseEnum();
1129 break;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001130 case tok::kw_struct:
1131 case tok::kw_union:
Manuel Klimek28cacc72013-01-07 18:10:23 +00001132 case tok::kw_class:
Daniel Jasper910807d2015-06-12 04:52:02 +00001133 // parseRecord falls through and does not yet add an unwrapped line as a
1134 // record declaration or definition can start a structural element.
Manuel Klimeke01bab52013-01-15 13:38:33 +00001135 parseRecord();
Daniel Jasper910807d2015-06-12 04:52:02 +00001136 // This does not apply for Java and JavaScript.
1137 if (Style.Language == FormatStyle::LK_Java ||
1138 Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperd5ec65b2016-01-08 07:06:07 +00001139 if (FormatTok->is(tok::semi))
1140 nextToken();
Daniel Jasper910807d2015-06-12 04:52:02 +00001141 addUnwrappedLine();
1142 return;
1143 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00001144 break;
Daniel Jaspere5d74862014-11-26 08:17:08 +00001145 case tok::period:
1146 nextToken();
1147 // In Java, classes have an implicit static member "class".
1148 if (Style.Language == FormatStyle::LK_Java && FormatTok &&
1149 FormatTok->is(tok::kw_class))
1150 nextToken();
Daniel Jasperba52fcb2015-09-28 14:29:45 +00001151 if (Style.Language == FormatStyle::LK_JavaScript && FormatTok &&
1152 FormatTok->Tok.getIdentifierInfo())
1153 // JavaScript only has pseudo keywords, all keywords are allowed to
1154 // appear in "IdentifierName" positions. See http://es5.github.io/#x7.6
1155 nextToken();
Daniel Jaspere5d74862014-11-26 08:17:08 +00001156 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001157 case tok::semi:
1158 nextToken();
1159 addUnwrappedLine();
1160 return;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001161 case tok::r_brace:
1162 addUnwrappedLine();
1163 return;
Daniel Jasperf7935112012-12-03 18:12:45 +00001164 case tok::l_paren:
1165 parseParens();
1166 break;
Daniel Jasper5af04a42015-10-07 03:43:10 +00001167 case tok::kw_operator:
1168 nextToken();
1169 if (FormatTok->isBinaryOperator())
1170 nextToken();
1171 break;
Manuel Klimek516e0542013-09-04 13:25:30 +00001172 case tok::caret:
1173 nextToken();
Daniel Jasper395193c2014-03-28 07:48:59 +00001174 if (FormatTok->Tok.isAnyIdentifier() ||
1175 FormatTok->isSimpleTypeSpecifier())
1176 nextToken();
1177 if (FormatTok->is(tok::l_paren))
1178 parseParens();
1179 if (FormatTok->is(tok::l_brace))
Manuel Klimek516e0542013-09-04 13:25:30 +00001180 parseChildBlock();
Manuel Klimek516e0542013-09-04 13:25:30 +00001181 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001182 case tok::l_brace:
Manuel Klimekab419912013-05-23 09:41:43 +00001183 if (!tryToParseBracedList()) {
1184 // A block outside of parentheses must be the last part of a
1185 // structural element.
1186 // FIXME: Figure out cases where this is not true, and add projections
1187 // for them (the one we know is missing are lambdas).
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001188 if (Style.BraceWrapping.AfterFunction)
Manuel Klimekab419912013-05-23 09:41:43 +00001189 addUnwrappedLine();
Alexander Kornienko3cfa9732013-11-20 16:33:05 +00001190 FormatTok->Type = TT_FunctionLBrace;
Nico Weber9096fc02013-06-26 00:30:14 +00001191 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001192 addUnwrappedLine();
Manuel Klimekab419912013-05-23 09:41:43 +00001193 return;
1194 }
1195 // Otherwise this was a braced init list, and the structural
1196 // element continues.
1197 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001198 case tok::kw_try:
1199 // We arrive here when parsing function-try blocks.
1200 parseTryCatch();
1201 return;
Daniel Jasper40e19212013-05-29 13:16:10 +00001202 case tok::identifier: {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +00001203 if (FormatTok->is(TT_MacroBlockEnd)) {
1204 addUnwrappedLine();
1205 return;
1206 }
1207
Martin Probst973ff792017-04-27 13:07:24 +00001208 // Function declarations (as opposed to function expressions) are parsed
1209 // on their own unwrapped line by continuing this loop. Function
1210 // expressions (functions that are not on their own line) must not create
1211 // a new unwrapped line, so they are special cased below.
1212 size_t TokenCount = Line->Tokens.size();
Daniel Jasper9326f912015-05-05 08:40:32 +00001213 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst973ff792017-04-27 13:07:24 +00001214 FormatTok->is(Keywords.kw_function) &&
1215 (TokenCount > 1 || (TokenCount == 1 && !Line->Tokens.front().Tok->is(
1216 Keywords.kw_async)))) {
Daniel Jasper069e5f42014-05-20 11:14:57 +00001217 tryToParseJSFunction();
1218 break;
1219 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001220 if ((Style.Language == FormatStyle::LK_JavaScript ||
1221 Style.Language == FormatStyle::LK_Java) &&
1222 FormatTok->is(Keywords.kw_interface)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001223 if (Style.Language == FormatStyle::LK_JavaScript) {
1224 // In JavaScript/TypeScript, "interface" can be used as a standalone
1225 // identifier, e.g. in `var interface = 1;`. If "interface" is
1226 // followed by another identifier, it is very like to be an actual
1227 // interface declaration.
1228 unsigned StoredPosition = Tokens->getPosition();
1229 FormatToken *Next = Tokens->getNextToken();
1230 FormatTok = Tokens->setPosition(StoredPosition);
Martin Probst533965c2016-04-19 18:19:06 +00001231 if (Next && !mustBeJSIdent(Keywords, Next)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001232 nextToken();
1233 break;
1234 }
1235 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001236 parseRecord();
Daniel Jasper259188b2015-06-12 04:56:34 +00001237 addUnwrappedLine();
Daniel Jasper5c235c02015-07-06 14:26:04 +00001238 return;
Daniel Jasper9326f912015-05-05 08:40:32 +00001239 }
1240
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00001241 // See if the following token should start a new unwrapped line.
Daniel Jasper9326f912015-05-05 08:40:32 +00001242 StringRef Text = FormatTok->TokenText;
Daniel Jasperf7935112012-12-03 18:12:45 +00001243 nextToken();
Daniel Jasper83709082015-02-18 17:14:05 +00001244 if (Line->Tokens.size() == 1 &&
1245 // JS doesn't have macros, and within classes colons indicate fields,
1246 // not labels.
Daniel Jasper676e5162015-04-07 14:36:33 +00001247 Style.Language != FormatStyle::LK_JavaScript) {
1248 if (FormatTok->Tok.is(tok::colon) && !Line->MustBeDeclaration) {
Daniel Jasper40609472016-04-06 15:02:46 +00001249 Line->Tokens.begin()->Tok->MustBreakBefore = true;
Alexander Kornienkode644272013-04-08 22:16:06 +00001250 parseLabel();
1251 return;
1252 }
Daniel Jasper680b09b2014-11-05 10:48:04 +00001253 // Recognize function-like macro usages without trailing semicolon as
Daniel Jasper83709082015-02-18 17:14:05 +00001254 // well as free-standing macros like Q_OBJECT.
Daniel Jasper680b09b2014-11-05 10:48:04 +00001255 bool FunctionLike = FormatTok->is(tok::l_paren);
1256 if (FunctionLike)
Alexander Kornienkode644272013-04-08 22:16:06 +00001257 parseParens();
Daniel Jaspere60cba12015-05-13 11:35:53 +00001258
1259 bool FollowedByNewline =
1260 CommentsBeforeNextToken.empty()
1261 ? FormatTok->NewlinesBefore > 0
1262 : CommentsBeforeNextToken.front()->NewlinesBefore > 0;
1263
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001264 if (FollowedByNewline && (Text.size() >= 5 || FunctionLike) &&
Daniel Jasper680b09b2014-11-05 10:48:04 +00001265 tokenCanStartNewLine(FormatTok->Tok) && Text == Text.upper()) {
Daniel Jasper40e19212013-05-29 13:16:10 +00001266 addUnwrappedLine();
Daniel Jasper41a0f782013-05-29 14:09:17 +00001267 return;
Alexander Kornienkode644272013-04-08 22:16:06 +00001268 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001269 }
1270 break;
Daniel Jasper40e19212013-05-29 13:16:10 +00001271 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001272 case tok::equal:
Manuel Klimek79e06082015-05-21 12:23:34 +00001273 // Fat arrows (=>) have tok::TokenKind tok::equal but TokenType
1274 // TT_JsFatArrow. The always start an expression or a child block if
1275 // followed by a curly.
1276 if (FormatTok->is(TT_JsFatArrow)) {
1277 nextToken();
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001278 if (FormatTok->is(tok::l_brace))
Manuel Klimek79e06082015-05-21 12:23:34 +00001279 parseChildBlock();
Manuel Klimek79e06082015-05-21 12:23:34 +00001280 break;
1281 }
1282
Daniel Jaspere25509f2012-12-17 11:29:41 +00001283 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001284 if (FormatTok->Tok.is(tok::l_brace)) {
1285 nextToken();
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001286 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001287 } else if (Style.Language == FormatStyle::LK_Proto &&
1288 FormatTok->Tok.is(tok::less)) {
1289 nextToken();
Krasimir Georgiev0b41fcb2017-06-27 13:58:41 +00001290 parseBracedList(/*ContinueOnSemicolons=*/false,
1291 /*ClosingBraceKind=*/tok::greater);
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001292 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001293 break;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001294 case tok::l_square:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001295 parseSquare();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001296 break;
Daniel Jasper6acf5132015-03-12 14:44:29 +00001297 case tok::kw_new:
1298 parseNew();
1299 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001300 default:
1301 nextToken();
1302 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001303 }
1304 } while (!eof());
1305}
1306
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001307bool UnwrappedLineParser::tryToParseLambda() {
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001308 if (!Style.isCpp()) {
Daniel Jasper1feab0f2015-06-02 15:31:37 +00001309 nextToken();
1310 return false;
1311 }
Daniel Jasperb9a49902016-01-09 15:56:28 +00001312 const FormatToken* Previous = getPreviousToken();
1313 if (Previous &&
1314 (Previous->isOneOf(tok::identifier, tok::kw_operator, tok::kw_new,
1315 tok::kw_delete) ||
1316 Previous->closesScope() || Previous->isSimpleTypeSpecifier())) {
Daniel Jasperbf02b2c12013-09-05 11:49:39 +00001317 nextToken();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001318 return false;
Daniel Jasperbf02b2c12013-09-05 11:49:39 +00001319 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001320 assert(FormatTok->is(tok::l_square));
1321 FormatToken &LSquare = *FormatTok;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001322 if (!tryToParseLambdaIntroducer())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001323 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001324
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00001325 while (FormatTok->isNot(tok::l_brace)) {
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001326 if (FormatTok->isSimpleTypeSpecifier()) {
1327 nextToken();
1328 continue;
1329 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001330 switch (FormatTok->Tok.getKind()) {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001331 case tok::l_brace:
1332 break;
1333 case tok::l_paren:
1334 parseParens();
1335 break;
Daniel Jasperbcb55ee2014-11-21 14:08:38 +00001336 case tok::amp:
1337 case tok::star:
1338 case tok::kw_const:
Daniel Jasper3431b752014-12-08 13:22:37 +00001339 case tok::comma:
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001340 case tok::less:
1341 case tok::greater:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001342 case tok::identifier:
Daniel Jasper5eaa0092015-08-13 13:37:08 +00001343 case tok::numeric_constant:
Daniel Jasper1067ab02014-02-11 10:16:55 +00001344 case tok::coloncolon:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001345 case tok::kw_mutable:
Daniel Jasper81a20782014-03-10 10:02:02 +00001346 nextToken();
1347 break;
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001348 case tok::arrow:
Daniel Jasper6f2b88a2015-06-05 13:18:09 +00001349 FormatTok->Type = TT_LambdaArrow;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001350 nextToken();
1351 break;
1352 default:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001353 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001354 }
1355 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001356 LSquare.Type = TT_LambdaLSquare;
Manuel Klimek516e0542013-09-04 13:25:30 +00001357 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001358 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001359}
1360
1361bool UnwrappedLineParser::tryToParseLambdaIntroducer() {
1362 nextToken();
1363 if (FormatTok->is(tok::equal)) {
1364 nextToken();
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001365 if (FormatTok->is(tok::r_square)) {
1366 nextToken();
1367 return true;
1368 }
1369 if (FormatTok->isNot(tok::comma))
1370 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001371 nextToken();
1372 } else if (FormatTok->is(tok::amp)) {
1373 nextToken();
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001374 if (FormatTok->is(tok::r_square)) {
1375 nextToken();
1376 return true;
1377 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001378 if (!FormatTok->isOneOf(tok::comma, tok::identifier)) {
1379 return false;
1380 }
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001381 if (FormatTok->is(tok::comma))
1382 nextToken();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001383 } else if (FormatTok->is(tok::r_square)) {
1384 nextToken();
1385 return true;
1386 }
1387 do {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001388 if (FormatTok->is(tok::amp))
1389 nextToken();
1390 if (!FormatTok->isOneOf(tok::identifier, tok::kw_this))
1391 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001392 nextToken();
Daniel Jasperda18fd82014-06-10 06:39:03 +00001393 if (FormatTok->is(tok::ellipsis))
1394 nextToken();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001395 if (FormatTok->is(tok::comma)) {
1396 nextToken();
1397 } else if (FormatTok->is(tok::r_square)) {
1398 nextToken();
1399 return true;
1400 } else {
1401 return false;
1402 }
1403 } while (!eof());
1404 return false;
1405}
1406
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001407void UnwrappedLineParser::tryToParseJSFunction() {
Martin Probst409697e2016-05-29 14:41:07 +00001408 assert(FormatTok->is(Keywords.kw_function) ||
1409 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function));
Martin Probst5f8445b2016-04-24 22:05:09 +00001410 if (FormatTok->is(Keywords.kw_async))
1411 nextToken();
1412 // Consume "function".
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001413 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001414
Daniel Jasper71e50af2016-11-01 06:22:59 +00001415 // Consume * (generator function). Treat it like C++'s overloaded operators.
1416 if (FormatTok->is(tok::star)) {
1417 FormatTok->Type = TT_OverloadedOperator;
Martin Probst5f8445b2016-04-24 22:05:09 +00001418 nextToken();
Daniel Jasper71e50af2016-11-01 06:22:59 +00001419 }
Martin Probst5f8445b2016-04-24 22:05:09 +00001420
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001421 // Consume function name.
1422 if (FormatTok->is(tok::identifier))
Daniel Jasperfca735c2015-02-19 16:14:18 +00001423 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001424
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001425 if (FormatTok->isNot(tok::l_paren))
1426 return;
Manuel Klimek79e06082015-05-21 12:23:34 +00001427
1428 // Parse formal parameter list.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001429 parseParens();
Manuel Klimek79e06082015-05-21 12:23:34 +00001430
1431 if (FormatTok->is(tok::colon)) {
1432 // Parse a type definition.
1433 nextToken();
1434
1435 // Eat the type declaration. For braced inline object types, balance braces,
1436 // otherwise just parse until finding an l_brace for the function body.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001437 if (FormatTok->is(tok::l_brace))
1438 tryToParseBracedList();
1439 else
Martin Probstaf16c502017-01-04 13:36:43 +00001440 while (!FormatTok->isOneOf(tok::l_brace, tok::semi) && !eof())
Manuel Klimek79e06082015-05-21 12:23:34 +00001441 nextToken();
Manuel Klimek79e06082015-05-21 12:23:34 +00001442 }
1443
Martin Probstaf16c502017-01-04 13:36:43 +00001444 if (FormatTok->is(tok::semi))
1445 return;
1446
Manuel Klimek79e06082015-05-21 12:23:34 +00001447 parseChildBlock();
1448}
1449
Daniel Jasper3c883d12015-05-18 14:49:19 +00001450bool UnwrappedLineParser::tryToParseBracedList() {
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001451 if (FormatTok->BlockKind == BK_Unknown)
Daniel Jasper3c883d12015-05-18 14:49:19 +00001452 calculateBraceTypes();
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001453 assert(FormatTok->BlockKind != BK_Unknown);
1454 if (FormatTok->BlockKind == BK_Block)
Manuel Klimekab419912013-05-23 09:41:43 +00001455 return false;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001456 nextToken();
Manuel Klimekab419912013-05-23 09:41:43 +00001457 parseBracedList();
1458 return true;
1459}
1460
Krasimir Georgievff747be2017-06-27 13:43:07 +00001461bool UnwrappedLineParser::parseBracedList(bool ContinueOnSemicolons,
1462 tok::TokenKind ClosingBraceKind) {
Daniel Jasper015ed022013-09-13 09:20:45 +00001463 bool HasError = false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001464
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001465 // FIXME: Once we have an expression parser in the UnwrappedLineParser,
1466 // replace this by using parseAssigmentExpression() inside.
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001467 do {
Manuel Klimek79e06082015-05-21 12:23:34 +00001468 if (Style.Language == FormatStyle::LK_JavaScript) {
Martin Probst409697e2016-05-29 14:41:07 +00001469 if (FormatTok->is(Keywords.kw_function) ||
1470 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001471 tryToParseJSFunction();
1472 continue;
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001473 }
1474 if (FormatTok->is(TT_JsFatArrow)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001475 nextToken();
1476 // Fat arrows can be followed by simple expressions or by child blocks
1477 // in curly braces.
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001478 if (FormatTok->is(tok::l_brace)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001479 parseChildBlock();
1480 continue;
1481 }
1482 }
Martin Probst8e3eba02017-02-07 16:33:13 +00001483 if (FormatTok->is(tok::l_brace)) {
1484 // Could be a method inside of a braced list `{a() { return 1; }}`.
1485 if (tryToParseBracedList())
1486 continue;
1487 parseChildBlock();
1488 }
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001489 }
Krasimir Georgievff747be2017-06-27 13:43:07 +00001490 if (FormatTok->Tok.getKind() == ClosingBraceKind) {
1491 nextToken();
1492 return !HasError;
1493 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001494 switch (FormatTok->Tok.getKind()) {
Manuel Klimek516e0542013-09-04 13:25:30 +00001495 case tok::caret:
1496 nextToken();
1497 if (FormatTok->is(tok::l_brace)) {
1498 parseChildBlock();
1499 }
1500 break;
1501 case tok::l_square:
1502 tryToParseLambda();
1503 break;
Daniel Jaspera87af7a2015-06-30 11:32:22 +00001504 case tok::l_paren:
1505 parseParens();
Daniel Jasperf46dec82015-03-31 14:34:15 +00001506 // JavaScript can just have free standing methods and getters/setters in
1507 // object literals. Detect them by a "{" following ")".
1508 if (Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperf46dec82015-03-31 14:34:15 +00001509 if (FormatTok->is(tok::l_brace))
1510 parseChildBlock();
1511 break;
1512 }
Daniel Jasperf46dec82015-03-31 14:34:15 +00001513 break;
Martin Probst8e3eba02017-02-07 16:33:13 +00001514 case tok::l_brace:
1515 // Assume there are no blocks inside a braced init list apart
1516 // from the ones we explicitly parse out (like lambdas).
1517 FormatTok->BlockKind = BK_BracedInit;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001518 nextToken();
Martin Probst8e3eba02017-02-07 16:33:13 +00001519 parseBracedList();
1520 break;
Krasimir Georgievfa4dbb62017-08-03 13:43:45 +00001521 case tok::less:
1522 if (Style.Language == FormatStyle::LK_Proto) {
1523 nextToken();
1524 parseBracedList(/*ContinueOnSemicolons=*/false,
1525 /*ClosingBraceKind=*/tok::greater);
1526 } else {
1527 nextToken();
1528 }
1529 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001530 case tok::semi:
Daniel Jasperb9a49902016-01-09 15:56:28 +00001531 // JavaScript (or more precisely TypeScript) can have semicolons in braced
1532 // lists (in so-called TypeMemberLists). Thus, the semicolon cannot be
1533 // used for error recovery if we have otherwise determined that this is
1534 // a braced list.
1535 if (Style.Language == FormatStyle::LK_JavaScript) {
1536 nextToken();
1537 break;
1538 }
Daniel Jasper015ed022013-09-13 09:20:45 +00001539 HasError = true;
1540 if (!ContinueOnSemicolons)
1541 return !HasError;
1542 nextToken();
1543 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001544 case tok::comma:
1545 nextToken();
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001546 break;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001547 default:
1548 nextToken();
1549 break;
1550 }
1551 } while (!eof());
Daniel Jasper015ed022013-09-13 09:20:45 +00001552 return false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001553}
1554
Daniel Jasperf7935112012-12-03 18:12:45 +00001555void UnwrappedLineParser::parseParens() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001556 assert(FormatTok->Tok.is(tok::l_paren) && "'(' expected.");
Daniel Jasperf7935112012-12-03 18:12:45 +00001557 nextToken();
1558 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001559 switch (FormatTok->Tok.getKind()) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001560 case tok::l_paren:
1561 parseParens();
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001562 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_brace))
1563 parseChildBlock();
Daniel Jasperf7935112012-12-03 18:12:45 +00001564 break;
1565 case tok::r_paren:
1566 nextToken();
1567 return;
Daniel Jasper393564f2013-05-31 14:56:29 +00001568 case tok::r_brace:
1569 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1570 return;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001571 case tok::l_square:
1572 tryToParseLambda();
1573 break;
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001574 case tok::l_brace:
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001575 if (!tryToParseBracedList())
Manuel Klimekf017dc02013-09-04 13:34:14 +00001576 parseChildBlock();
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001577 break;
Nico Weber372d8dc2013-02-10 20:35:35 +00001578 case tok::at:
1579 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001580 if (FormatTok->Tok.is(tok::l_brace)) {
1581 nextToken();
Nico Weber372d8dc2013-02-10 20:35:35 +00001582 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001583 }
Nico Weber372d8dc2013-02-10 20:35:35 +00001584 break;
Martin Probst1027fb82017-02-07 14:05:30 +00001585 case tok::kw_class:
1586 if (Style.Language == FormatStyle::LK_JavaScript)
1587 parseRecord(/*ParseAsExpr=*/true);
1588 else
1589 nextToken();
1590 break;
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001591 case tok::identifier:
1592 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst409697e2016-05-29 14:41:07 +00001593 (FormatTok->is(Keywords.kw_function) ||
1594 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)))
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001595 tryToParseJSFunction();
1596 else
1597 nextToken();
1598 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001599 default:
1600 nextToken();
1601 break;
1602 }
1603 } while (!eof());
1604}
1605
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001606void UnwrappedLineParser::parseSquare() {
1607 assert(FormatTok->Tok.is(tok::l_square) && "'[' expected.");
1608 if (tryToParseLambda())
1609 return;
1610 do {
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001611 switch (FormatTok->Tok.getKind()) {
1612 case tok::l_paren:
1613 parseParens();
1614 break;
1615 case tok::r_square:
1616 nextToken();
1617 return;
1618 case tok::r_brace:
1619 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1620 return;
1621 case tok::l_square:
1622 parseSquare();
1623 break;
1624 case tok::l_brace: {
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001625 if (!tryToParseBracedList())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001626 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001627 break;
1628 }
1629 case tok::at:
1630 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001631 if (FormatTok->Tok.is(tok::l_brace)) {
1632 nextToken();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001633 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001634 }
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001635 break;
1636 default:
1637 nextToken();
1638 break;
1639 }
1640 } while (!eof());
1641}
1642
Daniel Jasperf7935112012-12-03 18:12:45 +00001643void UnwrappedLineParser::parseIfThenElse() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001644 assert(FormatTok->Tok.is(tok::kw_if) && "'if' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001645 nextToken();
Daniel Jasper6a7d5a72017-06-19 07:40:49 +00001646 if (FormatTok->Tok.is(tok::kw_constexpr))
1647 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001648 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimekadededf2013-01-11 18:28:36 +00001649 parseParens();
Daniel Jasperf7935112012-12-03 18:12:45 +00001650 bool NeedsUnwrappedLine = false;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001651 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001652 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001653 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001654 if (Style.BraceWrapping.BeforeElse)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001655 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001656 else
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001657 NeedsUnwrappedLine = true;
Daniel Jasperf7935112012-12-03 18:12:45 +00001658 } else {
1659 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001660 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001661 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001662 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001663 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001664 if (FormatTok->Tok.is(tok::kw_else)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001665 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001666 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001667 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001668 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001669 addUnwrappedLine();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001670 } else if (FormatTok->Tok.is(tok::kw_if)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001671 parseIfThenElse();
1672 } else {
1673 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001674 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001675 parseStructuralElement();
Daniel Jasper451544a2016-05-19 06:30:48 +00001676 if (FormatTok->is(tok::eof))
1677 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001678 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001679 }
1680 } else if (NeedsUnwrappedLine) {
1681 addUnwrappedLine();
1682 }
1683}
1684
Daniel Jasper04a71a42014-05-08 11:58:24 +00001685void UnwrappedLineParser::parseTryCatch() {
Nico Weberfac23712015-02-04 15:26:27 +00001686 assert(FormatTok->isOneOf(tok::kw_try, tok::kw___try) && "'try' expected");
Daniel Jasper04a71a42014-05-08 11:58:24 +00001687 nextToken();
1688 bool NeedsUnwrappedLine = false;
1689 if (FormatTok->is(tok::colon)) {
1690 // We are in a function try block, what comes is an initializer list.
1691 nextToken();
1692 while (FormatTok->is(tok::identifier)) {
1693 nextToken();
1694 if (FormatTok->is(tok::l_paren))
1695 parseParens();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001696 if (FormatTok->is(tok::comma))
1697 nextToken();
1698 }
1699 }
Daniel Jaspere189d462015-01-14 10:48:41 +00001700 // Parse try with resource.
1701 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_paren)) {
1702 parseParens();
1703 }
Daniel Jasper04a71a42014-05-08 11:58:24 +00001704 if (FormatTok->is(tok::l_brace)) {
1705 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1706 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001707 if (Style.BraceWrapping.BeforeCatch) {
Daniel Jasper04a71a42014-05-08 11:58:24 +00001708 addUnwrappedLine();
1709 } else {
1710 NeedsUnwrappedLine = true;
1711 }
1712 } else if (!FormatTok->is(tok::kw_catch)) {
1713 // The C++ standard requires a compound-statement after a try.
1714 // If there's none, we try to assume there's a structuralElement
1715 // and try to continue.
Daniel Jasper04a71a42014-05-08 11:58:24 +00001716 addUnwrappedLine();
1717 ++Line->Level;
1718 parseStructuralElement();
1719 --Line->Level;
1720 }
Nico Weber33381f52015-02-07 01:57:32 +00001721 while (1) {
1722 if (FormatTok->is(tok::at))
1723 nextToken();
1724 if (!(FormatTok->isOneOf(tok::kw_catch, Keywords.kw___except,
1725 tok::kw___finally) ||
1726 ((Style.Language == FormatStyle::LK_Java ||
1727 Style.Language == FormatStyle::LK_JavaScript) &&
1728 FormatTok->is(Keywords.kw_finally)) ||
1729 (FormatTok->Tok.isObjCAtKeyword(tok::objc_catch) ||
1730 FormatTok->Tok.isObjCAtKeyword(tok::objc_finally))))
1731 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001732 nextToken();
1733 while (FormatTok->isNot(tok::l_brace)) {
1734 if (FormatTok->is(tok::l_paren)) {
1735 parseParens();
1736 continue;
1737 }
Daniel Jasper2bd7a642015-01-19 10:50:51 +00001738 if (FormatTok->isOneOf(tok::semi, tok::r_brace, tok::eof))
Daniel Jasper04a71a42014-05-08 11:58:24 +00001739 return;
1740 nextToken();
1741 }
1742 NeedsUnwrappedLine = false;
1743 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1744 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001745 if (Style.BraceWrapping.BeforeCatch)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001746 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001747 else
Daniel Jasper04a71a42014-05-08 11:58:24 +00001748 NeedsUnwrappedLine = true;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001749 }
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001750 if (NeedsUnwrappedLine)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001751 addUnwrappedLine();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001752}
1753
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001754void UnwrappedLineParser::parseNamespace() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001755 assert(FormatTok->Tok.is(tok::kw_namespace) && "'namespace' expected");
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001756
1757 const FormatToken &InitialToken = *FormatTok;
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001758 nextToken();
Saleem Abdulrasool328085f2015-10-30 05:07:56 +00001759 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon))
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001760 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001761 if (FormatTok->Tok.is(tok::l_brace)) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001762 if (ShouldBreakBeforeBrace(Style, InitialToken))
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001763 addUnwrappedLine();
1764
Daniel Jasper65ee3472013-07-31 23:16:02 +00001765 bool AddLevel = Style.NamespaceIndentation == FormatStyle::NI_All ||
1766 (Style.NamespaceIndentation == FormatStyle::NI_Inner &&
1767 DeclarationScopeStack.size() > 1);
1768 parseBlock(/*MustBeDeclaration=*/true, AddLevel);
Manuel Klimek046b9302013-02-06 16:08:09 +00001769 // Munch the semicolon after a namespace. This is more common than one would
1770 // think. Puttin the semicolon into its own line is very ugly.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001771 if (FormatTok->Tok.is(tok::semi))
Manuel Klimek046b9302013-02-06 16:08:09 +00001772 nextToken();
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001773 addUnwrappedLine();
1774 }
1775 // FIXME: Add error handling.
1776}
1777
Daniel Jasper6acf5132015-03-12 14:44:29 +00001778void UnwrappedLineParser::parseNew() {
1779 assert(FormatTok->is(tok::kw_new) && "'new' expected");
1780 nextToken();
1781 if (Style.Language != FormatStyle::LK_Java)
1782 return;
1783
1784 // In Java, we can parse everything up to the parens, which aren't optional.
1785 do {
1786 // There should not be a ;, { or } before the new's open paren.
1787 if (FormatTok->isOneOf(tok::semi, tok::l_brace, tok::r_brace))
1788 return;
1789
1790 // Consume the parens.
1791 if (FormatTok->is(tok::l_paren)) {
1792 parseParens();
1793
1794 // If there is a class body of an anonymous class, consume that as child.
1795 if (FormatTok->is(tok::l_brace))
1796 parseChildBlock();
1797 return;
1798 }
1799 nextToken();
1800 } while (!eof());
1801}
1802
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001803void UnwrappedLineParser::parseForOrWhileLoop() {
Daniel Jasper66cb8c52015-05-04 09:22:29 +00001804 assert(FormatTok->isOneOf(tok::kw_for, tok::kw_while, TT_ForEachMacro) &&
Daniel Jaspere1e43192014-04-01 12:55:11 +00001805 "'for', 'while' or foreach macro expected");
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001806 nextToken();
Martin Probsta050f412017-05-18 21:19:29 +00001807 // JS' for await ( ...
Martin Probstbd49e322017-05-15 19:33:20 +00001808 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probsta050f412017-05-18 21:19:29 +00001809 FormatTok->is(Keywords.kw_await))
Martin Probstbd49e322017-05-15 19:33:20 +00001810 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001811 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001812 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001813 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001814 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001815 parseBlock(/*MustBeDeclaration=*/false);
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001816 addUnwrappedLine();
1817 } else {
1818 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001819 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001820 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001821 --Line->Level;
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001822 }
1823}
1824
Daniel Jasperf7935112012-12-03 18:12:45 +00001825void UnwrappedLineParser::parseDoWhile() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001826 assert(FormatTok->Tok.is(tok::kw_do) && "'do' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001827 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001828 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001829 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001830 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001831 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001832 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001833 } else {
1834 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001835 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001836 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001837 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001838 }
1839
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001840 // FIXME: Add error handling.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001841 if (!FormatTok->Tok.is(tok::kw_while)) {
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001842 addUnwrappedLine();
1843 return;
1844 }
1845
Daniel Jasperf7935112012-12-03 18:12:45 +00001846 nextToken();
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001847 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +00001848}
1849
1850void UnwrappedLineParser::parseLabel() {
Daniel Jasperf7935112012-12-03 18:12:45 +00001851 nextToken();
Manuel Klimek52b15152013-01-09 15:25:02 +00001852 unsigned OldLineLevel = Line->Level;
Daniel Jaspera1275122013-03-20 10:23:53 +00001853 if (Line->Level > 1 || (!Line->InPPDirective && Line->Level > 0))
Manuel Klimek52b15152013-01-09 15:25:02 +00001854 --Line->Level;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001855 if (CommentsBeforeNextToken.empty() && FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001856 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001857 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001858 if (FormatTok->Tok.is(tok::kw_break)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001859 if (Style.BraceWrapping.AfterControlStatement)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001860 addUnwrappedLine();
1861 parseStructuralElement();
1862 }
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001863 addUnwrappedLine();
1864 } else {
Daniel Jasper1fe0d5c2015-05-06 15:19:47 +00001865 if (FormatTok->is(tok::semi))
1866 nextToken();
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001867 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001868 }
Manuel Klimek52b15152013-01-09 15:25:02 +00001869 Line->Level = OldLineLevel;
Daniel Jasper2cce7b72016-04-06 16:41:39 +00001870 if (FormatTok->isNot(tok::l_brace)) {
Daniel Jasper40609472016-04-06 15:02:46 +00001871 parseStructuralElement();
Daniel Jasper2cce7b72016-04-06 16:41:39 +00001872 addUnwrappedLine();
1873 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001874}
1875
1876void UnwrappedLineParser::parseCaseLabel() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001877 assert(FormatTok->Tok.is(tok::kw_case) && "'case' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001878 // FIXME: fix handling of complex expressions here.
1879 do {
1880 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001881 } while (!eof() && !FormatTok->Tok.is(tok::colon));
Daniel Jasperf7935112012-12-03 18:12:45 +00001882 parseLabel();
1883}
1884
1885void UnwrappedLineParser::parseSwitch() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001886 assert(FormatTok->Tok.is(tok::kw_switch) && "'switch' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001887 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001888 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001889 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001890 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001891 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Daniel Jasper65ee3472013-07-31 23:16:02 +00001892 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001893 addUnwrappedLine();
1894 } else {
1895 addUnwrappedLine();
Daniel Jasper516d7972013-07-25 11:31:57 +00001896 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001897 parseStructuralElement();
Daniel Jasper516d7972013-07-25 11:31:57 +00001898 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001899 }
1900}
1901
1902void UnwrappedLineParser::parseAccessSpecifier() {
1903 nextToken();
Daniel Jasper84c47a12013-11-23 17:53:41 +00001904 // Understand Qt's slots.
Daniel Jasper53395402015-04-07 15:04:40 +00001905 if (FormatTok->isOneOf(Keywords.kw_slots, Keywords.kw_qslots))
Daniel Jasper84c47a12013-11-23 17:53:41 +00001906 nextToken();
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00001907 // Otherwise, we don't know what it is, and we'd better keep the next token.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001908 if (FormatTok->Tok.is(tok::colon))
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00001909 nextToken();
Daniel Jasperf7935112012-12-03 18:12:45 +00001910 addUnwrappedLine();
1911}
1912
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001913bool UnwrappedLineParser::parseEnum() {
Daniel Jasper6be0f552014-11-13 15:56:28 +00001914 // Won't be 'enum' for NS_ENUMs.
1915 if (FormatTok->Tok.is(tok::kw_enum))
Daniel Jasperccb68b42014-11-19 22:38:18 +00001916 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001917
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001918 // In TypeScript, "enum" can also be used as property name, e.g. in interface
1919 // declarations. An "enum" keyword followed by a colon would be a syntax
1920 // error and thus assume it is just an identifier.
Daniel Jasper87379302016-02-03 05:33:44 +00001921 if (Style.Language == FormatStyle::LK_JavaScript &&
1922 FormatTok->isOneOf(tok::colon, tok::question))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001923 return false;
1924
Daniel Jasper2b41a822013-08-20 12:42:50 +00001925 // Eat up enum class ...
Daniel Jasperb05a81d2014-05-09 13:11:16 +00001926 if (FormatTok->Tok.is(tok::kw_class) || FormatTok->Tok.is(tok::kw_struct))
1927 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001928
Daniel Jasper786a5502013-09-06 21:32:35 +00001929 while (FormatTok->Tok.getIdentifierInfo() ||
Daniel Jasperccb68b42014-11-19 22:38:18 +00001930 FormatTok->isOneOf(tok::colon, tok::coloncolon, tok::less,
1931 tok::greater, tok::comma, tok::question)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00001932 nextToken();
1933 // We can have macros or attributes in between 'enum' and the enum name.
Daniel Jasperccb68b42014-11-19 22:38:18 +00001934 if (FormatTok->is(tok::l_paren))
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001935 parseParens();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001936 if (FormatTok->is(tok::identifier)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00001937 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001938 // If there are two identifiers in a row, this is likely an elaborate
1939 // return type. In Java, this can be "implements", etc.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001940 if (Style.isCpp() && FormatTok->is(tok::identifier))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001941 return false;
Daniel Jasperb5a0b852015-06-19 08:17:32 +00001942 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001943 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00001944
1945 // Just a declaration or something is wrong.
Daniel Jasperccb68b42014-11-19 22:38:18 +00001946 if (FormatTok->isNot(tok::l_brace))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001947 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00001948 FormatTok->BlockKind = BK_Block;
1949
1950 if (Style.Language == FormatStyle::LK_Java) {
1951 // Java enums are different.
1952 parseJavaEnumBody();
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001953 return true;
1954 }
1955 if (Style.Language == FormatStyle::LK_Proto) {
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001956 parseBlock(/*MustBeDeclaration=*/true);
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001957 return true;
Manuel Klimek2cec0192013-01-21 19:17:52 +00001958 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00001959
1960 // Parse enum body.
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001961 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001962 bool HasError = !parseBracedList(/*ContinueOnSemicolons=*/true);
1963 if (HasError) {
1964 if (FormatTok->is(tok::semi))
1965 nextToken();
1966 addUnwrappedLine();
1967 }
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001968 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00001969
Daniel Jasper90cf3802015-06-17 09:44:02 +00001970 // There is no addUnwrappedLine() here so that we fall through to parsing a
1971 // structural element afterwards. Thus, in "enum A {} n, m;",
Manuel Klimek2cec0192013-01-21 19:17:52 +00001972 // "} n, m;" will end up in one unwrapped line.
Daniel Jasper6be0f552014-11-13 15:56:28 +00001973}
1974
1975void UnwrappedLineParser::parseJavaEnumBody() {
1976 // Determine whether the enum is simple, i.e. does not have a semicolon or
1977 // constants with class bodies. Simple enums can be formatted like braced
1978 // lists, contracted to a single line, etc.
1979 unsigned StoredPosition = Tokens->getPosition();
1980 bool IsSimple = true;
1981 FormatToken *Tok = Tokens->getNextToken();
1982 while (Tok) {
1983 if (Tok->is(tok::r_brace))
1984 break;
1985 if (Tok->isOneOf(tok::l_brace, tok::semi)) {
1986 IsSimple = false;
1987 break;
1988 }
1989 // FIXME: This will also mark enums with braces in the arguments to enum
1990 // constants as "not simple". This is probably fine in practice, though.
1991 Tok = Tokens->getNextToken();
1992 }
1993 FormatTok = Tokens->setPosition(StoredPosition);
1994
1995 if (IsSimple) {
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001996 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001997 parseBracedList();
Daniel Jasperdf2ff002014-11-02 22:31:39 +00001998 addUnwrappedLine();
Daniel Jasper6be0f552014-11-13 15:56:28 +00001999 return;
2000 }
2001
2002 // Parse the body of a more complex enum.
2003 // First add a line for everything up to the "{".
2004 nextToken();
2005 addUnwrappedLine();
2006 ++Line->Level;
2007
2008 // Parse the enum constants.
2009 while (FormatTok) {
2010 if (FormatTok->is(tok::l_brace)) {
2011 // Parse the constant's class body.
2012 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
2013 /*MunchSemi=*/false);
2014 } else if (FormatTok->is(tok::l_paren)) {
2015 parseParens();
2016 } else if (FormatTok->is(tok::comma)) {
2017 nextToken();
2018 addUnwrappedLine();
2019 } else if (FormatTok->is(tok::semi)) {
2020 nextToken();
2021 addUnwrappedLine();
2022 break;
2023 } else if (FormatTok->is(tok::r_brace)) {
2024 addUnwrappedLine();
2025 break;
2026 } else {
2027 nextToken();
2028 }
2029 }
2030
2031 // Parse the class body after the enum's ";" if any.
2032 parseLevel(/*HasOpeningBrace=*/true);
2033 nextToken();
2034 --Line->Level;
2035 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00002036}
2037
Martin Probst1027fb82017-02-07 14:05:30 +00002038void UnwrappedLineParser::parseRecord(bool ParseAsExpr) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00002039 const FormatToken &InitialToken = *FormatTok;
Manuel Klimek28cacc72013-01-07 18:10:23 +00002040 nextToken();
Daniel Jasper04785d02015-05-06 14:03:02 +00002041
Daniel Jasper04785d02015-05-06 14:03:02 +00002042 // The actual identifier can be a nested name specifier, and in macros
2043 // it is often token-pasted.
2044 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon, tok::hashhash,
2045 tok::kw___attribute, tok::kw___declspec,
2046 tok::kw_alignas) ||
2047 ((Style.Language == FormatStyle::LK_Java ||
2048 Style.Language == FormatStyle::LK_JavaScript) &&
2049 FormatTok->isOneOf(tok::period, tok::comma))) {
Martin Probstcb870c52017-08-01 15:46:10 +00002050 if (Style.Language == FormatStyle::LK_JavaScript &&
2051 FormatTok->isOneOf(Keywords.kw_extends, Keywords.kw_implements)) {
2052 // JavaScript/TypeScript supports inline object types in
2053 // extends/implements positions:
2054 // class Foo implements {bar: number} { }
2055 nextToken();
2056 if (FormatTok->is(tok::l_brace)) {
2057 tryToParseBracedList();
2058 continue;
2059 }
2060 }
Daniel Jasper04785d02015-05-06 14:03:02 +00002061 bool IsNonMacroIdentifier =
2062 FormatTok->is(tok::identifier) &&
2063 FormatTok->TokenText != FormatTok->TokenText.upper();
Manuel Klimeke01bab52013-01-15 13:38:33 +00002064 nextToken();
2065 // We can have macros or attributes in between 'class' and the class name.
Daniel Jasper04785d02015-05-06 14:03:02 +00002066 if (!IsNonMacroIdentifier && FormatTok->Tok.is(tok::l_paren))
Manuel Klimeke01bab52013-01-15 13:38:33 +00002067 parseParens();
Daniel Jasper04785d02015-05-06 14:03:02 +00002068 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00002069
Daniel Jasper04785d02015-05-06 14:03:02 +00002070 // Note that parsing away template declarations here leads to incorrectly
2071 // accepting function declarations as record declarations.
2072 // In general, we cannot solve this problem. Consider:
2073 // class A<int> B() {}
2074 // which can be a function definition or a class definition when B() is a
2075 // macro. If we find enough real-world cases where this is a problem, we
2076 // can parse for the 'template' keyword in the beginning of the statement,
2077 // and thus rule out the record production in case there is no template
2078 // (this would still leave us with an ambiguity between template function
2079 // and class declarations).
Daniel Jasperadba2aa2015-05-18 12:52:00 +00002080 if (FormatTok->isOneOf(tok::colon, tok::less)) {
2081 while (!eof()) {
Daniel Jasper3c883d12015-05-18 14:49:19 +00002082 if (FormatTok->is(tok::l_brace)) {
2083 calculateBraceTypes(/*ExpectClassBody=*/true);
2084 if (!tryToParseBracedList())
2085 break;
2086 }
Daniel Jasper04785d02015-05-06 14:03:02 +00002087 if (FormatTok->Tok.is(tok::semi))
2088 return;
2089 nextToken();
Manuel Klimeke01bab52013-01-15 13:38:33 +00002090 }
2091 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002092 if (FormatTok->Tok.is(tok::l_brace)) {
Martin Probst1027fb82017-02-07 14:05:30 +00002093 if (ParseAsExpr) {
2094 parseChildBlock();
2095 } else {
2096 if (ShouldBreakBeforeBrace(Style, InitialToken))
2097 addUnwrappedLine();
Manuel Klimeka8eb9142013-05-13 12:51:40 +00002098
Martin Probst1027fb82017-02-07 14:05:30 +00002099 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
2100 /*MunchSemi=*/false);
2101 }
Manuel Klimeka8eb9142013-05-13 12:51:40 +00002102 }
Daniel Jasper90cf3802015-06-17 09:44:02 +00002103 // There is no addUnwrappedLine() here so that we fall through to parsing a
2104 // structural element afterwards. Thus, in "class A {} n, m;",
2105 // "} n, m;" will end up in one unwrapped line.
Manuel Klimek28cacc72013-01-07 18:10:23 +00002106}
2107
Nico Weber8696a8d2013-01-09 21:15:03 +00002108void UnwrappedLineParser::parseObjCProtocolList() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002109 assert(FormatTok->Tok.is(tok::less) && "'<' expected.");
Nico Weber8696a8d2013-01-09 21:15:03 +00002110 do
2111 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002112 while (!eof() && FormatTok->Tok.isNot(tok::greater));
Nico Weber8696a8d2013-01-09 21:15:03 +00002113 nextToken(); // Skip '>'.
2114}
2115
2116void UnwrappedLineParser::parseObjCUntilAtEnd() {
2117 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002118 if (FormatTok->Tok.isObjCAtKeyword(tok::objc_end)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00002119 nextToken();
2120 addUnwrappedLine();
2121 break;
2122 }
Daniel Jaspera15da302013-08-28 08:04:23 +00002123 if (FormatTok->is(tok::l_brace)) {
2124 parseBlock(/*MustBeDeclaration=*/false);
2125 // In ObjC interfaces, nothing should be following the "}".
2126 addUnwrappedLine();
Benjamin Kramere21cb742014-01-08 15:59:42 +00002127 } else if (FormatTok->is(tok::r_brace)) {
2128 // Ignore stray "}". parseStructuralElement doesn't consume them.
2129 nextToken();
2130 addUnwrappedLine();
Daniel Jaspera15da302013-08-28 08:04:23 +00002131 } else {
2132 parseStructuralElement();
2133 }
Nico Weber8696a8d2013-01-09 21:15:03 +00002134 } while (!eof());
2135}
2136
Nico Weber2ce0ac52013-01-09 23:25:37 +00002137void UnwrappedLineParser::parseObjCInterfaceOrImplementation() {
Nico Weber7eecf4b2013-01-09 20:25:35 +00002138 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002139 nextToken(); // interface name
Nico Weber7eecf4b2013-01-09 20:25:35 +00002140
2141 // @interface can be followed by either a base class, or a category.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002142 if (FormatTok->Tok.is(tok::colon)) {
Nico Weber7eecf4b2013-01-09 20:25:35 +00002143 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002144 nextToken(); // base class name
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002145 } else if (FormatTok->Tok.is(tok::l_paren))
Nico Weber7eecf4b2013-01-09 20:25:35 +00002146 // Skip category, if present.
2147 parseParens();
2148
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002149 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002150 parseObjCProtocolList();
Nico Weber7eecf4b2013-01-09 20:25:35 +00002151
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002152 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00002153 if (Style.BraceWrapping.AfterObjCDeclaration)
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002154 addUnwrappedLine();
Nico Weber9096fc02013-06-26 00:30:14 +00002155 parseBlock(/*MustBeDeclaration=*/true);
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002156 }
Nico Weber7eecf4b2013-01-09 20:25:35 +00002157
2158 // With instance variables, this puts '}' on its own line. Without instance
2159 // variables, this ends the @interface line.
2160 addUnwrappedLine();
2161
Nico Weber8696a8d2013-01-09 21:15:03 +00002162 parseObjCUntilAtEnd();
2163}
Nico Weber7eecf4b2013-01-09 20:25:35 +00002164
Nico Weber8696a8d2013-01-09 21:15:03 +00002165void UnwrappedLineParser::parseObjCProtocol() {
2166 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002167 nextToken(); // protocol name
Nico Weber8696a8d2013-01-09 21:15:03 +00002168
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002169 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002170 parseObjCProtocolList();
2171
2172 // Check for protocol declaration.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002173 if (FormatTok->Tok.is(tok::semi)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00002174 nextToken();
2175 return addUnwrappedLine();
2176 }
2177
2178 addUnwrappedLine();
2179 parseObjCUntilAtEnd();
Nico Weber7eecf4b2013-01-09 20:25:35 +00002180}
2181
Daniel Jasperfca735c2015-02-19 16:14:18 +00002182void UnwrappedLineParser::parseJavaScriptEs6ImportExport() {
Martin Probst053f1aa2016-04-19 14:55:37 +00002183 bool IsImport = FormatTok->is(Keywords.kw_import);
2184 assert(IsImport || FormatTok->is(tok::kw_export));
Daniel Jasper354aa512015-02-19 16:07:32 +00002185 nextToken();
Daniel Jasperfca735c2015-02-19 16:14:18 +00002186
Daniel Jasperec05fc72015-05-11 09:14:50 +00002187 // Consume the "default" in "export default class/function".
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002188 if (FormatTok->is(tok::kw_default))
2189 nextToken();
Daniel Jasperec05fc72015-05-11 09:14:50 +00002190
Martin Probst5f8445b2016-04-24 22:05:09 +00002191 // Consume "async function", "function" and "default function", so that these
2192 // get parsed as free-standing JS functions, i.e. do not require a trailing
2193 // semicolon.
2194 if (FormatTok->is(Keywords.kw_async))
2195 nextToken();
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002196 if (FormatTok->is(Keywords.kw_function)) {
2197 nextToken();
2198 return;
2199 }
2200
Martin Probst053f1aa2016-04-19 14:55:37 +00002201 // For imports, `export *`, `export {...}`, consume the rest of the line up
2202 // to the terminating `;`. For everything else, just return and continue
2203 // parsing the structural element, i.e. the declaration or expression for
2204 // `export default`.
2205 if (!IsImport && !FormatTok->isOneOf(tok::l_brace, tok::star) &&
2206 !FormatTok->isStringLiteral())
2207 return;
Daniel Jasperfca735c2015-02-19 16:14:18 +00002208
Martin Probstd40bca42017-01-09 08:56:36 +00002209 while (!eof()) {
2210 if (FormatTok->is(tok::semi))
2211 return;
2212 if (Line->Tokens.size() == 0) {
2213 // Common issue: Automatic Semicolon Insertion wrapped the line, so the
2214 // import statement should terminate.
2215 return;
2216 }
Daniel Jasperefc1a832016-01-07 08:53:35 +00002217 if (FormatTok->is(tok::l_brace)) {
2218 FormatTok->BlockKind = BK_Block;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00002219 nextToken();
Daniel Jasperefc1a832016-01-07 08:53:35 +00002220 parseBracedList();
2221 } else {
2222 nextToken();
2223 }
Daniel Jasper354aa512015-02-19 16:07:32 +00002224 }
2225}
2226
Daniel Jasper3b203a62013-09-05 16:05:56 +00002227LLVM_ATTRIBUTE_UNUSED static void printDebugInfo(const UnwrappedLine &Line,
2228 StringRef Prefix = "") {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002229 llvm::dbgs() << Prefix << "Line(" << Line.Level << ")"
2230 << (Line.InPPDirective ? " MACRO" : "") << ": ";
2231 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2232 E = Line.Tokens.end();
2233 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002234 llvm::dbgs() << I->Tok->Tok.getName() << "["
2235 << "T=" << I->Tok->Type
2236 << ", OC=" << I->Tok->OriginalColumn << "] ";
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002237 }
2238 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2239 E = Line.Tokens.end();
2240 I != E; ++I) {
2241 const UnwrappedLineNode &Node = *I;
2242 for (SmallVectorImpl<UnwrappedLine>::const_iterator
2243 I = Node.Children.begin(),
2244 E = Node.Children.end();
2245 I != E; ++I) {
2246 printDebugInfo(*I, "\nChild: ");
2247 }
2248 }
2249 llvm::dbgs() << "\n";
2250}
2251
Daniel Jasperf7935112012-12-03 18:12:45 +00002252void UnwrappedLineParser::addUnwrappedLine() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002253 if (Line->Tokens.empty())
Daniel Jasper7c85fde2013-01-08 14:56:18 +00002254 return;
Manuel Klimekab3dc002013-01-16 12:31:12 +00002255 DEBUG({
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002256 if (CurrentLines == &Lines)
2257 printDebugInfo(*Line);
Manuel Klimekab3dc002013-01-16 12:31:12 +00002258 });
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002259 CurrentLines->push_back(std::move(*Line));
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002260 Line->Tokens.clear();
Krasimir Georgiev85c37042017-03-01 16:38:08 +00002261 Line->MatchingOpeningBlockLineIndex = UnwrappedLine::kInvalidIndex;
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002262 if (CurrentLines == &Lines && !PreprocessorDirectives.empty()) {
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002263 CurrentLines->append(
2264 std::make_move_iterator(PreprocessorDirectives.begin()),
2265 std::make_move_iterator(PreprocessorDirectives.end()));
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002266 PreprocessorDirectives.clear();
2267 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002268}
2269
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002270bool UnwrappedLineParser::eof() const { return FormatTok->Tok.is(tok::eof); }
Daniel Jasperf7935112012-12-03 18:12:45 +00002271
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002272bool UnwrappedLineParser::isOnNewLine(const FormatToken &FormatTok) {
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002273 return (Line->InPPDirective || FormatTok.HasUnescapedNewline) &&
2274 FormatTok.NewlinesBefore > 0;
2275}
2276
Krasimir Georgiev91834222017-01-25 13:58:58 +00002277// Checks if \p FormatTok is a line comment that continues the line comment
2278// section on \p Line.
Krasimir Georgievea222a72017-05-22 10:07:56 +00002279static bool continuesLineCommentSection(const FormatToken &FormatTok,
2280 const UnwrappedLine &Line,
2281 llvm::Regex &CommentPragmasRegex) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002282 if (Line.Tokens.empty())
2283 return false;
Krasimir Georgiev84321612017-01-30 19:18:55 +00002284
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002285 StringRef IndentContent = FormatTok.TokenText;
2286 if (FormatTok.TokenText.startswith("//") ||
2287 FormatTok.TokenText.startswith("/*"))
2288 IndentContent = FormatTok.TokenText.substr(2);
2289 if (CommentPragmasRegex.match(IndentContent))
2290 return false;
2291
Krasimir Georgiev91834222017-01-25 13:58:58 +00002292 // If Line starts with a line comment, then FormatTok continues the comment
Krasimir Georgiev84321612017-01-30 19:18:55 +00002293 // section if its original column is greater or equal to the original start
Krasimir Georgiev91834222017-01-25 13:58:58 +00002294 // column of the line.
2295 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002296 // Define the min column token of a line as follows: if a line ends in '{' or
2297 // contains a '{' followed by a line comment, then the min column token is
2298 // that '{'. Otherwise, the min column token of the line is the first token of
2299 // the line.
2300 //
2301 // If Line starts with a token other than a line comment, then FormatTok
2302 // continues the comment section if its original column is greater than the
2303 // original start column of the min column token of the line.
Krasimir Georgiev91834222017-01-25 13:58:58 +00002304 //
2305 // For example, the second line comment continues the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002306 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002307 // // first line
2308 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002309 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002310 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002311 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002312 // // first line
2313 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002314 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002315 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002316 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002317 // int i; // first line
2318 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002319 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002320 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002321 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002322 // do { // first line
2323 // // second line
2324 // int i;
2325 // } while (true);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002326 //
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002327 // and:
2328 //
2329 // enum {
2330 // a, // first line
2331 // // second line
2332 // b
2333 // };
2334 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002335 // The second line comment doesn't continue the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002336 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002337 // // first line
2338 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002339 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002340 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002341 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002342 // int i; // first line
2343 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002344 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002345 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002346 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002347 // do { // first line
2348 // // second line
2349 // int i;
2350 // } while (true);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002351 //
2352 // and:
2353 //
2354 // enum {
2355 // a, // first line
2356 // // second line
2357 // };
Krasimir Georgiev84321612017-01-30 19:18:55 +00002358 const FormatToken *MinColumnToken = Line.Tokens.front().Tok;
2359
2360 // Scan for '{//'. If found, use the column of '{' as a min column for line
2361 // comment section continuation.
2362 const FormatToken *PreviousToken = nullptr;
Krasimir Georgievd86c25d2017-03-10 13:09:29 +00002363 for (const UnwrappedLineNode &Node : Line.Tokens) {
Krasimir Georgiev84321612017-01-30 19:18:55 +00002364 if (PreviousToken && PreviousToken->is(tok::l_brace) &&
2365 isLineComment(*Node.Tok)) {
2366 MinColumnToken = PreviousToken;
2367 break;
2368 }
2369 PreviousToken = Node.Tok;
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002370
2371 // Grab the last newline preceding a token in this unwrapped line.
2372 if (Node.Tok->NewlinesBefore > 0) {
2373 MinColumnToken = Node.Tok;
2374 }
Krasimir Georgiev84321612017-01-30 19:18:55 +00002375 }
2376 if (PreviousToken && PreviousToken->is(tok::l_brace)) {
2377 MinColumnToken = PreviousToken;
2378 }
2379
Krasimir Georgievea222a72017-05-22 10:07:56 +00002380 return continuesLineComment(FormatTok, /*Previous=*/Line.Tokens.back().Tok,
2381 MinColumnToken);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002382}
2383
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002384void UnwrappedLineParser::flushComments(bool NewlineBeforeNext) {
2385 bool JustComments = Line->Tokens.empty();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002386 for (SmallVectorImpl<FormatToken *>::const_iterator
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002387 I = CommentsBeforeNextToken.begin(),
2388 E = CommentsBeforeNextToken.end();
2389 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002390 // Line comments that belong to the same line comment section are put on the
2391 // same line since later we might want to reflow content between them.
Krasimir Georgiev753625b2017-01-31 13:32:38 +00002392 // Additional fine-grained breaking of line comment sections is controlled
2393 // by the class BreakableLineCommentSection in case it is desirable to keep
2394 // several line comment sections in the same unwrapped line.
2395 //
2396 // FIXME: Consider putting separate line comment sections as children to the
2397 // unwrapped line instead.
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002398 (*I)->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002399 continuesLineCommentSection(**I, *Line, CommentPragmasRegex);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002400 if (isOnNewLine(**I) && JustComments && !(*I)->ContinuesLineCommentSection)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002401 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002402 pushToken(*I);
2403 }
Daniel Jaspere60cba12015-05-13 11:35:53 +00002404 if (NewlineBeforeNext && JustComments)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002405 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002406 CommentsBeforeNextToken.clear();
2407}
2408
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002409void UnwrappedLineParser::nextToken(int LevelDifference) {
Daniel Jasperf7935112012-12-03 18:12:45 +00002410 if (eof())
2411 return;
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002412 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002413 pushToken(FormatTok);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00002414 if (Style.Language != FormatStyle::LK_JavaScript)
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002415 readToken(LevelDifference);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00002416 else
2417 readTokenWithJavaScriptASI();
Manuel Klimek1abf7892013-01-04 23:34:14 +00002418}
2419
Daniel Jasperb9a49902016-01-09 15:56:28 +00002420const FormatToken *UnwrappedLineParser::getPreviousToken() {
2421 // FIXME: This is a dirty way to access the previous token. Find a better
2422 // solution.
2423 if (!Line || Line->Tokens.empty())
2424 return nullptr;
2425 return Line->Tokens.back().Tok;
2426}
2427
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002428void UnwrappedLineParser::distributeComments(
2429 const SmallVectorImpl<FormatToken *> &Comments,
2430 const FormatToken *NextTok) {
2431 // Whether or not a line comment token continues a line is controlled by
Krasimir Georgievea222a72017-05-22 10:07:56 +00002432 // the method continuesLineCommentSection, with the following caveat:
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002433 //
2434 // Define a trail of Comments to be a nonempty proper postfix of Comments such
2435 // that each comment line from the trail is aligned with the next token, if
2436 // the next token exists. If a trail exists, the beginning of the maximal
2437 // trail is marked as a start of a new comment section.
2438 //
2439 // For example in this code:
2440 //
2441 // int a; // line about a
2442 // // line 1 about b
2443 // // line 2 about b
2444 // int b;
2445 //
2446 // the two lines about b form a maximal trail, so there are two sections, the
2447 // first one consisting of the single comment "// line about a" and the
2448 // second one consisting of the next two comments.
2449 if (Comments.empty())
2450 return;
2451 bool ShouldPushCommentsInCurrentLine = true;
2452 bool HasTrailAlignedWithNextToken = false;
2453 unsigned StartOfTrailAlignedWithNextToken = 0;
2454 if (NextTok) {
2455 // We are skipping the first element intentionally.
2456 for (unsigned i = Comments.size() - 1; i > 0; --i) {
2457 if (Comments[i]->OriginalColumn == NextTok->OriginalColumn) {
2458 HasTrailAlignedWithNextToken = true;
2459 StartOfTrailAlignedWithNextToken = i;
2460 }
2461 }
2462 }
2463 for (unsigned i = 0, e = Comments.size(); i < e; ++i) {
2464 FormatToken *FormatTok = Comments[i];
2465 if (HasTrailAlignedWithNextToken &&
2466 i == StartOfTrailAlignedWithNextToken) {
2467 FormatTok->ContinuesLineCommentSection = false;
2468 } else {
2469 FormatTok->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002470 continuesLineCommentSection(*FormatTok, *Line, CommentPragmasRegex);
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002471 }
2472 if (!FormatTok->ContinuesLineCommentSection &&
2473 (isOnNewLine(*FormatTok) || FormatTok->IsFirst)) {
2474 ShouldPushCommentsInCurrentLine = false;
2475 }
2476 if (ShouldPushCommentsInCurrentLine) {
2477 pushToken(FormatTok);
2478 } else {
2479 CommentsBeforeNextToken.push_back(FormatTok);
2480 }
2481 }
2482}
2483
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002484void UnwrappedLineParser::readToken(int LevelDifference) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002485 SmallVector<FormatToken *, 1> Comments;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002486 do {
2487 FormatTok = Tokens->getNextToken();
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00002488 assert(FormatTok);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002489 while (!Line->InPPDirective && FormatTok->Tok.is(tok::hash) &&
2490 (FormatTok->HasUnescapedNewline || FormatTok->IsFirst)) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002491 distributeComments(Comments, FormatTok);
2492 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002493 // If there is an unfinished unwrapped line, we flush the preprocessor
2494 // directives only after that unwrapped line was finished later.
Daniel Jasper29d39d52015-02-08 09:34:49 +00002495 bool SwitchToPreprocessorLines = !Line->Tokens.empty();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002496 ScopedLineState BlockState(*this, SwitchToPreprocessorLines);
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002497 assert((LevelDifference >= 0 ||
2498 static_cast<unsigned>(-LevelDifference) <= Line->Level) &&
2499 "LevelDifference makes Line->Level negative");
2500 Line->Level += LevelDifference;
Alexander Kornienkob1be9d62013-04-03 12:38:53 +00002501 // Comments stored before the preprocessor directive need to be output
2502 // before the preprocessor directive, at the same level as the
2503 // preprocessor directive, as we consider them to apply to the directive.
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002504 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002505 parsePPDirective();
2506 }
Manuel Klimek68b03042014-04-14 09:14:11 +00002507 while (FormatTok->Type == TT_ConflictStart ||
2508 FormatTok->Type == TT_ConflictEnd ||
2509 FormatTok->Type == TT_ConflictAlternative) {
2510 if (FormatTok->Type == TT_ConflictStart) {
2511 conditionalCompilationStart(/*Unreachable=*/false);
2512 } else if (FormatTok->Type == TT_ConflictAlternative) {
2513 conditionalCompilationAlternative();
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002514 } else if (FormatTok->Type == TT_ConflictEnd) {
Manuel Klimek68b03042014-04-14 09:14:11 +00002515 conditionalCompilationEnd();
2516 }
2517 FormatTok = Tokens->getNextToken();
2518 FormatTok->MustBreakBefore = true;
2519 }
Alexander Kornienkof2e02122013-05-24 18:24:24 +00002520
Francois Ferranda98a95c2017-07-28 07:56:14 +00002521 if (!PPStack.empty() && (PPStack.back().Kind == PP_Unreachable) &&
Alexander Kornienkof2e02122013-05-24 18:24:24 +00002522 !Line->InPPDirective) {
2523 continue;
2524 }
2525
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002526 if (!FormatTok->Tok.is(tok::comment)) {
2527 distributeComments(Comments, FormatTok);
2528 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002529 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002530 }
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002531
2532 Comments.push_back(FormatTok);
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002533 } while (!eof());
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002534
2535 distributeComments(Comments, nullptr);
2536 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002537}
2538
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002539void UnwrappedLineParser::pushToken(FormatToken *Tok) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002540 Line->Tokens.push_back(UnwrappedLineNode(Tok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002541 if (MustBreakBeforeNextToken) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002542 Line->Tokens.back().Tok->MustBreakBefore = true;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002543 MustBreakBeforeNextToken = false;
Manuel Klimek1abf7892013-01-04 23:34:14 +00002544 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002545}
2546
Daniel Jasper8d1832e2013-01-07 13:26:07 +00002547} // end namespace format
2548} // end namespace clang