blob: bbe05602f6da29af30ba61d472278a1942718d15 [file] [log] [blame]
//===--- UnwrappedLineParser.cpp - Format C++ code ------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// \file
/// This file contains the implementation of the UnwrappedLineParser,
/// which turns a stream of tokens into UnwrappedLines.
///
//===----------------------------------------------------------------------===//
14
Chandler Carruth4b417452013-01-19 08:09:44 +000015#include "UnwrappedLineParser.h"
Benjamin Kramer33335df2015-03-01 21:36:40 +000016#include "llvm/ADT/STLExtras.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000017#include "llvm/Support/Debug.h"
Benjamin Kramer53f5e892015-03-23 18:05:43 +000018#include "llvm/Support/raw_ostream.h"
Manuel Klimekab3dc002013-01-16 12:31:12 +000019
Martin Probst7e0f25b2017-11-25 09:19:42 +000020#include <algorithm>
21
Chandler Carruth10346662014-04-22 03:17:02 +000022#define DEBUG_TYPE "format-parser"
23
Daniel Jasperf7935112012-12-03 18:12:45 +000024namespace clang {
25namespace format {
26
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000027class FormatTokenSource {
28public:
Angel Garcia Gomez637d1e62015-10-20 13:23:58 +000029 virtual ~FormatTokenSource() {}
Manuel Klimek15dfe7a2013-05-28 11:55:06 +000030 virtual FormatToken *getNextToken() = 0;
31
32 virtual unsigned getPosition() = 0;
33 virtual FormatToken *setPosition(unsigned Position) = 0;
34};
35
Craig Topper69665e12013-07-01 04:21:54 +000036namespace {
37
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000038class ScopedDeclarationState {
39public:
40 ScopedDeclarationState(UnwrappedLine &Line, std::vector<bool> &Stack,
41 bool MustBeDeclaration)
42 : Line(Line), Stack(Stack) {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000043 Line.MustBeDeclaration = MustBeDeclaration;
Manuel Klimek39080572013-01-23 11:03:04 +000044 Stack.push_back(MustBeDeclaration);
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000045 }
46 ~ScopedDeclarationState() {
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000047 Stack.pop_back();
Manuel Klimekc1237a82013-01-23 14:08:21 +000048 if (!Stack.empty())
49 Line.MustBeDeclaration = Stack.back();
50 else
51 Line.MustBeDeclaration = true;
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000052 }
Daniel Jasper393564f2013-05-31 14:56:29 +000053
Manuel Klimek0a3a3c92013-01-23 09:32:48 +000054private:
55 UnwrappedLine &Line;
56 std::vector<bool> &Stack;
57};
58
Krasimir Georgieva1c30932017-05-19 10:34:57 +000059static bool isLineComment(const FormatToken &FormatTok) {
Krasimir Georgiev410ed242017-11-10 12:50:09 +000060 return FormatTok.is(tok::comment) && !FormatTok.TokenText.startswith("/*");
Krasimir Georgieva1c30932017-05-19 10:34:57 +000061}
62
Krasimir Georgievea222a72017-05-22 10:07:56 +000063// Checks if \p FormatTok is a line comment that continues the line comment
64// \p Previous. The original column of \p MinColumnToken is used to determine
65// whether \p FormatTok is indented enough to the right to continue \p Previous.
66static bool continuesLineComment(const FormatToken &FormatTok,
67 const FormatToken *Previous,
68 const FormatToken *MinColumnToken) {
69 if (!Previous || !MinColumnToken)
70 return false;
71 unsigned MinContinueColumn =
72 MinColumnToken->OriginalColumn + (isLineComment(*MinColumnToken) ? 0 : 1);
73 return isLineComment(FormatTok) && FormatTok.NewlinesBefore == 1 &&
74 isLineComment(*Previous) &&
75 FormatTok.OriginalColumn >= MinContinueColumn;
76}
77
Manuel Klimek1abf7892013-01-04 23:34:14 +000078class ScopedMacroState : public FormatTokenSource {
79public:
80 ScopedMacroState(UnwrappedLine &Line, FormatTokenSource *&TokenSource,
Manuel Klimek20e0af62015-05-06 11:56:29 +000081 FormatToken *&ResetToken)
Manuel Klimek1abf7892013-01-04 23:34:14 +000082 : Line(Line), TokenSource(TokenSource), ResetToken(ResetToken),
Manuel Klimek1a18c402013-04-12 14:13:36 +000083 PreviousLineLevel(Line.Level), PreviousTokenSource(TokenSource),
Krasimir Georgieva1c30932017-05-19 10:34:57 +000084 Token(nullptr), PreviousToken(nullptr) {
David L. Jones5de22722018-06-15 06:08:54 +000085 FakeEOF.Tok.startToken();
86 FakeEOF.Tok.setKind(tok::eof);
Manuel Klimek1abf7892013-01-04 23:34:14 +000087 TokenSource = this;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000088 Line.Level = 0;
Manuel Klimek1abf7892013-01-04 23:34:14 +000089 Line.InPPDirective = true;
90 }
91
Alexander Kornienko34eb2072015-04-11 02:00:23 +000092 ~ScopedMacroState() override {
Manuel Klimek1abf7892013-01-04 23:34:14 +000093 TokenSource = PreviousTokenSource;
94 ResetToken = Token;
95 Line.InPPDirective = false;
Manuel Klimekef2cfb12013-01-05 22:14:16 +000096 Line.Level = PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +000097 }
98
Craig Topperfb6b25b2014-03-15 04:29:04 +000099 FormatToken *getNextToken() override {
Manuel Klimek78725712013-01-07 10:03:37 +0000100 // The \c UnwrappedLineParser guards against this by never calling
101 // \c getNextToken() after it has encountered the first eof token.
102 assert(!eof());
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000103 PreviousToken = Token;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000104 Token = PreviousTokenSource->getNextToken();
105 if (eof())
David L. Jones5de22722018-06-15 06:08:54 +0000106 return &FakeEOF;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000107 return Token;
108 }
109
Craig Topperfb6b25b2014-03-15 04:29:04 +0000110 unsigned getPosition() override { return PreviousTokenSource->getPosition(); }
Manuel Klimekab419912013-05-23 09:41:43 +0000111
Craig Topperfb6b25b2014-03-15 04:29:04 +0000112 FormatToken *setPosition(unsigned Position) override {
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000113 PreviousToken = nullptr;
Manuel Klimekab419912013-05-23 09:41:43 +0000114 Token = PreviousTokenSource->setPosition(Position);
115 return Token;
116 }
117
Manuel Klimek1abf7892013-01-04 23:34:14 +0000118private:
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000119 bool eof() {
120 return Token && Token->HasUnescapedNewline &&
Krasimir Georgievea222a72017-05-22 10:07:56 +0000121 !continuesLineComment(*Token, PreviousToken,
122 /*MinColumnToken=*/PreviousToken);
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000123 }
Manuel Klimek1abf7892013-01-04 23:34:14 +0000124
David L. Jones5de22722018-06-15 06:08:54 +0000125 FormatToken FakeEOF;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000126 UnwrappedLine &Line;
127 FormatTokenSource *&TokenSource;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000128 FormatToken *&ResetToken;
Manuel Klimekef2cfb12013-01-05 22:14:16 +0000129 unsigned PreviousLineLevel;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000130 FormatTokenSource *PreviousTokenSource;
131
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000132 FormatToken *Token;
Krasimir Georgieva1c30932017-05-19 10:34:57 +0000133 FormatToken *PreviousToken;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000134};
135
Craig Topper69665e12013-07-01 04:21:54 +0000136} // end anonymous namespace
137
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000138class ScopedLineState {
139public:
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000140 ScopedLineState(UnwrappedLineParser &Parser,
141 bool SwitchToPreprocessorLines = false)
David Blaikieefb6eb22014-08-09 20:02:07 +0000142 : Parser(Parser), OriginalLines(Parser.CurrentLines) {
Manuel Klimekd3b92fa2013-01-18 14:04:34 +0000143 if (SwitchToPreprocessorLines)
144 Parser.CurrentLines = &Parser.PreprocessorDirectives;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000145 else if (!Parser.Line->Tokens.empty())
146 Parser.CurrentLines = &Parser.Line->Tokens.back().Children;
David Blaikieefb6eb22014-08-09 20:02:07 +0000147 PreBlockLine = std::move(Parser.Line);
Jonas Devlieghere2b3d49b2019-08-14 23:04:18 +0000148 Parser.Line = std::make_unique<UnwrappedLine>();
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000149 Parser.Line->Level = PreBlockLine->Level;
150 Parser.Line->InPPDirective = PreBlockLine->InPPDirective;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000151 }
152
153 ~ScopedLineState() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000154 if (!Parser.Line->Tokens.empty()) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000155 Parser.addUnwrappedLine();
156 }
Daniel Jasperdaffc0d2013-01-16 09:10:19 +0000157 assert(Parser.Line->Tokens.empty());
David Blaikieefb6eb22014-08-09 20:02:07 +0000158 Parser.Line = std::move(PreBlockLine);
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000159 if (Parser.CurrentLines == &Parser.PreprocessorDirectives)
160 Parser.MustBreakBeforeNextToken = true;
161 Parser.CurrentLines = OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000162 }
163
164private:
165 UnwrappedLineParser &Parser;
166
David Blaikieefb6eb22014-08-09 20:02:07 +0000167 std::unique_ptr<UnwrappedLine> PreBlockLine;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +0000168 SmallVectorImpl<UnwrappedLine> *OriginalLines;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000169};
170
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000171class CompoundStatementIndenter {
172public:
173 CompoundStatementIndenter(UnwrappedLineParser *Parser,
174 const FormatStyle &Style, unsigned &LineLevel)
Owen Pan806d5742019-04-08 23:36:25 +0000175 : CompoundStatementIndenter(Parser, LineLevel,
176 Style.BraceWrapping.AfterControlStatement,
Nico Weberff9f4b52019-07-29 13:26:48 +0000177 Style.BraceWrapping.IndentBraces) {}
Owen Pan806d5742019-04-08 23:36:25 +0000178 CompoundStatementIndenter(UnwrappedLineParser *Parser, unsigned &LineLevel,
179 bool WrapBrace, bool IndentBrace)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000180 : LineLevel(LineLevel), OldLineLevel(LineLevel) {
Owen Pan806d5742019-04-08 23:36:25 +0000181 if (WrapBrace)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000182 Parser->addUnwrappedLine();
Owen Pan806d5742019-04-08 23:36:25 +0000183 if (IndentBrace)
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000184 ++LineLevel;
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000185 }
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000186 ~CompoundStatementIndenter() { LineLevel = OldLineLevel; }
Alexander Kornienko3a33f022013-12-12 09:49:52 +0000187
188private:
189 unsigned &LineLevel;
190 unsigned OldLineLevel;
191};
192
Craig Topper69665e12013-07-01 04:21:54 +0000193namespace {
194
Manuel Klimekab419912013-05-23 09:41:43 +0000195class IndexedTokenSource : public FormatTokenSource {
196public:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000197 IndexedTokenSource(ArrayRef<FormatToken *> Tokens)
Manuel Klimekab419912013-05-23 09:41:43 +0000198 : Tokens(Tokens), Position(-1) {}
199
Craig Topperfb6b25b2014-03-15 04:29:04 +0000200 FormatToken *getNextToken() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000201 ++Position;
202 return Tokens[Position];
203 }
204
Craig Topperfb6b25b2014-03-15 04:29:04 +0000205 unsigned getPosition() override {
Manuel Klimekab419912013-05-23 09:41:43 +0000206 assert(Position >= 0);
207 return Position;
208 }
209
Craig Topperfb6b25b2014-03-15 04:29:04 +0000210 FormatToken *setPosition(unsigned P) override {
Manuel Klimekab419912013-05-23 09:41:43 +0000211 Position = P;
212 return Tokens[Position];
213 }
214
Manuel Klimek71814b42013-10-11 21:25:45 +0000215 void reset() { Position = -1; }
216
Manuel Klimekab419912013-05-23 09:41:43 +0000217private:
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000218 ArrayRef<FormatToken *> Tokens;
Manuel Klimekab419912013-05-23 09:41:43 +0000219 int Position;
220};
221
Craig Topper69665e12013-07-01 04:21:54 +0000222} // end anonymous namespace
223
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000224UnwrappedLineParser::UnwrappedLineParser(const FormatStyle &Style,
Daniel Jasperd0ec0d62014-11-04 12:41:02 +0000225 const AdditionalKeywords &Keywords,
Krasimir Georgiev9ad83fe2017-10-30 14:01:50 +0000226 unsigned FirstStartColumn,
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000227 ArrayRef<FormatToken *> Tokens,
Daniel Jasperd2ae41a2013-05-15 08:14:19 +0000228 UnwrappedLineConsumer &Callback)
Daniel Jasperb05a81d2014-05-09 13:11:16 +0000229 : Line(new UnwrappedLine), MustBreakBeforeNextToken(false),
Krasimir Georgiev00c5c722017-02-02 15:32:19 +0000230 CurrentLines(&Lines), Style(Style), Keywords(Keywords),
231 CommentPragmasRegex(Style.CommentPragmas), Tokens(nullptr),
Krasimir Georgievad47c902017-08-30 14:34:57 +0000232 Callback(Callback), AllTokens(Tokens), PPBranchLevel(-1),
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000233 IncludeGuard(Style.IndentPPDirectives == FormatStyle::PPDIS_None
234 ? IG_Rejected
235 : IG_Inited),
236 IncludeGuardToken(nullptr), FirstStartColumn(FirstStartColumn) {}
Manuel Klimek71814b42013-10-11 21:25:45 +0000237
238void UnwrappedLineParser::reset() {
239 PPBranchLevel = -1;
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000240 IncludeGuard = Style.IndentPPDirectives == FormatStyle::PPDIS_None
241 ? IG_Rejected
242 : IG_Inited;
243 IncludeGuardToken = nullptr;
Manuel Klimek71814b42013-10-11 21:25:45 +0000244 Line.reset(new UnwrappedLine);
245 CommentsBeforeNextToken.clear();
Craig Topper2145bc02014-05-09 08:15:10 +0000246 FormatTok = nullptr;
Manuel Klimek71814b42013-10-11 21:25:45 +0000247 MustBreakBeforeNextToken = false;
248 PreprocessorDirectives.clear();
249 CurrentLines = &Lines;
250 DeclarationScopeStack.clear();
Manuel Klimek71814b42013-10-11 21:25:45 +0000251 PPStack.clear();
Krasimir Georgiev9ad83fe2017-10-30 14:01:50 +0000252 Line->FirstStartColumn = FirstStartColumn;
Manuel Klimek71814b42013-10-11 21:25:45 +0000253}
Daniel Jasperf7935112012-12-03 18:12:45 +0000254
Manuel Klimek20e0af62015-05-06 11:56:29 +0000255void UnwrappedLineParser::parse() {
Manuel Klimekab419912013-05-23 09:41:43 +0000256 IndexedTokenSource TokenSource(AllTokens);
Krasimir Georgiev9ad83fe2017-10-30 14:01:50 +0000257 Line->FirstStartColumn = FirstStartColumn;
Manuel Klimek71814b42013-10-11 21:25:45 +0000258 do {
Nicola Zaghen3538b392018-05-15 13:30:56 +0000259 LLVM_DEBUG(llvm::dbgs() << "----\n");
Manuel Klimek71814b42013-10-11 21:25:45 +0000260 reset();
261 Tokens = &TokenSource;
262 TokenSource.reset();
Daniel Jaspera79064a2013-03-01 18:11:39 +0000263
Manuel Klimek71814b42013-10-11 21:25:45 +0000264 readToken();
265 parseFile();
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000266
267 // If we found an include guard then all preprocessor directives (other than
268 // the guard) are over-indented by one.
269 if (IncludeGuard == IG_Found)
270 for (auto &Line : Lines)
271 if (Line.InPPDirective && Line.Level > 0)
272 --Line.Level;
273
Manuel Klimek71814b42013-10-11 21:25:45 +0000274 // Create line with eof token.
275 pushToken(FormatTok);
276 addUnwrappedLine();
277
278 for (SmallVectorImpl<UnwrappedLine>::iterator I = Lines.begin(),
279 E = Lines.end();
280 I != E; ++I) {
281 Callback.consumeUnwrappedLine(*I);
282 }
283 Callback.finishRun();
284 Lines.clear();
285 while (!PPLevelBranchIndex.empty() &&
Daniel Jasper53bd1672013-10-12 13:32:56 +0000286 PPLevelBranchIndex.back() + 1 >= PPLevelBranchCount.back()) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000287 PPLevelBranchIndex.resize(PPLevelBranchIndex.size() - 1);
288 PPLevelBranchCount.resize(PPLevelBranchCount.size() - 1);
289 }
290 if (!PPLevelBranchIndex.empty()) {
291 ++PPLevelBranchIndex.back();
292 assert(PPLevelBranchIndex.size() == PPLevelBranchCount.size());
293 assert(PPLevelBranchIndex.back() <= PPLevelBranchCount.back());
294 }
295 } while (!PPLevelBranchIndex.empty());
Manuel Klimek1abf7892013-01-04 23:34:14 +0000296}
297
Manuel Klimek1a18c402013-04-12 14:13:36 +0000298void UnwrappedLineParser::parseFile() {
Daniel Jasper9326f912015-05-05 08:40:32 +0000299 // The top-level context in a file always has declarations, except for pre-
300 // processor directives and JavaScript files.
301 bool MustBeDeclaration =
302 !Line->InPPDirective && Style.Language != FormatStyle::LK_JavaScript;
303 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
304 MustBeDeclaration);
Krasimir Georgiev26b144c2017-07-03 15:05:14 +0000305 if (Style.Language == FormatStyle::LK_TextProto)
306 parseBracedList();
307 else
308 parseLevel(/*HasOpeningBrace=*/false);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000309 // Make sure to format the remaining tokens.
Krasimir Georgiev0895f5e2018-06-25 11:08:24 +0000310 //
311 // LK_TextProto is special since its top-level is parsed as the body of a
312 // braced list, which does not necessarily have natural line separators such
313 // as a semicolon. Comments after the last entry that have been determined to
314 // not belong to that line, as in:
315 // key: value
316 // // endfile comment
317 // do not have a chance to be put on a line of their own until this point.
318 // Here we add this newline before end-of-file comments.
319 if (Style.Language == FormatStyle::LK_TextProto &&
320 !CommentsBeforeNextToken.empty())
321 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000322 flushComments(true);
Manuel Klimek1abf7892013-01-04 23:34:14 +0000323 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000324}
325
Manuel Klimek1a18c402013-04-12 14:13:36 +0000326void UnwrappedLineParser::parseLevel(bool HasOpeningBrace) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000327 bool SwitchLabelEncountered = false;
Daniel Jasperf7935112012-12-03 18:12:45 +0000328 do {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000329 tok::TokenKind kind = FormatTok->Tok.getKind();
330 if (FormatTok->Type == TT_MacroBlockBegin) {
331 kind = tok::l_brace;
332 } else if (FormatTok->Type == TT_MacroBlockEnd) {
333 kind = tok::r_brace;
334 }
335
336 switch (kind) {
Daniel Jasperf7935112012-12-03 18:12:45 +0000337 case tok::comment:
Daniel Jaspere25509f2012-12-17 11:29:41 +0000338 nextToken();
339 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000340 break;
341 case tok::l_brace:
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000342 // FIXME: Add parameter whether this can happen - if this happens, we must
343 // be in a non-declaration context.
Daniel Jasperb86e2722015-08-24 13:23:37 +0000344 if (!FormatTok->is(TT_MacroBlockBegin) && tryToParseBracedList())
345 continue;
Nico Weber9096fc02013-06-26 00:30:14 +0000346 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +0000347 addUnwrappedLine();
348 break;
349 case tok::r_brace:
Manuel Klimek1a18c402013-04-12 14:13:36 +0000350 if (HasOpeningBrace)
351 return;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000352 nextToken();
353 addUnwrappedLine();
Manuel Klimek1058d982013-01-06 20:07:31 +0000354 break;
Nico Weberc29f83b2018-01-23 16:30:56 +0000355 case tok::kw_default: {
356 unsigned StoredPosition = Tokens->getPosition();
Jonas Toth90d2aa22018-08-24 17:25:06 +0000357 FormatToken *Next;
358 do {
359 Next = Tokens->getNextToken();
360 } while (Next && Next->is(tok::comment));
Nico Weberc29f83b2018-01-23 16:30:56 +0000361 FormatTok = Tokens->setPosition(StoredPosition);
362 if (Next && Next->isNot(tok::colon)) {
363 // default not followed by ':' is not a case label; treat it like
364 // an identifier.
365 parseStructuralElement();
366 break;
367 }
368 // Else, if it is 'default:', fall through to the case handling.
Nico Weberf1add5e2018-01-24 01:47:22 +0000369 LLVM_FALLTHROUGH;
Nico Weberc29f83b2018-01-23 16:30:56 +0000370 }
Daniel Jasper516d7972013-07-25 11:31:57 +0000371 case tok::kw_case:
Manuel Klimek89628f62017-09-20 09:51:03 +0000372 if (Style.Language == FormatStyle::LK_JavaScript &&
373 Line->MustBeDeclaration) {
Martin Probstf785fd92017-08-04 17:07:15 +0000374 // A 'case: string' style field declaration.
375 parseStructuralElement();
376 break;
377 }
Daniel Jasper72407622013-09-02 08:26:29 +0000378 if (!SwitchLabelEncountered &&
379 (Style.IndentCaseLabels || (Line->InPPDirective && Line->Level == 1)))
380 ++Line->Level;
Daniel Jasper516d7972013-07-25 11:31:57 +0000381 SwitchLabelEncountered = true;
382 parseStructuralElement();
383 break;
Daniel Jasperf7935112012-12-03 18:12:45 +0000384 default:
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000385 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +0000386 break;
387 }
388 } while (!eof());
389}
390
Daniel Jasperadba2aa2015-05-18 12:52:00 +0000391void UnwrappedLineParser::calculateBraceTypes(bool ExpectClassBody) {
Manuel Klimekab419912013-05-23 09:41:43 +0000392 // We'll parse forward through the tokens until we hit
393 // a closing brace or eof - note that getNextToken() will
394 // parse macros, so this will magically work inside macro
395 // definitions, too.
396 unsigned StoredPosition = Tokens->getPosition();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000397 FormatToken *Tok = FormatTok;
Manuel Klimek89628f62017-09-20 09:51:03 +0000398 const FormatToken *PrevTok = Tok->Previous;
Manuel Klimekab419912013-05-23 09:41:43 +0000399 // Keep a stack of positions of lbrace tokens. We will
400 // update information about whether an lbrace starts a
401 // braced init list or a different block during the loop.
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000402 SmallVector<FormatToken *, 8> LBraceStack;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000403 assert(Tok->Tok.is(tok::l_brace));
Manuel Klimekab419912013-05-23 09:41:43 +0000404 do {
Daniel Jaspereb65e912015-12-21 18:31:15 +0000405 // Get next non-comment token.
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000406 FormatToken *NextTok;
Daniel Jasperca7bd722013-07-01 16:43:38 +0000407 unsigned ReadTokens = 0;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000408 do {
409 NextTok = Tokens->getNextToken();
Daniel Jasperca7bd722013-07-01 16:43:38 +0000410 ++ReadTokens;
Daniel Jasper7f5d53e2013-07-01 09:15:46 +0000411 } while (NextTok->is(tok::comment));
412
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000413 switch (Tok->Tok.getKind()) {
Manuel Klimekab419912013-05-23 09:41:43 +0000414 case tok::l_brace:
Martin Probst95ed8e72017-05-31 09:29:40 +0000415 if (Style.Language == FormatStyle::LK_JavaScript && PrevTok) {
Martin Probste8e27ca2017-11-25 09:33:47 +0000416 if (PrevTok->isOneOf(tok::colon, tok::less))
417 // A ':' indicates this code is in a type, or a braced list
418 // following a label in an object literal ({a: {b: 1}}).
419 // A '<' could be an object used in a comparison, but that is nonsense
420 // code (can never return true), so more likely it is a generic type
421 // argument (`X<{a: string; b: number}>`).
422 // The code below could be confused by semicolons between the
423 // individual members in a type member list, which would normally
424 // trigger BK_Block. In both cases, this must be parsed as an inline
425 // braced init.
Martin Probst95ed8e72017-05-31 09:29:40 +0000426 Tok->BlockKind = BK_BracedInit;
427 else if (PrevTok->is(tok::r_paren))
428 // `) { }` can only occur in function or method declarations in JS.
429 Tok->BlockKind = BK_Block;
430 } else {
Daniel Jasperb9a49902016-01-09 15:56:28 +0000431 Tok->BlockKind = BK_Unknown;
Martin Probst95ed8e72017-05-31 09:29:40 +0000432 }
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000433 LBraceStack.push_back(Tok);
Manuel Klimekab419912013-05-23 09:41:43 +0000434 break;
435 case tok::r_brace:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000436 if (LBraceStack.empty())
437 break;
438 if (LBraceStack.back()->BlockKind == BK_Unknown) {
439 bool ProbablyBracedList = false;
440 if (Style.Language == FormatStyle::LK_Proto) {
441 ProbablyBracedList = NextTok->isOneOf(tok::comma, tok::r_square);
442 } else {
443 // Using OriginalColumn to distinguish between ObjC methods and
444 // binary operators is a bit hacky.
445 bool NextIsObjCMethod = NextTok->isOneOf(tok::plus, tok::minus) &&
446 NextTok->OriginalColumn == 0;
Daniel Jasper91b032a2014-05-22 12:46:38 +0000447
Daniel Jasperb9a49902016-01-09 15:56:28 +0000448 // If there is a comma, semicolon or right paren after the closing
449 // brace, we assume this is a braced initializer list. Note that
450 // regardless how we mark inner braces here, we will overwrite the
451 // BlockKind later if we parse a braced list (where all blocks
452 // inside are by default braced lists), or when we explicitly detect
453 // blocks (for example while parsing lambdas).
Martin Probst95ed8e72017-05-31 09:29:40 +0000454 // FIXME: Some of these do not apply to JS, e.g. "} {" can never be a
455 // braced list in JS.
Daniel Jasperb9a49902016-01-09 15:56:28 +0000456 ProbablyBracedList =
Daniel Jasperacffeb82016-03-05 18:34:26 +0000457 (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probste1e12a72016-08-19 14:35:01 +0000458 NextTok->isOneOf(Keywords.kw_of, Keywords.kw_in,
459 Keywords.kw_as)) ||
Martin Probstb7fb2672017-05-10 13:53:29 +0000460 (Style.isCpp() && NextTok->is(tok::l_paren)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000461 NextTok->isOneOf(tok::comma, tok::period, tok::colon,
462 tok::r_paren, tok::r_square, tok::l_brace,
Manuel Klimekd0f3fe52018-04-11 14:51:54 +0000463 tok::ellipsis) ||
Daniel Jaspere4ada022016-12-13 10:05:03 +0000464 (NextTok->is(tok::identifier) &&
465 !PrevTok->isOneOf(tok::semi, tok::r_brace, tok::l_brace)) ||
Daniel Jasperb9a49902016-01-09 15:56:28 +0000466 (NextTok->is(tok::semi) &&
467 (!ExpectClassBody || LBraceStack.size() != 1)) ||
468 (NextTok->isBinaryOperator() && !NextIsObjCMethod);
Manuel Klimekd0f3fe52018-04-11 14:51:54 +0000469 if (NextTok->is(tok::l_square)) {
470 // We can have an array subscript after a braced init
471 // list, but C++11 attributes are expected after blocks.
472 NextTok = Tokens->getNextToken();
473 ++ReadTokens;
474 ProbablyBracedList = NextTok->isNot(tok::l_square);
475 }
Manuel Klimekab419912013-05-23 09:41:43 +0000476 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000477 if (ProbablyBracedList) {
478 Tok->BlockKind = BK_BracedInit;
479 LBraceStack.back()->BlockKind = BK_BracedInit;
480 } else {
481 Tok->BlockKind = BK_Block;
482 LBraceStack.back()->BlockKind = BK_Block;
483 }
Manuel Klimekab419912013-05-23 09:41:43 +0000484 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000485 LBraceStack.pop_back();
Manuel Klimekab419912013-05-23 09:41:43 +0000486 break;
Francois Ferrand6f40e212018-10-02 16:37:51 +0000487 case tok::identifier:
488 if (!Tok->is(TT_StatementMacro))
Paul Hoad5bcf99b2019-03-01 09:09:54 +0000489 break;
Francois Ferrand6f40e212018-10-02 16:37:51 +0000490 LLVM_FALLTHROUGH;
Daniel Jasperac7e34e2014-03-13 10:11:17 +0000491 case tok::at:
Manuel Klimekab419912013-05-23 09:41:43 +0000492 case tok::semi:
493 case tok::kw_if:
494 case tok::kw_while:
495 case tok::kw_for:
496 case tok::kw_switch:
497 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +0000498 case tok::kw___try:
Daniel Jasperb9a49902016-01-09 15:56:28 +0000499 if (!LBraceStack.empty() && LBraceStack.back()->BlockKind == BK_Unknown)
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000500 LBraceStack.back()->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000501 break;
502 default:
503 break;
504 }
Daniel Jasperb9a49902016-01-09 15:56:28 +0000505 PrevTok = Tok;
Manuel Klimekab419912013-05-23 09:41:43 +0000506 Tok = NextTok;
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000507 } while (Tok->Tok.isNot(tok::eof) && !LBraceStack.empty());
Daniel Jasperb9a49902016-01-09 15:56:28 +0000508
Manuel Klimekab419912013-05-23 09:41:43 +0000509 // Assume other blocks for all unclosed opening braces.
510 for (unsigned i = 0, e = LBraceStack.size(); i != e; ++i) {
Daniel Jasperb1f74a82013-07-09 09:06:29 +0000511 if (LBraceStack[i]->BlockKind == BK_Unknown)
512 LBraceStack[i]->BlockKind = BK_Block;
Manuel Klimekab419912013-05-23 09:41:43 +0000513 }
Manuel Klimekbab25fd2013-09-04 08:20:47 +0000514
Manuel Klimekab419912013-05-23 09:41:43 +0000515 FormatTok = Tokens->setPosition(StoredPosition);
516}
517
/// Mixes the \c std::hash of \p v into the running hash value \p seed.
template <class T>
static inline void hash_combine(std::size_t &seed, const T &v) {
  const std::size_t ValueHash = std::hash<T>{}(v);
  seed ^= ValueHash + 0x9e3779b9 + (seed << 6) + (seed >> 2);
}
523
524size_t UnwrappedLineParser::computePPHash() const {
525 size_t h = 0;
526 for (const auto &i : PPStack) {
527 hash_combine(h, size_t(i.Kind));
528 hash_combine(h, i.Line);
529 }
530 return h;
531}
532
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000533void UnwrappedLineParser::parseBlock(bool MustBeDeclaration, bool AddLevel,
534 bool MunchSemi) {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000535 assert(FormatTok->isOneOf(tok::l_brace, TT_MacroBlockBegin) &&
536 "'{' or macro block token expected");
537 const bool MacroBlock = FormatTok->is(TT_MacroBlockBegin);
Daniel Jaspereb65e912015-12-21 18:31:15 +0000538 FormatTok->BlockKind = BK_Block;
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000539
Francois Ferranda98a95c2017-07-28 07:56:14 +0000540 size_t PPStartHash = computePPHash();
541
Daniel Jasper516d7972013-07-25 11:31:57 +0000542 unsigned InitialLevel = Line->Level;
Krasimir Georgiev3e051052017-07-24 14:51:59 +0000543 nextToken(/*LevelDifference=*/AddLevel ? 1 : 0);
Daniel Jasperf7935112012-12-03 18:12:45 +0000544
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000545 if (MacroBlock && FormatTok->is(tok::l_paren))
546 parseParens();
547
Francois Ferranda98a95c2017-07-28 07:56:14 +0000548 size_t NbPreprocessorDirectives =
549 CurrentLines == &Lines ? PreprocessorDirectives.size() : 0;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +0000550 addUnwrappedLine();
Francois Ferranda98a95c2017-07-28 07:56:14 +0000551 size_t OpeningLineIndex =
552 CurrentLines->empty()
553 ? (UnwrappedLine::kInvalidIndex)
554 : (CurrentLines->size() - 1 - NbPreprocessorDirectives);
Daniel Jasperf7935112012-12-03 18:12:45 +0000555
Manuel Klimek0a3a3c92013-01-23 09:32:48 +0000556 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
557 MustBeDeclaration);
Daniel Jasper65ee3472013-07-31 23:16:02 +0000558 if (AddLevel)
559 ++Line->Level;
Nico Weber9096fc02013-06-26 00:30:14 +0000560 parseLevel(/*HasOpeningBrace=*/true);
Alexander Kornienko578fdd82012-12-06 18:03:27 +0000561
Marianne Mailhot-Sarrasin03137c62016-04-14 14:56:49 +0000562 if (eof())
563 return;
564
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000565 if (MacroBlock ? !FormatTok->is(TT_MacroBlockEnd)
566 : !FormatTok->is(tok::r_brace)) {
Daniel Jasper516d7972013-07-25 11:31:57 +0000567 Line->Level = InitialLevel;
Daniel Jaspereb65e912015-12-21 18:31:15 +0000568 FormatTok->BlockKind = BK_Block;
Manuel Klimek1a18c402013-04-12 14:13:36 +0000569 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +0000570 }
Alexander Kornienko0ea8e102012-12-04 15:40:36 +0000571
Francois Ferranda98a95c2017-07-28 07:56:14 +0000572 size_t PPEndHash = computePPHash();
573
Krasimir Georgiev3e051052017-07-24 14:51:59 +0000574 // Munch the closing brace.
575 nextToken(/*LevelDifference=*/AddLevel ? -1 : 0);
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +0000576
577 if (MacroBlock && FormatTok->is(tok::l_paren))
578 parseParens();
579
Manuel Klimekb212f3b2013-10-12 22:46:56 +0000580 if (MunchSemi && FormatTok->Tok.is(tok::semi))
581 nextToken();
Krasimir Georgiev3e051052017-07-24 14:51:59 +0000582 Line->Level = InitialLevel;
Francois Ferranda98a95c2017-07-28 07:56:14 +0000583
584 if (PPStartHash == PPEndHash) {
585 Line->MatchingOpeningBlockLineIndex = OpeningLineIndex;
586 if (OpeningLineIndex != UnwrappedLine::kInvalidIndex) {
587 // Update the opening line to add the forward reference as well
Manuel Klimek0dddcf72018-04-23 09:34:26 +0000588 (*CurrentLines)[OpeningLineIndex].MatchingClosingBlockLineIndex =
Francois Ferranda98a95c2017-07-28 07:56:14 +0000589 CurrentLines->size() - 1;
590 }
Francois Ferrande56a8292017-06-14 12:29:47 +0000591 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000592}
593
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000594static bool isGoogScope(const UnwrappedLine &Line) {
Daniel Jasper616de8642014-11-23 16:46:28 +0000595 // FIXME: Closure-library specific stuff should not be hard-coded but be
596 // configurable.
Daniel Jasper4a39c842014-05-06 13:54:10 +0000597 if (Line.Tokens.size() < 4)
598 return false;
599 auto I = Line.Tokens.begin();
600 if (I->Tok->TokenText != "goog")
601 return false;
602 ++I;
603 if (I->Tok->isNot(tok::period))
604 return false;
605 ++I;
606 if (I->Tok->TokenText != "scope")
607 return false;
608 ++I;
609 return I->Tok->is(tok::l_paren);
610}
611
Martin Probst101ec892017-05-09 20:04:09 +0000612static bool isIIFE(const UnwrappedLine &Line,
613 const AdditionalKeywords &Keywords) {
614 // Look for the start of an immediately invoked anonymous function.
615 // https://en.wikipedia.org/wiki/Immediately-invoked_function_expression
616 // This is commonly done in JavaScript to create a new, anonymous scope.
617 // Example: (function() { ... })()
618 if (Line.Tokens.size() < 3)
619 return false;
620 auto I = Line.Tokens.begin();
621 if (I->Tok->isNot(tok::l_paren))
622 return false;
623 ++I;
624 if (I->Tok->isNot(Keywords.kw_function))
625 return false;
626 ++I;
627 return I->Tok->is(tok::l_paren);
628}
629
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000630static bool ShouldBreakBeforeBrace(const FormatStyle &Style,
631 const FormatToken &InitialToken) {
Francois Ferrande8a301f2019-06-06 20:06:23 +0000632 if (InitialToken.isOneOf(tok::kw_namespace, TT_NamespaceMacro))
Daniel Jasperc1bc38e2015-09-29 14:57:55 +0000633 return Style.BraceWrapping.AfterNamespace;
634 if (InitialToken.is(tok::kw_class))
635 return Style.BraceWrapping.AfterClass;
636 if (InitialToken.is(tok::kw_union))
637 return Style.BraceWrapping.AfterUnion;
638 if (InitialToken.is(tok::kw_struct))
639 return Style.BraceWrapping.AfterStruct;
640 return false;
Roman Kashitsyna043ced2014-08-11 12:18:01 +0000641}
642
Manuel Klimek516e0542013-09-04 13:25:30 +0000643void UnwrappedLineParser::parseChildBlock() {
644 FormatTok->BlockKind = BK_Block;
645 nextToken();
646 {
Manuel Klimek89628f62017-09-20 09:51:03 +0000647 bool SkipIndent = (Style.Language == FormatStyle::LK_JavaScript &&
648 (isGoogScope(*Line) || isIIFE(*Line, Keywords)));
Manuel Klimek516e0542013-09-04 13:25:30 +0000649 ScopedLineState LineState(*this);
650 ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
651 /*MustBeDeclaration=*/false);
Martin Probst101ec892017-05-09 20:04:09 +0000652 Line->Level += SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000653 parseLevel(/*HasOpeningBrace=*/true);
Daniel Jasper02c7bca2015-03-30 09:56:50 +0000654 flushComments(isOnNewLine(*FormatTok));
Martin Probst101ec892017-05-09 20:04:09 +0000655 Line->Level -= SkipIndent ? 0 : 1;
Manuel Klimek516e0542013-09-04 13:25:30 +0000656 }
657 nextToken();
658}
659
Daniel Jasperf7935112012-12-03 18:12:45 +0000660void UnwrappedLineParser::parsePPDirective() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000661 assert(FormatTok->Tok.is(tok::hash) && "'#' expected");
Manuel Klimek20e0af62015-05-06 11:56:29 +0000662 ScopedMacroState MacroState(*Line, Tokens, FormatTok);
Paul Hoad701a0d72019-03-20 20:49:43 +0000663
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000664 nextToken();
665
Craig Topper2145bc02014-05-09 08:15:10 +0000666 if (!FormatTok->Tok.getIdentifierInfo()) {
Manuel Klimek591b5802013-01-31 15:58:48 +0000667 parsePPUnknown();
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000668 return;
Daniel Jasperf7935112012-12-03 18:12:45 +0000669 }
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000670
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000671 switch (FormatTok->Tok.getIdentifierInfo()->getPPKeywordID()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000672 case tok::pp_define:
673 parsePPDefine();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000674 return;
675 case tok::pp_if:
Manuel Klimek71814b42013-10-11 21:25:45 +0000676 parsePPIf(/*IfDef=*/false);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000677 break;
678 case tok::pp_ifdef:
679 case tok::pp_ifndef:
Manuel Klimek71814b42013-10-11 21:25:45 +0000680 parsePPIf(/*IfDef=*/true);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000681 break;
682 case tok::pp_else:
683 parsePPElse();
684 break;
685 case tok::pp_elif:
686 parsePPElIf();
687 break;
688 case tok::pp_endif:
689 parsePPEndIf();
Manuel Klimek1abf7892013-01-04 23:34:14 +0000690 break;
691 default:
692 parsePPUnknown();
693 break;
694 }
695}
696
Manuel Klimek68b03042014-04-14 09:14:11 +0000697void UnwrappedLineParser::conditionalCompilationCondition(bool Unreachable) {
Francois Ferranda98a95c2017-07-28 07:56:14 +0000698 size_t Line = CurrentLines->size();
699 if (CurrentLines == &PreprocessorDirectives)
700 Line += Lines.size();
701
702 if (Unreachable ||
703 (!PPStack.empty() && PPStack.back().Kind == PP_Unreachable))
704 PPStack.push_back({PP_Unreachable, Line});
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000705 else
Francois Ferranda98a95c2017-07-28 07:56:14 +0000706 PPStack.push_back({PP_Conditional, Line});
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000707}
708
Manuel Klimek68b03042014-04-14 09:14:11 +0000709void UnwrappedLineParser::conditionalCompilationStart(bool Unreachable) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000710 ++PPBranchLevel;
711 assert(PPBranchLevel >= 0 && PPBranchLevel <= (int)PPLevelBranchIndex.size());
712 if (PPBranchLevel == (int)PPLevelBranchIndex.size()) {
713 PPLevelBranchIndex.push_back(0);
714 PPLevelBranchCount.push_back(0);
715 }
716 PPChainBranchIndex.push(0);
Manuel Klimek68b03042014-04-14 09:14:11 +0000717 bool Skip = PPLevelBranchIndex[PPBranchLevel] > 0;
718 conditionalCompilationCondition(Unreachable || Skip);
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000719}
720
Manuel Klimek68b03042014-04-14 09:14:11 +0000721void UnwrappedLineParser::conditionalCompilationAlternative() {
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000722 if (!PPStack.empty())
723 PPStack.pop_back();
Manuel Klimek71814b42013-10-11 21:25:45 +0000724 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
725 if (!PPChainBranchIndex.empty())
726 ++PPChainBranchIndex.top();
Manuel Klimek68b03042014-04-14 09:14:11 +0000727 conditionalCompilationCondition(
728 PPBranchLevel >= 0 && !PPChainBranchIndex.empty() &&
729 PPLevelBranchIndex[PPBranchLevel] != PPChainBranchIndex.top());
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000730}
731
Manuel Klimek68b03042014-04-14 09:14:11 +0000732void UnwrappedLineParser::conditionalCompilationEnd() {
Manuel Klimek71814b42013-10-11 21:25:45 +0000733 assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
734 if (PPBranchLevel >= 0 && !PPChainBranchIndex.empty()) {
735 if (PPChainBranchIndex.top() + 1 > PPLevelBranchCount[PPBranchLevel]) {
Manuel Klimek71814b42013-10-11 21:25:45 +0000736 PPLevelBranchCount[PPBranchLevel] = PPChainBranchIndex.top() + 1;
737 }
738 }
Manuel Klimek14bd9172014-01-29 08:49:02 +0000739 // Guard against #endif's without #if.
Krasimir Georgievad47c902017-08-30 14:34:57 +0000740 if (PPBranchLevel > -1)
Manuel Klimek14bd9172014-01-29 08:49:02 +0000741 --PPBranchLevel;
Manuel Klimek71814b42013-10-11 21:25:45 +0000742 if (!PPChainBranchIndex.empty())
743 PPChainBranchIndex.pop();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000744 if (!PPStack.empty())
745 PPStack.pop_back();
Manuel Klimek68b03042014-04-14 09:14:11 +0000746}
747
748void UnwrappedLineParser::parsePPIf(bool IfDef) {
Daniel Jasper62703eb2017-03-01 11:10:11 +0000749 bool IfNDef = FormatTok->is(tok::pp_ifndef);
Manuel Klimek68b03042014-04-14 09:14:11 +0000750 nextToken();
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000751 bool Unreachable = false;
752 if (!IfDef && (FormatTok->is(tok::kw_false) || FormatTok->TokenText == "0"))
753 Unreachable = true;
Daniel Jasper62703eb2017-03-01 11:10:11 +0000754 if (IfDef && !IfNDef && FormatTok->TokenText == "SWIG")
Daniel Jaspereab6cd42017-03-01 10:47:52 +0000755 Unreachable = true;
756 conditionalCompilationStart(Unreachable);
Krasimir Georgievad47c902017-08-30 14:34:57 +0000757 FormatToken *IfCondition = FormatTok;
758 // If there's a #ifndef on the first line, and the only lines before it are
759 // comments, it could be an include guard.
760 bool MaybeIncludeGuard = IfNDef;
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000761 if (IncludeGuard == IG_Inited && MaybeIncludeGuard)
Krasimir Georgievad47c902017-08-30 14:34:57 +0000762 for (auto &Line : Lines) {
763 if (!Line.Tokens.front().Tok->is(tok::comment)) {
764 MaybeIncludeGuard = false;
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000765 IncludeGuard = IG_Rejected;
Krasimir Georgievad47c902017-08-30 14:34:57 +0000766 break;
767 }
768 }
Krasimir Georgievad47c902017-08-30 14:34:57 +0000769 --PPBranchLevel;
Manuel Klimek68b03042014-04-14 09:14:11 +0000770 parsePPUnknown();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000771 ++PPBranchLevel;
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000772 if (IncludeGuard == IG_Inited && MaybeIncludeGuard) {
773 IncludeGuard = IG_IfNdefed;
774 IncludeGuardToken = IfCondition;
775 }
Manuel Klimek68b03042014-04-14 09:14:11 +0000776}
777
778void UnwrappedLineParser::parsePPElse() {
Krasimir Georgievad47c902017-08-30 14:34:57 +0000779 // If a potential include guard has an #else, it's not an include guard.
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000780 if (IncludeGuard == IG_Defined && PPBranchLevel == 0)
781 IncludeGuard = IG_Rejected;
Manuel Klimek68b03042014-04-14 09:14:11 +0000782 conditionalCompilationAlternative();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000783 if (PPBranchLevel > -1)
784 --PPBranchLevel;
Manuel Klimek68b03042014-04-14 09:14:11 +0000785 parsePPUnknown();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000786 ++PPBranchLevel;
Manuel Klimek68b03042014-04-14 09:14:11 +0000787}
788
789void UnwrappedLineParser::parsePPElIf() { parsePPElse(); }
790
791void UnwrappedLineParser::parsePPEndIf() {
792 conditionalCompilationEnd();
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000793 parsePPUnknown();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000794 // If the #endif of a potential include guard is the last thing in the file,
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000795 // then we found an include guard.
Krasimir Georgievad47c902017-08-30 14:34:57 +0000796 unsigned TokenPosition = Tokens->getPosition();
797 FormatToken *PeekNext = AllTokens[TokenPosition];
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000798 if (IncludeGuard == IG_Defined && PPBranchLevel == -1 &&
799 PeekNext->is(tok::eof) &&
Daniel Jasper4df130f2017-09-04 13:33:52 +0000800 Style.IndentPPDirectives != FormatStyle::PPDIS_None)
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000801 IncludeGuard = IG_Found;
Alexander Kornienkof2e02122013-05-24 18:24:24 +0000802}
803
Manuel Klimek1abf7892013-01-04 23:34:14 +0000804void UnwrappedLineParser::parsePPDefine() {
805 nextToken();
806
Owen Panfb73b79a2019-04-18 20:17:08 +0000807 if (!FormatTok->Tok.getIdentifierInfo()) {
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000808 IncludeGuard = IG_Rejected;
809 IncludeGuardToken = nullptr;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000810 parsePPUnknown();
811 return;
812 }
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000813
814 if (IncludeGuard == IG_IfNdefed &&
815 IncludeGuardToken->TokenText == FormatTok->TokenText) {
816 IncludeGuard = IG_Defined;
817 IncludeGuardToken = nullptr;
Krasimir Georgievad47c902017-08-30 14:34:57 +0000818 for (auto &Line : Lines) {
819 if (!Line.Tokens.front().Tok->isOneOf(tok::comment, tok::hash)) {
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000820 IncludeGuard = IG_Rejected;
Krasimir Georgievad47c902017-08-30 14:34:57 +0000821 break;
822 }
823 }
824 }
Mark Zeren1c3afaf2018-02-05 15:59:00 +0000825
Manuel Klimek1abf7892013-01-04 23:34:14 +0000826 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000827 if (FormatTok->Tok.getKind() == tok::l_paren &&
828 FormatTok->WhitespaceRange.getBegin() ==
829 FormatTok->WhitespaceRange.getEnd()) {
Manuel Klimek1abf7892013-01-04 23:34:14 +0000830 parseParens();
831 }
Paul Hoad701a0d72019-03-20 20:49:43 +0000832 if (Style.IndentPPDirectives != FormatStyle::PPDIS_None)
Krasimir Georgievad47c902017-08-30 14:34:57 +0000833 Line->Level += PPBranchLevel + 1;
Manuel Klimek1abf7892013-01-04 23:34:14 +0000834 addUnwrappedLine();
Krasimir Georgievad47c902017-08-30 14:34:57 +0000835 ++Line->Level;
Manuel Klimek1b896292013-01-07 09:34:28 +0000836
837 // Errors during a preprocessor directive can only affect the layout of the
838 // preprocessor directive, and thus we ignore them. An alternative approach
839 // would be to use the same approach we use on the file level (no
840 // re-indentation if there was a structural error) within the macro
841 // definition.
Manuel Klimek1abf7892013-01-04 23:34:14 +0000842 parseFile();
843}
844
845void UnwrappedLineParser::parsePPUnknown() {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000846 do {
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000847 nextToken();
848 } while (!eof());
Paul Hoad701a0d72019-03-20 20:49:43 +0000849 if (Style.IndentPPDirectives != FormatStyle::PPDIS_None)
Krasimir Georgievad47c902017-08-30 14:34:57 +0000850 Line->Level += PPBranchLevel + 1;
Manuel Klimeka71e5d82013-01-02 16:30:12 +0000851 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +0000852}
853
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000854// Here we blacklist certain tokens that are not usually the first token in an
855// unwrapped line. This is used in attempt to distinguish macro calls without
856// trailing semicolons from other constructs split to several lines.
Benjamin Kramer8407df72015-03-09 16:47:52 +0000857static bool tokenCanStartNewLine(const clang::Token &Tok) {
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000858 // Semicolon can be a null-statement, l_square can be a start of a macro or
859 // a C++11 attribute, but this doesn't seem to be common.
860 return Tok.isNot(tok::semi) && Tok.isNot(tok::l_brace) &&
861 Tok.isNot(tok::l_square) &&
862 // Tokens that can only be used as binary operators and a part of
863 // overloaded operator names.
864 Tok.isNot(tok::period) && Tok.isNot(tok::periodstar) &&
865 Tok.isNot(tok::arrow) && Tok.isNot(tok::arrowstar) &&
866 Tok.isNot(tok::less) && Tok.isNot(tok::greater) &&
867 Tok.isNot(tok::slash) && Tok.isNot(tok::percent) &&
868 Tok.isNot(tok::lessless) && Tok.isNot(tok::greatergreater) &&
869 Tok.isNot(tok::equal) && Tok.isNot(tok::plusequal) &&
870 Tok.isNot(tok::minusequal) && Tok.isNot(tok::starequal) &&
871 Tok.isNot(tok::slashequal) && Tok.isNot(tok::percentequal) &&
872 Tok.isNot(tok::ampequal) && Tok.isNot(tok::pipeequal) &&
873 Tok.isNot(tok::caretequal) && Tok.isNot(tok::greatergreaterequal) &&
874 Tok.isNot(tok::lesslessequal) &&
875 // Colon is used in labels, base class lists, initializer lists,
876 // range-based for loops, ternary operator, but should never be the
877 // first token in an unwrapped line.
Daniel Jasper5ebb2f32014-05-21 13:08:17 +0000878 Tok.isNot(tok::colon) &&
879 // 'noexcept' is a trailing annotation.
880 Tok.isNot(tok::kw_noexcept);
Alexander Kornienkoa04e5e22013-04-09 16:15:19 +0000881}
882
Martin Probst533965c2016-04-19 18:19:06 +0000883static bool mustBeJSIdent(const AdditionalKeywords &Keywords,
884 const FormatToken *FormatTok) {
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000885 // FIXME: This returns true for C/C++ keywords like 'struct'.
886 return FormatTok->is(tok::identifier) &&
887 (FormatTok->Tok.getIdentifierInfo() == nullptr ||
Martin Probst3dbbefa2016-11-10 16:21:02 +0000888 !FormatTok->isOneOf(
889 Keywords.kw_in, Keywords.kw_of, Keywords.kw_as, Keywords.kw_async,
890 Keywords.kw_await, Keywords.kw_yield, Keywords.kw_finally,
891 Keywords.kw_function, Keywords.kw_import, Keywords.kw_is,
892 Keywords.kw_let, Keywords.kw_var, tok::kw_const,
893 Keywords.kw_abstract, Keywords.kw_extends, Keywords.kw_implements,
Manuel Klimek89628f62017-09-20 09:51:03 +0000894 Keywords.kw_instanceof, Keywords.kw_interface, Keywords.kw_throws,
895 Keywords.kw_from));
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000896}
897
Martin Probst533965c2016-04-19 18:19:06 +0000898static bool mustBeJSIdentOrValue(const AdditionalKeywords &Keywords,
899 const FormatToken *FormatTok) {
Martin Probstb9316ff2016-09-18 17:21:52 +0000900 return FormatTok->Tok.isLiteral() ||
901 FormatTok->isOneOf(tok::kw_true, tok::kw_false) ||
902 mustBeJSIdent(Keywords, FormatTok);
Martin Probst533965c2016-04-19 18:19:06 +0000903}
904
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000905// isJSDeclOrStmt returns true if |FormatTok| starts a declaration or statement
906// when encountered after a value (see mustBeJSIdentOrValue).
907static bool isJSDeclOrStmt(const AdditionalKeywords &Keywords,
908 const FormatToken *FormatTok) {
909 return FormatTok->isOneOf(
Martin Probst5f8445b2016-04-24 22:05:09 +0000910 tok::kw_return, Keywords.kw_yield,
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000911 // conditionals
912 tok::kw_if, tok::kw_else,
913 // loops
914 tok::kw_for, tok::kw_while, tok::kw_do, tok::kw_continue, tok::kw_break,
915 // switch/case
916 tok::kw_switch, tok::kw_case,
917 // exceptions
918 tok::kw_throw, tok::kw_try, tok::kw_catch, Keywords.kw_finally,
919 // declaration
920 tok::kw_const, tok::kw_class, Keywords.kw_var, Keywords.kw_let,
Martin Probst5f8445b2016-04-24 22:05:09 +0000921 Keywords.kw_async, Keywords.kw_function,
922 // import/export
923 Keywords.kw_import, tok::kw_export);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000924}
925
926// readTokenWithJavaScriptASI reads the next token and terminates the current
927// line if JavaScript Automatic Semicolon Insertion must
928// happen between the current token and the next token.
929//
930// This method is conservative - it cannot cover all edge cases of JavaScript,
931// but only aims to correctly handle certain well known cases. It *must not*
932// return true in speculative cases.
933void UnwrappedLineParser::readTokenWithJavaScriptASI() {
934 FormatToken *Previous = FormatTok;
935 readToken();
936 FormatToken *Next = FormatTok;
937
938 bool IsOnSameLine =
939 CommentsBeforeNextToken.empty()
940 ? Next->NewlinesBefore == 0
941 : CommentsBeforeNextToken.front()->NewlinesBefore == 0;
942 if (IsOnSameLine)
943 return;
944
945 bool PreviousMustBeValue = mustBeJSIdentOrValue(Keywords, Previous);
Martin Probst717f6dc2016-10-21 05:11:38 +0000946 bool PreviousStartsTemplateExpr =
947 Previous->is(TT_TemplateString) && Previous->TokenText.endswith("${");
Martin Probst7e0f25b2017-11-25 09:19:42 +0000948 if (PreviousMustBeValue || Previous->is(tok::r_paren)) {
949 // If the line contains an '@' sign, the previous token might be an
950 // annotation, which can precede another identifier/value.
951 bool HasAt = std::find_if(Line->Tokens.begin(), Line->Tokens.end(),
952 [](UnwrappedLineNode &LineNode) {
953 return LineNode.Tok->is(tok::at);
954 }) != Line->Tokens.end();
955 if (HasAt)
Martin Probstbbffeac2016-04-11 07:35:57 +0000956 return;
957 }
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000958 if (Next->is(tok::exclaim) && PreviousMustBeValue)
Martin Probstd40bca42017-01-09 08:56:36 +0000959 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000960 bool NextMustBeValue = mustBeJSIdentOrValue(Keywords, Next);
Martin Probst717f6dc2016-10-21 05:11:38 +0000961 bool NextEndsTemplateExpr =
962 Next->is(TT_TemplateString) && Next->TokenText.startswith("}");
963 if (NextMustBeValue && !NextEndsTemplateExpr && !PreviousStartsTemplateExpr &&
964 (PreviousMustBeValue ||
965 Previous->isOneOf(tok::r_square, tok::r_paren, tok::plusplus,
966 tok::minusminus)))
Martin Probstd40bca42017-01-09 08:56:36 +0000967 return addUnwrappedLine();
Martin Probst0a19d432017-08-09 15:19:16 +0000968 if ((PreviousMustBeValue || Previous->is(tok::r_paren)) &&
969 isJSDeclOrStmt(Keywords, Next))
Martin Probstd40bca42017-01-09 08:56:36 +0000970 return addUnwrappedLine();
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +0000971}
972
Manuel Klimek6b9eeba2013-01-07 14:56:16 +0000973void UnwrappedLineParser::parseStructuralElement() {
Daniel Jasper498f5582015-12-25 08:53:31 +0000974 assert(!FormatTok->is(tok::l_brace));
975 if (Style.Language == FormatStyle::LK_TableGen &&
976 FormatTok->is(tok::pp_include)) {
977 nextToken();
978 if (FormatTok->is(tok::string_literal))
979 nextToken();
980 addUnwrappedLine();
981 return;
982 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +0000983 switch (FormatTok->Tok.getKind()) {
Daniel Jasper8f463652014-08-26 23:15:12 +0000984 case tok::kw_asm:
Daniel Jasper8f463652014-08-26 23:15:12 +0000985 nextToken();
986 if (FormatTok->is(tok::l_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000987 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper2337f282015-01-12 10:14:56 +0000988 nextToken();
Daniel Jasper4429f142014-08-27 17:16:46 +0000989 while (FormatTok && FormatTok->isNot(tok::eof)) {
Daniel Jasper8f463652014-08-26 23:15:12 +0000990 if (FormatTok->is(tok::r_brace)) {
Daniel Jasperc6366072015-05-10 08:42:04 +0000991 FormatTok->Type = TT_InlineASMBrace;
Daniel Jasper8f463652014-08-26 23:15:12 +0000992 nextToken();
Daniel Jasper790d4f92015-05-11 11:59:46 +0000993 addUnwrappedLine();
Daniel Jasper8f463652014-08-26 23:15:12 +0000994 break;
995 }
Daniel Jasper2337f282015-01-12 10:14:56 +0000996 FormatTok->Finalized = true;
Daniel Jasper8f463652014-08-26 23:15:12 +0000997 nextToken();
998 }
999 }
1000 break;
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001001 case tok::kw_namespace:
1002 parseNamespace();
1003 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001004 case tok::kw_public:
1005 case tok::kw_protected:
1006 case tok::kw_private:
Daniel Jasper83709082015-02-18 17:14:05 +00001007 if (Style.Language == FormatStyle::LK_Java ||
Paul Hoadcbb726d2019-03-21 13:09:22 +00001008 Style.Language == FormatStyle::LK_JavaScript || Style.isCSharp())
Daniel Jasperc58c70e2014-09-15 11:21:46 +00001009 nextToken();
1010 else
1011 parseAccessSpecifier();
Daniel Jasperf7935112012-12-03 18:12:45 +00001012 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001013 case tok::kw_if:
1014 parseIfThenElse();
Daniel Jasperf7935112012-12-03 18:12:45 +00001015 return;
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001016 case tok::kw_for:
1017 case tok::kw_while:
1018 parseForOrWhileLoop();
1019 return;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001020 case tok::kw_do:
1021 parseDoWhile();
1022 return;
1023 case tok::kw_switch:
Martin Probstf785fd92017-08-04 17:07:15 +00001024 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration)
1025 // 'switch: string' field declaration.
1026 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001027 parseSwitch();
1028 return;
1029 case tok::kw_default:
Martin Probstf785fd92017-08-04 17:07:15 +00001030 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration)
1031 // 'default: string' field declaration.
1032 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001033 nextToken();
Nico Weberc29f83b2018-01-23 16:30:56 +00001034 if (FormatTok->is(tok::colon)) {
1035 parseLabel();
1036 return;
1037 }
1038 // e.g. "default void f() {}" in a Java interface.
1039 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001040 case tok::kw_case:
Martin Probstf785fd92017-08-04 17:07:15 +00001041 if (Style.Language == FormatStyle::LK_JavaScript && Line->MustBeDeclaration)
1042 // 'case: string' field declaration.
1043 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001044 parseCaseLabel();
1045 return;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001046 case tok::kw_try:
Nico Weberfac23712015-02-04 15:26:27 +00001047 case tok::kw___try:
Daniel Jasper04a71a42014-05-08 11:58:24 +00001048 parseTryCatch();
1049 return;
Manuel Klimekae610d12013-01-21 14:32:05 +00001050 case tok::kw_extern:
1051 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001052 if (FormatTok->Tok.is(tok::string_literal)) {
Manuel Klimekae610d12013-01-21 14:32:05 +00001053 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001054 if (FormatTok->Tok.is(tok::l_brace)) {
Krasimir Georgievd6ce9372017-09-15 11:23:50 +00001055 if (Style.BraceWrapping.AfterExternBlock) {
1056 addUnwrappedLine();
1057 parseBlock(/*MustBeDeclaration=*/true);
1058 } else {
1059 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/false);
1060 }
Manuel Klimekae610d12013-01-21 14:32:05 +00001061 addUnwrappedLine();
1062 return;
1063 }
1064 }
Daniel Jaspere1e43192014-04-01 12:55:11 +00001065 break;
Daniel Jasperfca735c2015-02-19 16:14:18 +00001066 case tok::kw_export:
1067 if (Style.Language == FormatStyle::LK_JavaScript) {
1068 parseJavaScriptEs6ImportExport();
1069 return;
1070 }
Sam McCall6f3778c2018-09-05 07:44:02 +00001071 if (!Style.isCpp())
1072 break;
1073 // Handle C++ "(inline|export) namespace".
1074 LLVM_FALLTHROUGH;
1075 case tok::kw_inline:
1076 nextToken();
1077 if (FormatTok->Tok.is(tok::kw_namespace)) {
1078 parseNamespace();
1079 return;
1080 }
Daniel Jasperfca735c2015-02-19 16:14:18 +00001081 break;
Daniel Jaspere1e43192014-04-01 12:55:11 +00001082 case tok::identifier:
Daniel Jasper66cb8c52015-05-04 09:22:29 +00001083 if (FormatTok->is(TT_ForEachMacro)) {
Daniel Jaspere1e43192014-04-01 12:55:11 +00001084 parseForOrWhileLoop();
1085 return;
1086 }
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +00001087 if (FormatTok->is(TT_MacroBlockBegin)) {
1088 parseBlock(/*MustBeDeclaration=*/false, /*AddLevel=*/true,
1089 /*MunchSemi=*/false);
1090 return;
1091 }
Daniel Jasper3d5a7d62016-06-20 18:20:38 +00001092 if (FormatTok->is(Keywords.kw_import)) {
1093 if (Style.Language == FormatStyle::LK_JavaScript) {
1094 parseJavaScriptEs6ImportExport();
1095 return;
1096 }
1097 if (Style.Language == FormatStyle::LK_Proto) {
1098 nextToken();
Daniel Jasper8b61d142016-06-20 20:39:53 +00001099 if (FormatTok->is(tok::kw_public))
1100 nextToken();
Daniel Jasper3d5a7d62016-06-20 18:20:38 +00001101 if (!FormatTok->is(tok::string_literal))
1102 return;
1103 nextToken();
1104 if (FormatTok->is(tok::semi))
1105 nextToken();
1106 addUnwrappedLine();
1107 return;
1108 }
Daniel Jasper354aa512015-02-19 16:07:32 +00001109 }
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001110 if (Style.isCpp() &&
Daniel Jasper72b33572017-03-31 12:04:37 +00001111 FormatTok->isOneOf(Keywords.kw_signals, Keywords.kw_qsignals,
Daniel Jaspera00de632015-12-01 12:05:04 +00001112 Keywords.kw_slots, Keywords.kw_qslots)) {
Daniel Jasperde0d1f32015-04-24 07:50:34 +00001113 nextToken();
1114 if (FormatTok->is(tok::colon)) {
1115 nextToken();
1116 addUnwrappedLine();
Daniel Jasper31343832016-07-27 10:13:24 +00001117 return;
Daniel Jasperde0d1f32015-04-24 07:50:34 +00001118 }
Daniel Jasper53395402015-04-07 15:04:40 +00001119 }
Francois Ferrand6f40e212018-10-02 16:37:51 +00001120 if (Style.isCpp() && FormatTok->is(TT_StatementMacro)) {
1121 parseStatementMacro();
1122 return;
1123 }
Francois Ferrande8a301f2019-06-06 20:06:23 +00001124 if (Style.isCpp() && FormatTok->is(TT_NamespaceMacro)) {
1125 parseNamespace();
1126 return;
1127 }
Manuel Klimekae610d12013-01-21 14:32:05 +00001128 // In all other cases, parse the declaration.
1129 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001130 default:
1131 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001132 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001133 do {
Manuel Klimeke411aa82017-09-20 09:29:37 +00001134 const FormatToken *Previous = FormatTok->Previous;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001135 switch (FormatTok->Tok.getKind()) {
Nico Weber372d8dc2013-02-10 20:35:35 +00001136 case tok::at:
1137 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001138 if (FormatTok->Tok.is(tok::l_brace)) {
1139 nextToken();
Nico Weber372d8dc2013-02-10 20:35:35 +00001140 parseBracedList();
Nico Weberc068ff72018-01-23 17:10:25 +00001141 break;
Hans Wennborg749c1b52018-10-19 16:19:52 +00001142 } else if (Style.Language == FormatStyle::LK_Java &&
1143 FormatTok->is(Keywords.kw_interface)) {
1144 nextToken();
1145 break;
Nico Weberc068ff72018-01-23 17:10:25 +00001146 }
1147 switch (FormatTok->Tok.getObjCKeywordID()) {
1148 case tok::objc_public:
1149 case tok::objc_protected:
1150 case tok::objc_package:
1151 case tok::objc_private:
1152 return parseAccessSpecifier();
1153 case tok::objc_interface:
1154 case tok::objc_implementation:
1155 return parseObjCInterfaceOrImplementation();
1156 case tok::objc_protocol:
1157 if (parseObjCProtocol())
1158 return;
1159 break;
1160 case tok::objc_end:
1161 return; // Handled by the caller.
1162 case tok::objc_optional:
1163 case tok::objc_required:
1164 nextToken();
1165 addUnwrappedLine();
1166 return;
1167 case tok::objc_autoreleasepool:
1168 nextToken();
1169 if (FormatTok->Tok.is(tok::l_brace)) {
Paul Hoadfb13e652019-10-03 18:42:31 +00001170 if (Style.BraceWrapping.AfterControlStatement ==
1171 FormatStyle::BWACS_Always)
Nico Weberc068ff72018-01-23 17:10:25 +00001172 addUnwrappedLine();
1173 parseBlock(/*MustBeDeclaration=*/false);
1174 }
1175 addUnwrappedLine();
1176 return;
Francois Ferrandba91c3d2018-02-27 13:48:21 +00001177 case tok::objc_synchronized:
1178 nextToken();
1179 if (FormatTok->Tok.is(tok::l_paren))
Paul Hoad5bcf99b2019-03-01 09:09:54 +00001180 // Skip synchronization object
1181 parseParens();
Francois Ferrandba91c3d2018-02-27 13:48:21 +00001182 if (FormatTok->Tok.is(tok::l_brace)) {
Paul Hoadfb13e652019-10-03 18:42:31 +00001183 if (Style.BraceWrapping.AfterControlStatement ==
1184 FormatStyle::BWACS_Always)
Francois Ferrandba91c3d2018-02-27 13:48:21 +00001185 addUnwrappedLine();
1186 parseBlock(/*MustBeDeclaration=*/false);
1187 }
1188 addUnwrappedLine();
1189 return;
Nico Weberc068ff72018-01-23 17:10:25 +00001190 case tok::objc_try:
1191 // This branch isn't strictly necessary (the kw_try case below would
1192 // do this too after the tok::at is parsed above). But be explicit.
1193 parseTryCatch();
1194 return;
1195 default:
1196 break;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001197 }
Nico Weber372d8dc2013-02-10 20:35:35 +00001198 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001199 case tok::kw_enum:
Daniel Jaspera7900ad2016-05-08 18:12:22 +00001200 // Ignore if this is part of "template <enum ...".
1201 if (Previous && Previous->is(tok::less)) {
1202 nextToken();
1203 break;
1204 }
1205
Daniel Jasper90cf3802015-06-17 09:44:02 +00001206 // parseEnum falls through and does not yet add an unwrapped line as an
1207 // enum definition can start a structural element.
Daniel Jasper6f5a1932015-12-29 08:54:23 +00001208 if (!parseEnum())
1209 break;
Daniel Jasperc6dd2732015-07-16 14:25:43 +00001210 // This only applies for C++.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001211 if (!Style.isCpp()) {
Daniel Jasper90cf3802015-06-17 09:44:02 +00001212 addUnwrappedLine();
1213 return;
1214 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00001215 break;
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001216 case tok::kw_typedef:
1217 nextToken();
Daniel Jasper31f6c542014-12-05 10:42:21 +00001218 if (FormatTok->isOneOf(Keywords.kw_NS_ENUM, Keywords.kw_NS_OPTIONS,
Ben Hamiltond9212ef2019-07-22 18:20:01 +00001219 Keywords.kw_CF_ENUM, Keywords.kw_CF_OPTIONS,
Nico Weberff9f4b52019-07-29 13:26:48 +00001220 Keywords.kw_CF_CLOSED_ENUM,
1221 Keywords.kw_NS_CLOSED_ENUM))
Daniel Jaspera88f80a2014-01-30 14:38:37 +00001222 parseEnum();
1223 break;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001224 case tok::kw_struct:
1225 case tok::kw_union:
Manuel Klimek28cacc72013-01-07 18:10:23 +00001226 case tok::kw_class:
Daniel Jasper910807d2015-06-12 04:52:02 +00001227 // parseRecord falls through and does not yet add an unwrapped line as a
1228 // record declaration or definition can start a structural element.
Manuel Klimeke01bab52013-01-15 13:38:33 +00001229 parseRecord();
Paul Hoadcbb726d2019-03-21 13:09:22 +00001230 // This does not apply for Java, JavaScript and C#.
Daniel Jasper910807d2015-06-12 04:52:02 +00001231 if (Style.Language == FormatStyle::LK_Java ||
Paul Hoadcbb726d2019-03-21 13:09:22 +00001232 Style.Language == FormatStyle::LK_JavaScript || Style.isCSharp()) {
Daniel Jasperd5ec65b2016-01-08 07:06:07 +00001233 if (FormatTok->is(tok::semi))
1234 nextToken();
Daniel Jasper910807d2015-06-12 04:52:02 +00001235 addUnwrappedLine();
1236 return;
1237 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00001238 break;
Daniel Jaspere5d74862014-11-26 08:17:08 +00001239 case tok::period:
1240 nextToken();
1241 // In Java, classes have an implicit static member "class".
1242 if (Style.Language == FormatStyle::LK_Java && FormatTok &&
1243 FormatTok->is(tok::kw_class))
1244 nextToken();
Daniel Jasperba52fcb2015-09-28 14:29:45 +00001245 if (Style.Language == FormatStyle::LK_JavaScript && FormatTok &&
1246 FormatTok->Tok.getIdentifierInfo())
1247 // JavaScript only has pseudo keywords, all keywords are allowed to
1248 // appear in "IdentifierName" positions. See http://es5.github.io/#x7.6
1249 nextToken();
Daniel Jaspere5d74862014-11-26 08:17:08 +00001250 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001251 case tok::semi:
1252 nextToken();
1253 addUnwrappedLine();
1254 return;
Alexander Kornienko1231e062013-01-16 11:43:46 +00001255 case tok::r_brace:
1256 addUnwrappedLine();
1257 return;
Daniel Jasperf7935112012-12-03 18:12:45 +00001258 case tok::l_paren:
1259 parseParens();
1260 break;
Daniel Jasper5af04a42015-10-07 03:43:10 +00001261 case tok::kw_operator:
1262 nextToken();
1263 if (FormatTok->isBinaryOperator())
1264 nextToken();
1265 break;
Manuel Klimek516e0542013-09-04 13:25:30 +00001266 case tok::caret:
1267 nextToken();
Daniel Jasper395193c2014-03-28 07:48:59 +00001268 if (FormatTok->Tok.isAnyIdentifier() ||
1269 FormatTok->isSimpleTypeSpecifier())
1270 nextToken();
1271 if (FormatTok->is(tok::l_paren))
1272 parseParens();
1273 if (FormatTok->is(tok::l_brace))
Manuel Klimek516e0542013-09-04 13:25:30 +00001274 parseChildBlock();
Manuel Klimek516e0542013-09-04 13:25:30 +00001275 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001276 case tok::l_brace:
Manuel Klimekab419912013-05-23 09:41:43 +00001277 if (!tryToParseBracedList()) {
1278 // A block outside of parentheses must be the last part of a
1279 // structural element.
1280 // FIXME: Figure out cases where this is not true, and add projections
1281 // for them (the one we know is missing are lambdas).
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001282 if (Style.BraceWrapping.AfterFunction)
Manuel Klimekab419912013-05-23 09:41:43 +00001283 addUnwrappedLine();
Alexander Kornienko3cfa9732013-11-20 16:33:05 +00001284 FormatTok->Type = TT_FunctionLBrace;
Nico Weber9096fc02013-06-26 00:30:14 +00001285 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001286 addUnwrappedLine();
Manuel Klimekab419912013-05-23 09:41:43 +00001287 return;
1288 }
1289 // Otherwise this was a braced init list, and the structural
1290 // element continues.
1291 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001292 case tok::kw_try:
1293 // We arrive here when parsing function-try blocks.
Owen Pancb5ffbe2018-09-28 09:17:00 +00001294 if (Style.BraceWrapping.AfterFunction)
1295 addUnwrappedLine();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001296 parseTryCatch();
1297 return;
Daniel Jasper40e19212013-05-29 13:16:10 +00001298 case tok::identifier: {
Birunthan Mohanathasb001a0b2015-07-03 17:25:16 +00001299 if (FormatTok->is(TT_MacroBlockEnd)) {
1300 addUnwrappedLine();
1301 return;
1302 }
1303
Martin Probst973ff792017-04-27 13:07:24 +00001304 // Function declarations (as opposed to function expressions) are parsed
1305 // on their own unwrapped line by continuing this loop. Function
1306 // expressions (functions that are not on their own line) must not create
1307 // a new unwrapped line, so they are special cased below.
1308 size_t TokenCount = Line->Tokens.size();
Daniel Jasper9326f912015-05-05 08:40:32 +00001309 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst973ff792017-04-27 13:07:24 +00001310 FormatTok->is(Keywords.kw_function) &&
1311 (TokenCount > 1 || (TokenCount == 1 && !Line->Tokens.front().Tok->is(
1312 Keywords.kw_async)))) {
Daniel Jasper069e5f42014-05-20 11:14:57 +00001313 tryToParseJSFunction();
1314 break;
1315 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001316 if ((Style.Language == FormatStyle::LK_JavaScript ||
1317 Style.Language == FormatStyle::LK_Java) &&
1318 FormatTok->is(Keywords.kw_interface)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001319 if (Style.Language == FormatStyle::LK_JavaScript) {
1320 // In JavaScript/TypeScript, "interface" can be used as a standalone
1321 // identifier, e.g. in `var interface = 1;`. If "interface" is
1322 // followed by another identifier, it is very likely to be an actual
1323 // interface declaration.
1324 unsigned StoredPosition = Tokens->getPosition();
1325 FormatToken *Next = Tokens->getNextToken();
1326 FormatTok = Tokens->setPosition(StoredPosition);
Martin Probst533965c2016-04-19 18:19:06 +00001327 if (Next && !mustBeJSIdent(Keywords, Next)) {
Martin Probst1e8261e2016-04-19 18:18:59 +00001328 nextToken();
1329 break;
1330 }
1331 }
Daniel Jasper9326f912015-05-05 08:40:32 +00001332 parseRecord();
Daniel Jasper259188b2015-06-12 04:56:34 +00001333 addUnwrappedLine();
Daniel Jasper5c235c02015-07-06 14:26:04 +00001334 return;
Daniel Jasper9326f912015-05-05 08:40:32 +00001335 }
1336
Francois Ferrand6f40e212018-10-02 16:37:51 +00001337 if (Style.isCpp() && FormatTok->is(TT_StatementMacro)) {
1338 parseStatementMacro();
1339 return;
1340 }
1341
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00001342 // See if the following token should start a new unwrapped line.
Daniel Jasper9326f912015-05-05 08:40:32 +00001343 StringRef Text = FormatTok->TokenText;
Daniel Jasperf7935112012-12-03 18:12:45 +00001344 nextToken();
Owen Pan945890a2019-05-01 15:03:41 +00001345
1346 // JS doesn't have macros, and within classes colons indicate fields, not
1347 // labels.
1348 if (Style.Language == FormatStyle::LK_JavaScript)
1349 break;
1350
1351 TokenCount = Line->Tokens.size();
1352 if (TokenCount == 1 ||
1353 (TokenCount == 2 && Line->Tokens.front().Tok->is(tok::comment))) {
Daniel Jasper676e5162015-04-07 14:36:33 +00001354 if (FormatTok->Tok.is(tok::colon) && !Line->MustBeDeclaration) {
Daniel Jasper40609472016-04-06 15:02:46 +00001355 Line->Tokens.begin()->Tok->MustBreakBefore = true;
Paul Hoad3867a2d2019-09-12 10:07:14 +00001356 parseLabel(!Style.IndentGotoLabels);
Alexander Kornienkode644272013-04-08 22:16:06 +00001357 return;
1358 }
Daniel Jasper680b09b2014-11-05 10:48:04 +00001359 // Recognize function-like macro usages without trailing semicolon as
Daniel Jasper83709082015-02-18 17:14:05 +00001360 // well as free-standing macros like Q_OBJECT.
Daniel Jasper680b09b2014-11-05 10:48:04 +00001361 bool FunctionLike = FormatTok->is(tok::l_paren);
1362 if (FunctionLike)
Alexander Kornienkode644272013-04-08 22:16:06 +00001363 parseParens();
Daniel Jaspere60cba12015-05-13 11:35:53 +00001364
1365 bool FollowedByNewline =
1366 CommentsBeforeNextToken.empty()
1367 ? FormatTok->NewlinesBefore > 0
1368 : CommentsBeforeNextToken.front()->NewlinesBefore > 0;
1369
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001370 if (FollowedByNewline && (Text.size() >= 5 || FunctionLike) &&
Daniel Jasper680b09b2014-11-05 10:48:04 +00001371 tokenCanStartNewLine(FormatTok->Tok) && Text == Text.upper()) {
Daniel Jasper40e19212013-05-29 13:16:10 +00001372 addUnwrappedLine();
Daniel Jasper41a0f782013-05-29 14:09:17 +00001373 return;
Alexander Kornienkode644272013-04-08 22:16:06 +00001374 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001375 }
1376 break;
Daniel Jasper40e19212013-05-29 13:16:10 +00001377 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001378 case tok::equal:
Manuel Klimek79e06082015-05-21 12:23:34 +00001379 // Fat arrows (=>) have tok::TokenKind tok::equal but TokenType
1380 // TT_JsFatArrow. They always start an expression or a child block if
1381 // followed by a curly.
1382 if (FormatTok->is(TT_JsFatArrow)) {
1383 nextToken();
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001384 if (FormatTok->is(tok::l_brace))
Manuel Klimek79e06082015-05-21 12:23:34 +00001385 parseChildBlock();
Manuel Klimek79e06082015-05-21 12:23:34 +00001386 break;
1387 }
1388
Daniel Jaspere25509f2012-12-17 11:29:41 +00001389 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001390 if (FormatTok->Tok.is(tok::l_brace)) {
1391 nextToken();
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001392 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001393 } else if (Style.Language == FormatStyle::LK_Proto &&
Manuel Klimek89628f62017-09-20 09:51:03 +00001394 FormatTok->Tok.is(tok::less)) {
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001395 nextToken();
Krasimir Georgiev0b41fcb2017-06-27 13:58:41 +00001396 parseBracedList(/*ContinueOnSemicolons=*/false,
1397 /*ClosingBraceKind=*/tok::greater);
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001398 }
Daniel Jaspere25509f2012-12-17 11:29:41 +00001399 break;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001400 case tok::l_square:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001401 parseSquare();
Manuel Klimekffdeb592013-09-03 15:10:01 +00001402 break;
Daniel Jasper6acf5132015-03-12 14:44:29 +00001403 case tok::kw_new:
1404 parseNew();
1405 break;
Alexander Kornienkob7076a22012-12-04 14:46:19 +00001406 default:
1407 nextToken();
1408 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001409 }
1410 } while (!eof());
1411}
1412
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001413bool UnwrappedLineParser::tryToParseLambda() {
Daniel Jasper1dbc2102017-03-31 13:30:24 +00001414 if (!Style.isCpp()) {
Daniel Jasper1feab0f2015-06-02 15:31:37 +00001415 nextToken();
1416 return false;
1417 }
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001418 assert(FormatTok->is(tok::l_square));
1419 FormatToken &LSquare = *FormatTok;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001420 if (!tryToParseLambdaIntroducer())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001421 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001422
Krasimir Georgievc416c522019-03-11 16:02:52 +00001423 bool SeenArrow = false;
1424
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00001425 while (FormatTok->isNot(tok::l_brace)) {
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001426 if (FormatTok->isSimpleTypeSpecifier()) {
1427 nextToken();
1428 continue;
1429 }
Manuel Klimekffdeb592013-09-03 15:10:01 +00001430 switch (FormatTok->Tok.getKind()) {
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001431 case tok::l_brace:
1432 break;
1433 case tok::l_paren:
1434 parseParens();
1435 break;
Daniel Jasperbcb55ee2014-11-21 14:08:38 +00001436 case tok::amp:
1437 case tok::star:
1438 case tok::kw_const:
Daniel Jasper3431b752014-12-08 13:22:37 +00001439 case tok::comma:
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001440 case tok::less:
1441 case tok::greater:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001442 case tok::identifier:
Daniel Jasper5eaa0092015-08-13 13:37:08 +00001443 case tok::numeric_constant:
Daniel Jasper1067ab02014-02-11 10:16:55 +00001444 case tok::coloncolon:
Nico Weber41f4d682019-09-13 13:18:55 +00001445 case tok::kw_class:
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001446 case tok::kw_mutable:
Ben Hamilton4e442bb2019-01-30 13:54:32 +00001447 case tok::kw_noexcept:
Nico Weber41f4d682019-09-13 13:18:55 +00001448 case tok::kw_template:
1449 case tok::kw_typename:
Krasimir Georgievc416c522019-03-11 16:02:52 +00001450 nextToken();
1451 break;
Jan Korous88e15142019-03-05 19:27:24 +00001452 // Specialization of a template with an integer parameter can contain
1453 // arithmetic, logical, comparison and ternary operators.
Krasimir Georgievc416c522019-03-11 16:02:52 +00001454 //
1455 // FIXME: This also accepts sequences of operators that are not in the scope
1456 // of a template argument list.
1457 //
1458 // In a C++ lambda a template type can only occur after an arrow. We use
1459 // this as an heuristic to distinguish between Objective-C expressions
1460 // followed by an `a->b` expression, such as:
1461 // ([obj func:arg] + a->b)
1462 // Otherwise the code below would parse as a lambda.
Nico Weber41f4d682019-09-13 13:18:55 +00001463 //
1464 // FIXME: This heuristic is incorrect for C++20 generic lambdas with
1465 // explicit template lists: []<bool b = true && false>(U &&u){}
Jan Korous88e15142019-03-05 19:27:24 +00001466 case tok::plus:
1467 case tok::minus:
1468 case tok::exclaim:
1469 case tok::tilde:
1470 case tok::slash:
1471 case tok::percent:
1472 case tok::lessless:
1473 case tok::pipe:
1474 case tok::pipepipe:
1475 case tok::ampamp:
1476 case tok::caret:
1477 case tok::equalequal:
1478 case tok::exclaimequal:
1479 case tok::greaterequal:
1480 case tok::lessequal:
1481 case tok::question:
1482 case tok::colon:
Paul Hoad10de3952019-03-05 22:20:25 +00001483 case tok::kw_true:
1484 case tok::kw_false:
Krasimir Georgievc416c522019-03-11 16:02:52 +00001485 if (SeenArrow) {
1486 nextToken();
1487 break;
1488 }
1489 return true;
Daniel Jaspercb51cf42014-01-16 09:11:55 +00001490 case tok::arrow:
Ben Hamilton30b7d092019-02-08 15:55:18 +00001491 // This might or might not actually be a lambda arrow (this could be an
1492 // ObjC method invocation followed by a dereferencing arrow). We might
1493 // reset this back to TT_Unknown in TokenAnnotator.
Daniel Jasper6f2b88a2015-06-05 13:18:09 +00001494 FormatTok->Type = TT_LambdaArrow;
Krasimir Georgievc416c522019-03-11 16:02:52 +00001495 SeenArrow = true;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001496 nextToken();
1497 break;
1498 default:
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001499 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001500 }
1501 }
Ronald Wamplera83e2db2019-03-26 20:18:14 +00001502 FormatTok->Type = TT_LambdaLBrace;
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00001503 LSquare.Type = TT_LambdaLSquare;
Manuel Klimek516e0542013-09-04 13:25:30 +00001504 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001505 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001506}
1507
1508bool UnwrappedLineParser::tryToParseLambdaIntroducer() {
Manuel Klimek89628f62017-09-20 09:51:03 +00001509 const FormatToken *Previous = FormatTok->Previous;
Manuel Klimek9f0a4e52017-09-19 09:59:30 +00001510 if (Previous &&
1511 (Previous->isOneOf(tok::identifier, tok::kw_operator, tok::kw_new,
Manuel Klimekd0f3fe52018-04-11 14:51:54 +00001512 tok::kw_delete, tok::l_square) ||
Manuel Klimek89628f62017-09-20 09:51:03 +00001513 FormatTok->isCppStructuredBinding(Style) || Previous->closesScope() ||
1514 Previous->isSimpleTypeSpecifier())) {
Manuel Klimekffdeb592013-09-03 15:10:01 +00001515 nextToken();
Manuel Klimek9f0a4e52017-09-19 09:59:30 +00001516 return false;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001517 }
Manuel Klimek9f0a4e52017-09-19 09:59:30 +00001518 nextToken();
Manuel Klimekd0f3fe52018-04-11 14:51:54 +00001519 if (FormatTok->is(tok::l_square)) {
1520 return false;
1521 }
Manuel Klimek9f0a4e52017-09-19 09:59:30 +00001522 parseSquare(/*LambdaIntroducer=*/true);
1523 return true;
Manuel Klimekffdeb592013-09-03 15:10:01 +00001524}
1525
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001526void UnwrappedLineParser::tryToParseJSFunction() {
Martin Probst409697e2016-05-29 14:41:07 +00001527 assert(FormatTok->is(Keywords.kw_function) ||
1528 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function));
Martin Probst5f8445b2016-04-24 22:05:09 +00001529 if (FormatTok->is(Keywords.kw_async))
1530 nextToken();
1531 // Consume "function".
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001532 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001533
Daniel Jasper71e50af2016-11-01 06:22:59 +00001534 // Consume * (generator function). Treat it like C++'s overloaded operators.
1535 if (FormatTok->is(tok::star)) {
1536 FormatTok->Type = TT_OverloadedOperator;
Martin Probst5f8445b2016-04-24 22:05:09 +00001537 nextToken();
Daniel Jasper71e50af2016-11-01 06:22:59 +00001538 }
Martin Probst5f8445b2016-04-24 22:05:09 +00001539
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001540 // Consume function name.
1541 if (FormatTok->is(tok::identifier))
Daniel Jasperfca735c2015-02-19 16:14:18 +00001542 nextToken();
Daniel Jasper5217a8b2014-06-13 07:02:04 +00001543
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001544 if (FormatTok->isNot(tok::l_paren))
1545 return;
Manuel Klimek79e06082015-05-21 12:23:34 +00001546
1547 // Parse formal parameter list.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001548 parseParens();
Manuel Klimek79e06082015-05-21 12:23:34 +00001549
1550 if (FormatTok->is(tok::colon)) {
1551 // Parse a type definition.
1552 nextToken();
1553
1554 // Eat the type declaration. For braced inline object types, balance braces,
1555 // otherwise just parse until finding an l_brace for the function body.
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001556 if (FormatTok->is(tok::l_brace))
1557 tryToParseBracedList();
1558 else
Martin Probstaf16c502017-01-04 13:36:43 +00001559 while (!FormatTok->isOneOf(tok::l_brace, tok::semi) && !eof())
Manuel Klimek79e06082015-05-21 12:23:34 +00001560 nextToken();
Manuel Klimek79e06082015-05-21 12:23:34 +00001561 }
1562
Martin Probstaf16c502017-01-04 13:36:43 +00001563 if (FormatTok->is(tok::semi))
1564 return;
1565
Manuel Klimek79e06082015-05-21 12:23:34 +00001566 parseChildBlock();
1567}
1568
Daniel Jasper3c883d12015-05-18 14:49:19 +00001569bool UnwrappedLineParser::tryToParseBracedList() {
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001570 if (FormatTok->BlockKind == BK_Unknown)
Daniel Jasper3c883d12015-05-18 14:49:19 +00001571 calculateBraceTypes();
Daniel Jasperb1f74a82013-07-09 09:06:29 +00001572 assert(FormatTok->BlockKind != BK_Unknown);
1573 if (FormatTok->BlockKind == BK_Block)
Manuel Klimekab419912013-05-23 09:41:43 +00001574 return false;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001575 nextToken();
Manuel Klimekab419912013-05-23 09:41:43 +00001576 parseBracedList();
1577 return true;
1578}
1579
Krasimir Georgievff747be2017-06-27 13:43:07 +00001580bool UnwrappedLineParser::parseBracedList(bool ContinueOnSemicolons,
1581 tok::TokenKind ClosingBraceKind) {
Daniel Jasper015ed022013-09-13 09:20:45 +00001582 bool HasError = false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001583
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001584 // FIXME: Once we have an expression parser in the UnwrappedLineParser,
1585 // replace this by using parseAssigmentExpression() inside.
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001586 do {
Manuel Klimek79e06082015-05-21 12:23:34 +00001587 if (Style.Language == FormatStyle::LK_JavaScript) {
Martin Probst409697e2016-05-29 14:41:07 +00001588 if (FormatTok->is(Keywords.kw_function) ||
1589 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001590 tryToParseJSFunction();
1591 continue;
Daniel Jasperbe520bd2015-05-31 08:51:54 +00001592 }
1593 if (FormatTok->is(TT_JsFatArrow)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001594 nextToken();
1595 // Fat arrows can be followed by simple expressions or by child blocks
1596 // in curly braces.
Daniel Jaspere6fcf7d2015-06-17 13:08:06 +00001597 if (FormatTok->is(tok::l_brace)) {
Manuel Klimek79e06082015-05-21 12:23:34 +00001598 parseChildBlock();
1599 continue;
1600 }
1601 }
Martin Probst8e3eba02017-02-07 16:33:13 +00001602 if (FormatTok->is(tok::l_brace)) {
1603 // Could be a method inside of a braced list `{a() { return 1; }}`.
1604 if (tryToParseBracedList())
1605 continue;
1606 parseChildBlock();
1607 }
Daniel Jasperc03e16a2014-05-08 09:25:39 +00001608 }
Krasimir Georgievff747be2017-06-27 13:43:07 +00001609 if (FormatTok->Tok.getKind() == ClosingBraceKind) {
1610 nextToken();
1611 return !HasError;
1612 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001613 switch (FormatTok->Tok.getKind()) {
Manuel Klimek516e0542013-09-04 13:25:30 +00001614 case tok::caret:
1615 nextToken();
1616 if (FormatTok->is(tok::l_brace)) {
1617 parseChildBlock();
1618 }
1619 break;
1620 case tok::l_square:
1621 tryToParseLambda();
1622 break;
Daniel Jaspera87af7a2015-06-30 11:32:22 +00001623 case tok::l_paren:
1624 parseParens();
Daniel Jasperf46dec82015-03-31 14:34:15 +00001625 // JavaScript can just have free standing methods and getters/setters in
1626 // object literals. Detect them by a "{" following ")".
1627 if (Style.Language == FormatStyle::LK_JavaScript) {
Daniel Jasperf46dec82015-03-31 14:34:15 +00001628 if (FormatTok->is(tok::l_brace))
1629 parseChildBlock();
1630 break;
1631 }
Daniel Jasperf46dec82015-03-31 14:34:15 +00001632 break;
Martin Probst8e3eba02017-02-07 16:33:13 +00001633 case tok::l_brace:
1634 // Assume there are no blocks inside a braced init list apart
1635 // from the ones we explicitly parse out (like lambdas).
1636 FormatTok->BlockKind = BK_BracedInit;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001637 nextToken();
Martin Probst8e3eba02017-02-07 16:33:13 +00001638 parseBracedList();
1639 break;
Krasimir Georgievfa4dbb62017-08-03 13:43:45 +00001640 case tok::less:
1641 if (Style.Language == FormatStyle::LK_Proto) {
1642 nextToken();
1643 parseBracedList(/*ContinueOnSemicolons=*/false,
1644 /*ClosingBraceKind=*/tok::greater);
1645 } else {
1646 nextToken();
1647 }
1648 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001649 case tok::semi:
Daniel Jasperb9a49902016-01-09 15:56:28 +00001650 // JavaScript (or more precisely TypeScript) can have semicolons in braced
1651 // lists (in so-called TypeMemberLists). Thus, the semicolon cannot be
1652 // used for error recovery if we have otherwise determined that this is
1653 // a braced list.
1654 if (Style.Language == FormatStyle::LK_JavaScript) {
1655 nextToken();
1656 break;
1657 }
Daniel Jasper015ed022013-09-13 09:20:45 +00001658 HasError = true;
1659 if (!ContinueOnSemicolons)
1660 return !HasError;
1661 nextToken();
1662 break;
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001663 case tok::comma:
1664 nextToken();
Manuel Klimeka3ff45e2013-04-10 09:52:05 +00001665 break;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001666 default:
1667 nextToken();
1668 break;
1669 }
1670 } while (!eof());
Daniel Jasper015ed022013-09-13 09:20:45 +00001671 return false;
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001672}
1673
Daniel Jasperf7935112012-12-03 18:12:45 +00001674void UnwrappedLineParser::parseParens() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001675 assert(FormatTok->Tok.is(tok::l_paren) && "'(' expected.");
Daniel Jasperf7935112012-12-03 18:12:45 +00001676 nextToken();
1677 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001678 switch (FormatTok->Tok.getKind()) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001679 case tok::l_paren:
1680 parseParens();
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001681 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_brace))
1682 parseChildBlock();
Daniel Jasperf7935112012-12-03 18:12:45 +00001683 break;
1684 case tok::r_paren:
1685 nextToken();
1686 return;
Daniel Jasper393564f2013-05-31 14:56:29 +00001687 case tok::r_brace:
1688 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1689 return;
Daniel Jasper9a8d48b2013-09-05 10:04:31 +00001690 case tok::l_square:
1691 tryToParseLambda();
1692 break;
Daniel Jasper5f1fa852015-01-04 20:40:51 +00001693 case tok::l_brace:
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001694 if (!tryToParseBracedList())
Manuel Klimekf017dc02013-09-04 13:34:14 +00001695 parseChildBlock();
Manuel Klimek8e07a1b2013-01-10 11:52:21 +00001696 break;
Nico Weber372d8dc2013-02-10 20:35:35 +00001697 case tok::at:
1698 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001699 if (FormatTok->Tok.is(tok::l_brace)) {
1700 nextToken();
Nico Weber372d8dc2013-02-10 20:35:35 +00001701 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001702 }
Nico Weber372d8dc2013-02-10 20:35:35 +00001703 break;
Martin Probst1027fb82017-02-07 14:05:30 +00001704 case tok::kw_class:
1705 if (Style.Language == FormatStyle::LK_JavaScript)
1706 parseRecord(/*ParseAsExpr=*/true);
1707 else
1708 nextToken();
1709 break;
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001710 case tok::identifier:
1711 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probst409697e2016-05-29 14:41:07 +00001712 (FormatTok->is(Keywords.kw_function) ||
1713 FormatTok->startsSequence(Keywords.kw_async, Keywords.kw_function)))
Daniel Jasper3f69ba12014-09-05 08:42:27 +00001714 tryToParseJSFunction();
1715 else
1716 nextToken();
1717 break;
Daniel Jasperf7935112012-12-03 18:12:45 +00001718 default:
1719 nextToken();
1720 break;
1721 }
1722 } while (!eof());
1723}
1724
Manuel Klimek9f0a4e52017-09-19 09:59:30 +00001725void UnwrappedLineParser::parseSquare(bool LambdaIntroducer) {
1726 if (!LambdaIntroducer) {
1727 assert(FormatTok->Tok.is(tok::l_square) && "'[' expected.");
1728 if (tryToParseLambda())
1729 return;
1730 }
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001731 do {
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001732 switch (FormatTok->Tok.getKind()) {
1733 case tok::l_paren:
1734 parseParens();
1735 break;
1736 case tok::r_square:
1737 nextToken();
1738 return;
1739 case tok::r_brace:
1740 // A "}" inside parenthesis is an error if there wasn't a matching "{".
1741 return;
1742 case tok::l_square:
1743 parseSquare();
1744 break;
1745 case tok::l_brace: {
Daniel Jasperadba2aa2015-05-18 12:52:00 +00001746 if (!tryToParseBracedList())
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001747 parseChildBlock();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001748 break;
1749 }
1750 case tok::at:
1751 nextToken();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001752 if (FormatTok->Tok.is(tok::l_brace)) {
1753 nextToken();
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001754 parseBracedList();
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00001755 }
Daniel Jasperb88b25f2013-12-23 07:29:06 +00001756 break;
1757 default:
1758 nextToken();
1759 break;
1760 }
1761 } while (!eof());
1762}
1763
Daniel Jasperf7935112012-12-03 18:12:45 +00001764void UnwrappedLineParser::parseIfThenElse() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001765 assert(FormatTok->Tok.is(tok::kw_if) && "'if' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001766 nextToken();
Nico Weber1361a4c2019-07-27 02:41:40 +00001767 if (FormatTok->Tok.isOneOf(tok::kw_constexpr, tok::identifier))
Daniel Jasper6a7d5a72017-06-19 07:40:49 +00001768 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001769 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimekadededf2013-01-11 18:28:36 +00001770 parseParens();
Daniel Jasperf7935112012-12-03 18:12:45 +00001771 bool NeedsUnwrappedLine = false;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001772 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001773 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001774 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001775 if (Style.BraceWrapping.BeforeElse)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001776 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001777 else
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001778 NeedsUnwrappedLine = true;
Daniel Jasperf7935112012-12-03 18:12:45 +00001779 } else {
1780 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001781 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001782 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001783 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001784 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001785 if (FormatTok->Tok.is(tok::kw_else)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001786 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001787 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001788 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001789 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00001790 addUnwrappedLine();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001791 } else if (FormatTok->Tok.is(tok::kw_if)) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001792 parseIfThenElse();
1793 } else {
1794 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001795 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001796 parseStructuralElement();
Daniel Jasper451544a2016-05-19 06:30:48 +00001797 if (FormatTok->is(tok::eof))
1798 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001799 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001800 }
1801 } else if (NeedsUnwrappedLine) {
1802 addUnwrappedLine();
1803 }
1804}
1805
Daniel Jasper04a71a42014-05-08 11:58:24 +00001806void UnwrappedLineParser::parseTryCatch() {
Nico Weberfac23712015-02-04 15:26:27 +00001807 assert(FormatTok->isOneOf(tok::kw_try, tok::kw___try) && "'try' expected");
Daniel Jasper04a71a42014-05-08 11:58:24 +00001808 nextToken();
1809 bool NeedsUnwrappedLine = false;
1810 if (FormatTok->is(tok::colon)) {
1811 // We are in a function try block, what comes is an initializer list.
1812 nextToken();
1813 while (FormatTok->is(tok::identifier)) {
1814 nextToken();
1815 if (FormatTok->is(tok::l_paren))
1816 parseParens();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001817 if (FormatTok->is(tok::comma))
1818 nextToken();
1819 }
1820 }
Daniel Jaspere189d462015-01-14 10:48:41 +00001821 // Parse try with resource.
1822 if (Style.Language == FormatStyle::LK_Java && FormatTok->is(tok::l_paren)) {
1823 parseParens();
1824 }
Daniel Jasper04a71a42014-05-08 11:58:24 +00001825 if (FormatTok->is(tok::l_brace)) {
1826 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1827 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001828 if (Style.BraceWrapping.BeforeCatch) {
Daniel Jasper04a71a42014-05-08 11:58:24 +00001829 addUnwrappedLine();
1830 } else {
1831 NeedsUnwrappedLine = true;
1832 }
1833 } else if (!FormatTok->is(tok::kw_catch)) {
1834 // The C++ standard requires a compound-statement after a try.
1835 // If there's none, we try to assume there's a structuralElement
1836 // and try to continue.
Daniel Jasper04a71a42014-05-08 11:58:24 +00001837 addUnwrappedLine();
1838 ++Line->Level;
1839 parseStructuralElement();
1840 --Line->Level;
1841 }
Nico Weber33381f52015-02-07 01:57:32 +00001842 while (1) {
1843 if (FormatTok->is(tok::at))
1844 nextToken();
1845 if (!(FormatTok->isOneOf(tok::kw_catch, Keywords.kw___except,
1846 tok::kw___finally) ||
1847 ((Style.Language == FormatStyle::LK_Java ||
1848 Style.Language == FormatStyle::LK_JavaScript) &&
1849 FormatTok->is(Keywords.kw_finally)) ||
1850 (FormatTok->Tok.isObjCAtKeyword(tok::objc_catch) ||
1851 FormatTok->Tok.isObjCAtKeyword(tok::objc_finally))))
1852 break;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001853 nextToken();
1854 while (FormatTok->isNot(tok::l_brace)) {
1855 if (FormatTok->is(tok::l_paren)) {
1856 parseParens();
1857 continue;
1858 }
Daniel Jasper2bd7a642015-01-19 10:50:51 +00001859 if (FormatTok->isOneOf(tok::semi, tok::r_brace, tok::eof))
Daniel Jasper04a71a42014-05-08 11:58:24 +00001860 return;
1861 nextToken();
1862 }
1863 NeedsUnwrappedLine = false;
1864 CompoundStatementIndenter Indenter(this, Style, Line->Level);
1865 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001866 if (Style.BraceWrapping.BeforeCatch)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001867 addUnwrappedLine();
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001868 else
Daniel Jasper04a71a42014-05-08 11:58:24 +00001869 NeedsUnwrappedLine = true;
Daniel Jasper04a71a42014-05-08 11:58:24 +00001870 }
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001871 if (NeedsUnwrappedLine)
Daniel Jasper04a71a42014-05-08 11:58:24 +00001872 addUnwrappedLine();
Daniel Jasper04a71a42014-05-08 11:58:24 +00001873}
1874
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001875void UnwrappedLineParser::parseNamespace() {
Francois Ferrande8a301f2019-06-06 20:06:23 +00001876 assert(FormatTok->isOneOf(tok::kw_namespace, TT_NamespaceMacro) &&
1877 "'namespace' expected");
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001878
1879 const FormatToken &InitialToken = *FormatTok;
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001880 nextToken();
Francois Ferrande8a301f2019-06-06 20:06:23 +00001881 if (InitialToken.is(TT_NamespaceMacro)) {
1882 parseParens();
1883 } else {
Nico Weber37944132019-07-23 17:49:45 +00001884 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon, tok::kw_inline,
1885 tok::l_square)) {
1886 if (FormatTok->is(tok::l_square))
1887 parseSquare();
1888 else
1889 nextToken();
1890 }
Francois Ferrande8a301f2019-06-06 20:06:23 +00001891 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001892 if (FormatTok->Tok.is(tok::l_brace)) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00001893 if (ShouldBreakBeforeBrace(Style, InitialToken))
Manuel Klimeka8eb9142013-05-13 12:51:40 +00001894 addUnwrappedLine();
1895
Daniel Jasper65ee3472013-07-31 23:16:02 +00001896 bool AddLevel = Style.NamespaceIndentation == FormatStyle::NI_All ||
1897 (Style.NamespaceIndentation == FormatStyle::NI_Inner &&
1898 DeclarationScopeStack.size() > 1);
1899 parseBlock(/*MustBeDeclaration=*/true, AddLevel);
Manuel Klimek046b9302013-02-06 16:08:09 +00001900 // Munch the semicolon after a namespace. This is more common than one would
1901 // think. Puttin the semicolon into its own line is very ugly.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001902 if (FormatTok->Tok.is(tok::semi))
Manuel Klimek046b9302013-02-06 16:08:09 +00001903 nextToken();
Alexander Kornienko578fdd82012-12-06 18:03:27 +00001904 addUnwrappedLine();
1905 }
1906 // FIXME: Add error handling.
1907}
1908
Daniel Jasper6acf5132015-03-12 14:44:29 +00001909void UnwrappedLineParser::parseNew() {
1910 assert(FormatTok->is(tok::kw_new) && "'new' expected");
1911 nextToken();
1912 if (Style.Language != FormatStyle::LK_Java)
1913 return;
1914
1915 // In Java, we can parse everything up to the parens, which aren't optional.
1916 do {
1917 // There should not be a ;, { or } before the new's open paren.
1918 if (FormatTok->isOneOf(tok::semi, tok::l_brace, tok::r_brace))
1919 return;
1920
1921 // Consume the parens.
1922 if (FormatTok->is(tok::l_paren)) {
1923 parseParens();
1924
1925 // If there is a class body of an anonymous class, consume that as child.
1926 if (FormatTok->is(tok::l_brace))
1927 parseChildBlock();
1928 return;
1929 }
1930 nextToken();
1931 } while (!eof());
1932}
1933
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001934void UnwrappedLineParser::parseForOrWhileLoop() {
Daniel Jasper66cb8c52015-05-04 09:22:29 +00001935 assert(FormatTok->isOneOf(tok::kw_for, tok::kw_while, TT_ForEachMacro) &&
Daniel Jaspere1e43192014-04-01 12:55:11 +00001936 "'for', 'while' or foreach macro expected");
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001937 nextToken();
Martin Probsta050f412017-05-18 21:19:29 +00001938 // JS' for await ( ...
Martin Probstbd49e322017-05-15 19:33:20 +00001939 if (Style.Language == FormatStyle::LK_JavaScript &&
Martin Probsta050f412017-05-18 21:19:29 +00001940 FormatTok->is(Keywords.kw_await))
Martin Probstbd49e322017-05-15 19:33:20 +00001941 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001942 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00001943 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001944 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001945 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001946 parseBlock(/*MustBeDeclaration=*/false);
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001947 addUnwrappedLine();
1948 } else {
1949 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001950 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001951 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001952 --Line->Level;
Alexander Kornienko37d6c942012-12-05 15:06:06 +00001953 }
1954}
1955
Daniel Jasperf7935112012-12-03 18:12:45 +00001956void UnwrappedLineParser::parseDoWhile() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001957 assert(FormatTok->Tok.is(tok::kw_do) && "'do' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00001958 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001959 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001960 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Nico Weber9096fc02013-06-26 00:30:14 +00001961 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00001962 if (Style.BraceWrapping.IndentBraces)
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001963 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00001964 } else {
1965 addUnwrappedLine();
Manuel Klimek52b15152013-01-09 15:25:02 +00001966 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001967 parseStructuralElement();
Manuel Klimek52b15152013-01-09 15:25:02 +00001968 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00001969 }
1970
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001971 // FIXME: Add error handling.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001972 if (!FormatTok->Tok.is(tok::kw_while)) {
Alexander Kornienko0ea8e102012-12-04 15:40:36 +00001973 addUnwrappedLine();
1974 return;
1975 }
1976
Daniel Jasperf7935112012-12-03 18:12:45 +00001977 nextToken();
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00001978 parseStructuralElement();
Daniel Jasperf7935112012-12-03 18:12:45 +00001979}
1980
Paul Hoad3867a2d2019-09-12 10:07:14 +00001981void UnwrappedLineParser::parseLabel(bool LeftAlignLabel) {
Daniel Jasperf7935112012-12-03 18:12:45 +00001982 nextToken();
Manuel Klimek52b15152013-01-09 15:25:02 +00001983 unsigned OldLineLevel = Line->Level;
Daniel Jaspera1275122013-03-20 10:23:53 +00001984 if (Line->Level > 1 || (!Line->InPPDirective && Line->Level > 0))
Manuel Klimek52b15152013-01-09 15:25:02 +00001985 --Line->Level;
Paul Hoad3867a2d2019-09-12 10:07:14 +00001986 if (LeftAlignLabel)
1987 Line->Level = 0;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001988 if (CommentsBeforeNextToken.empty() && FormatTok->Tok.is(tok::l_brace)) {
Owen Pan806d5742019-04-08 23:36:25 +00001989 CompoundStatementIndenter Indenter(this, Line->Level,
1990 Style.BraceWrapping.AfterCaseLabel,
1991 Style.BraceWrapping.IndentBraces);
Nico Weber9096fc02013-06-26 00:30:14 +00001992 parseBlock(/*MustBeDeclaration=*/false);
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001993 if (FormatTok->Tok.is(tok::kw_break)) {
Paul Hoadfb13e652019-10-03 18:42:31 +00001994 if (Style.BraceWrapping.AfterControlStatement ==
1995 FormatStyle::BWACS_Always)
Manuel Klimekd3ed59a2013-08-02 21:31:59 +00001996 addUnwrappedLine();
1997 parseStructuralElement();
1998 }
Alexander Kornienko3a33f022013-12-12 09:49:52 +00001999 addUnwrappedLine();
2000 } else {
Daniel Jasper1fe0d5c2015-05-06 15:19:47 +00002001 if (FormatTok->is(tok::semi))
2002 nextToken();
Alexander Kornienko3a33f022013-12-12 09:49:52 +00002003 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00002004 }
Manuel Klimek52b15152013-01-09 15:25:02 +00002005 Line->Level = OldLineLevel;
Daniel Jasper2cce7b72016-04-06 16:41:39 +00002006 if (FormatTok->isNot(tok::l_brace)) {
Daniel Jasper40609472016-04-06 15:02:46 +00002007 parseStructuralElement();
Daniel Jasper2cce7b72016-04-06 16:41:39 +00002008 addUnwrappedLine();
2009 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002010}
2011
2012void UnwrappedLineParser::parseCaseLabel() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002013 assert(FormatTok->Tok.is(tok::kw_case) && "'case' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00002014 // FIXME: fix handling of complex expressions here.
2015 do {
2016 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002017 } while (!eof() && !FormatTok->Tok.is(tok::colon));
Daniel Jasperf7935112012-12-03 18:12:45 +00002018 parseLabel();
2019}
2020
2021void UnwrappedLineParser::parseSwitch() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002022 assert(FormatTok->Tok.is(tok::kw_switch) && "'switch' expected");
Daniel Jasperf7935112012-12-03 18:12:45 +00002023 nextToken();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002024 if (FormatTok->Tok.is(tok::l_paren))
Manuel Klimek9fa8d552013-01-11 19:23:05 +00002025 parseParens();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002026 if (FormatTok->Tok.is(tok::l_brace)) {
Alexander Kornienko3a33f022013-12-12 09:49:52 +00002027 CompoundStatementIndenter Indenter(this, Style, Line->Level);
Daniel Jasper65ee3472013-07-31 23:16:02 +00002028 parseBlock(/*MustBeDeclaration=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +00002029 addUnwrappedLine();
2030 } else {
2031 addUnwrappedLine();
Daniel Jasper516d7972013-07-25 11:31:57 +00002032 ++Line->Level;
Manuel Klimek6b9eeba2013-01-07 14:56:16 +00002033 parseStructuralElement();
Daniel Jasper516d7972013-07-25 11:31:57 +00002034 --Line->Level;
Daniel Jasperf7935112012-12-03 18:12:45 +00002035 }
2036}
2037
2038void UnwrappedLineParser::parseAccessSpecifier() {
2039 nextToken();
Daniel Jasper84c47a12013-11-23 17:53:41 +00002040 // Understand Qt's slots.
Daniel Jasper53395402015-04-07 15:04:40 +00002041 if (FormatTok->isOneOf(Keywords.kw_slots, Keywords.kw_qslots))
Daniel Jasper84c47a12013-11-23 17:53:41 +00002042 nextToken();
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00002043 // Otherwise, we don't know what it is, and we'd better keep the next token.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002044 if (FormatTok->Tok.is(tok::colon))
Alexander Kornienko2ca766f2012-12-10 16:34:48 +00002045 nextToken();
Daniel Jasperf7935112012-12-03 18:12:45 +00002046 addUnwrappedLine();
2047}
2048
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002049bool UnwrappedLineParser::parseEnum() {
Daniel Jasper6be0f552014-11-13 15:56:28 +00002050 // Won't be 'enum' for NS_ENUMs.
2051 if (FormatTok->Tok.is(tok::kw_enum))
Daniel Jasperccb68b42014-11-19 22:38:18 +00002052 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00002053
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002054 // In TypeScript, "enum" can also be used as property name, e.g. in interface
2055 // declarations. An "enum" keyword followed by a colon would be a syntax
2056 // error and thus assume it is just an identifier.
Daniel Jasper87379302016-02-03 05:33:44 +00002057 if (Style.Language == FormatStyle::LK_JavaScript &&
2058 FormatTok->isOneOf(tok::colon, tok::question))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002059 return false;
2060
Paul Hoada87ba1c2019-03-23 14:24:30 +00002061 // In protobuf, "enum" can be used as a field name.
2062 if (Style.Language == FormatStyle::LK_Proto && FormatTok->is(tok::equal))
2063 return false;
2064
Daniel Jasper2b41a822013-08-20 12:42:50 +00002065 // Eat up enum class ...
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002066 if (FormatTok->Tok.is(tok::kw_class) || FormatTok->Tok.is(tok::kw_struct))
2067 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00002068
Daniel Jasper786a5502013-09-06 21:32:35 +00002069 while (FormatTok->Tok.getIdentifierInfo() ||
Daniel Jasperccb68b42014-11-19 22:38:18 +00002070 FormatTok->isOneOf(tok::colon, tok::coloncolon, tok::less,
2071 tok::greater, tok::comma, tok::question)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00002072 nextToken();
2073 // We can have macros or attributes in between 'enum' and the enum name.
Daniel Jasperccb68b42014-11-19 22:38:18 +00002074 if (FormatTok->is(tok::l_paren))
Alexander Kornienkob7076a22012-12-04 14:46:19 +00002075 parseParens();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00002076 if (FormatTok->is(tok::identifier)) {
Manuel Klimek2cec0192013-01-21 19:17:52 +00002077 nextToken();
Daniel Jasperb5a0b852015-06-19 08:17:32 +00002078 // If there are two identifiers in a row, this is likely an elaborate
2079 // return type. In Java, this can be "implements", etc.
Daniel Jasper1dbc2102017-03-31 13:30:24 +00002080 if (Style.isCpp() && FormatTok->is(tok::identifier))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002081 return false;
Daniel Jasperb5a0b852015-06-19 08:17:32 +00002082 }
Manuel Klimek2cec0192013-01-21 19:17:52 +00002083 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00002084
2085 // Just a declaration or something is wrong.
Daniel Jasperccb68b42014-11-19 22:38:18 +00002086 if (FormatTok->isNot(tok::l_brace))
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002087 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00002088 FormatTok->BlockKind = BK_Block;
2089
2090 if (Style.Language == FormatStyle::LK_Java) {
2091 // Java enums are different.
2092 parseJavaEnumBody();
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002093 return true;
2094 }
2095 if (Style.Language == FormatStyle::LK_Proto) {
Daniel Jasperc6dd2732015-07-16 14:25:43 +00002096 parseBlock(/*MustBeDeclaration=*/true);
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002097 return true;
Manuel Klimek2cec0192013-01-21 19:17:52 +00002098 }
Daniel Jasper6be0f552014-11-13 15:56:28 +00002099
2100 // Parse enum body.
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00002101 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00002102 bool HasError = !parseBracedList(/*ContinueOnSemicolons=*/true);
2103 if (HasError) {
2104 if (FormatTok->is(tok::semi))
2105 nextToken();
2106 addUnwrappedLine();
2107 }
Daniel Jasper6f5a1932015-12-29 08:54:23 +00002108 return true;
Daniel Jasper6be0f552014-11-13 15:56:28 +00002109
Daniel Jasper90cf3802015-06-17 09:44:02 +00002110 // There is no addUnwrappedLine() here so that we fall through to parsing a
2111 // structural element afterwards. Thus, in "enum A {} n, m;",
Manuel Klimek2cec0192013-01-21 19:17:52 +00002112 // "} n, m;" will end up in one unwrapped line.
Daniel Jasper6be0f552014-11-13 15:56:28 +00002113}
2114
2115void UnwrappedLineParser::parseJavaEnumBody() {
2116 // Determine whether the enum is simple, i.e. does not have a semicolon or
2117 // constants with class bodies. Simple enums can be formatted like braced
2118 // lists, contracted to a single line, etc.
2119 unsigned StoredPosition = Tokens->getPosition();
2120 bool IsSimple = true;
2121 FormatToken *Tok = Tokens->getNextToken();
2122 while (Tok) {
2123 if (Tok->is(tok::r_brace))
2124 break;
2125 if (Tok->isOneOf(tok::l_brace, tok::semi)) {
2126 IsSimple = false;
2127 break;
2128 }
2129 // FIXME: This will also mark enums with braces in the arguments to enum
2130 // constants as "not simple". This is probably fine in practice, though.
2131 Tok = Tokens->getNextToken();
2132 }
2133 FormatTok = Tokens->setPosition(StoredPosition);
2134
2135 if (IsSimple) {
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00002136 nextToken();
Daniel Jasper6be0f552014-11-13 15:56:28 +00002137 parseBracedList();
Daniel Jasperdf2ff002014-11-02 22:31:39 +00002138 addUnwrappedLine();
Daniel Jasper6be0f552014-11-13 15:56:28 +00002139 return;
2140 }
2141
2142 // Parse the body of a more complex enum.
2143 // First add a line for everything up to the "{".
2144 nextToken();
2145 addUnwrappedLine();
2146 ++Line->Level;
2147
2148 // Parse the enum constants.
2149 while (FormatTok) {
2150 if (FormatTok->is(tok::l_brace)) {
2151 // Parse the constant's class body.
2152 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
2153 /*MunchSemi=*/false);
2154 } else if (FormatTok->is(tok::l_paren)) {
2155 parseParens();
2156 } else if (FormatTok->is(tok::comma)) {
2157 nextToken();
2158 addUnwrappedLine();
2159 } else if (FormatTok->is(tok::semi)) {
2160 nextToken();
2161 addUnwrappedLine();
2162 break;
2163 } else if (FormatTok->is(tok::r_brace)) {
2164 addUnwrappedLine();
2165 break;
2166 } else {
2167 nextToken();
2168 }
2169 }
2170
2171 // Parse the class body after the enum's ";" if any.
2172 parseLevel(/*HasOpeningBrace=*/true);
2173 nextToken();
2174 --Line->Level;
2175 addUnwrappedLine();
Daniel Jasperf7935112012-12-03 18:12:45 +00002176}
2177
Martin Probst1027fb82017-02-07 14:05:30 +00002178void UnwrappedLineParser::parseRecord(bool ParseAsExpr) {
Roman Kashitsyna043ced2014-08-11 12:18:01 +00002179 const FormatToken &InitialToken = *FormatTok;
Manuel Klimek28cacc72013-01-07 18:10:23 +00002180 nextToken();
Daniel Jasper04785d02015-05-06 14:03:02 +00002181
Daniel Jasper04785d02015-05-06 14:03:02 +00002182 // The actual identifier can be a nested name specifier, and in macros
2183 // it is often token-pasted.
2184 while (FormatTok->isOneOf(tok::identifier, tok::coloncolon, tok::hashhash,
2185 tok::kw___attribute, tok::kw___declspec,
2186 tok::kw_alignas) ||
2187 ((Style.Language == FormatStyle::LK_Java ||
2188 Style.Language == FormatStyle::LK_JavaScript) &&
2189 FormatTok->isOneOf(tok::period, tok::comma))) {
Martin Probstcb870c52017-08-01 15:46:10 +00002190 if (Style.Language == FormatStyle::LK_JavaScript &&
2191 FormatTok->isOneOf(Keywords.kw_extends, Keywords.kw_implements)) {
2192 // JavaScript/TypeScript supports inline object types in
2193 // extends/implements positions:
2194 // class Foo implements {bar: number} { }
2195 nextToken();
2196 if (FormatTok->is(tok::l_brace)) {
2197 tryToParseBracedList();
2198 continue;
2199 }
2200 }
Daniel Jasper04785d02015-05-06 14:03:02 +00002201 bool IsNonMacroIdentifier =
2202 FormatTok->is(tok::identifier) &&
2203 FormatTok->TokenText != FormatTok->TokenText.upper();
Manuel Klimeke01bab52013-01-15 13:38:33 +00002204 nextToken();
2205 // We can have macros or attributes in between 'class' and the class name.
Daniel Jasper04785d02015-05-06 14:03:02 +00002206 if (!IsNonMacroIdentifier && FormatTok->Tok.is(tok::l_paren))
Manuel Klimeke01bab52013-01-15 13:38:33 +00002207 parseParens();
Daniel Jasper04785d02015-05-06 14:03:02 +00002208 }
Manuel Klimeke01bab52013-01-15 13:38:33 +00002209
Daniel Jasper04785d02015-05-06 14:03:02 +00002210 // Note that parsing away template declarations here leads to incorrectly
2211 // accepting function declarations as record declarations.
2212 // In general, we cannot solve this problem. Consider:
2213 // class A<int> B() {}
2214 // which can be a function definition or a class definition when B() is a
2215 // macro. If we find enough real-world cases where this is a problem, we
2216 // can parse for the 'template' keyword in the beginning of the statement,
2217 // and thus rule out the record production in case there is no template
2218 // (this would still leave us with an ambiguity between template function
2219 // and class declarations).
Daniel Jasperadba2aa2015-05-18 12:52:00 +00002220 if (FormatTok->isOneOf(tok::colon, tok::less)) {
2221 while (!eof()) {
Daniel Jasper3c883d12015-05-18 14:49:19 +00002222 if (FormatTok->is(tok::l_brace)) {
2223 calculateBraceTypes(/*ExpectClassBody=*/true);
2224 if (!tryToParseBracedList())
2225 break;
2226 }
Daniel Jasper04785d02015-05-06 14:03:02 +00002227 if (FormatTok->Tok.is(tok::semi))
2228 return;
2229 nextToken();
Manuel Klimeke01bab52013-01-15 13:38:33 +00002230 }
2231 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002232 if (FormatTok->Tok.is(tok::l_brace)) {
Martin Probst1027fb82017-02-07 14:05:30 +00002233 if (ParseAsExpr) {
2234 parseChildBlock();
2235 } else {
2236 if (ShouldBreakBeforeBrace(Style, InitialToken))
2237 addUnwrappedLine();
Manuel Klimeka8eb9142013-05-13 12:51:40 +00002238
Martin Probst1027fb82017-02-07 14:05:30 +00002239 parseBlock(/*MustBeDeclaration=*/true, /*AddLevel=*/true,
2240 /*MunchSemi=*/false);
2241 }
Manuel Klimeka8eb9142013-05-13 12:51:40 +00002242 }
Daniel Jasper90cf3802015-06-17 09:44:02 +00002243 // There is no addUnwrappedLine() here so that we fall through to parsing a
2244 // structural element afterwards. Thus, in "class A {} n, m;",
2245 // "} n, m;" will end up in one unwrapped line.
Manuel Klimek28cacc72013-01-07 18:10:23 +00002246}
2247
Ben Hamilton707e68f2018-05-30 15:21:38 +00002248void UnwrappedLineParser::parseObjCMethod() {
2249 assert(FormatTok->Tok.isOneOf(tok::l_paren, tok::identifier) &&
2250 "'(' or identifier expected.");
2251 do {
2252 if (FormatTok->Tok.is(tok::semi)) {
2253 nextToken();
2254 addUnwrappedLine();
2255 return;
2256 } else if (FormatTok->Tok.is(tok::l_brace)) {
Ben Hamilton97034a32018-10-12 19:43:01 +00002257 if (Style.BraceWrapping.AfterFunction)
2258 addUnwrappedLine();
Ben Hamilton707e68f2018-05-30 15:21:38 +00002259 parseBlock(/*MustBeDeclaration=*/false);
2260 addUnwrappedLine();
2261 return;
2262 } else {
2263 nextToken();
2264 }
2265 } while (!eof());
2266}
2267
Nico Weber8696a8d2013-01-09 21:15:03 +00002268void UnwrappedLineParser::parseObjCProtocolList() {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002269 assert(FormatTok->Tok.is(tok::less) && "'<' expected.");
Ben Hamilton1462e842018-04-05 15:26:25 +00002270 do {
Nico Weber8696a8d2013-01-09 21:15:03 +00002271 nextToken();
Ben Hamilton1462e842018-04-05 15:26:25 +00002272 // Early exit in case someone forgot a close angle.
2273 if (FormatTok->isOneOf(tok::semi, tok::l_brace) ||
2274 FormatTok->Tok.isObjCAtKeyword(tok::objc_end))
2275 return;
2276 } while (!eof() && FormatTok->Tok.isNot(tok::greater));
Nico Weber8696a8d2013-01-09 21:15:03 +00002277 nextToken(); // Skip '>'.
2278}
2279
2280void UnwrappedLineParser::parseObjCUntilAtEnd() {
2281 do {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002282 if (FormatTok->Tok.isObjCAtKeyword(tok::objc_end)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00002283 nextToken();
2284 addUnwrappedLine();
2285 break;
2286 }
Daniel Jaspera15da302013-08-28 08:04:23 +00002287 if (FormatTok->is(tok::l_brace)) {
2288 parseBlock(/*MustBeDeclaration=*/false);
2289 // In ObjC interfaces, nothing should be following the "}".
2290 addUnwrappedLine();
Benjamin Kramere21cb742014-01-08 15:59:42 +00002291 } else if (FormatTok->is(tok::r_brace)) {
2292 // Ignore stray "}". parseStructuralElement doesn't consume them.
2293 nextToken();
2294 addUnwrappedLine();
Ben Hamilton707e68f2018-05-30 15:21:38 +00002295 } else if (FormatTok->isOneOf(tok::minus, tok::plus)) {
2296 nextToken();
2297 parseObjCMethod();
Daniel Jaspera15da302013-08-28 08:04:23 +00002298 } else {
2299 parseStructuralElement();
2300 }
Nico Weber8696a8d2013-01-09 21:15:03 +00002301 } while (!eof());
2302}
2303
Nico Weber2ce0ac52013-01-09 23:25:37 +00002304void UnwrappedLineParser::parseObjCInterfaceOrImplementation() {
Nico Weberc068ff72018-01-23 17:10:25 +00002305 assert(FormatTok->Tok.getObjCKeywordID() == tok::objc_interface ||
2306 FormatTok->Tok.getObjCKeywordID() == tok::objc_implementation);
Nico Weber7eecf4b2013-01-09 20:25:35 +00002307 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002308 nextToken(); // interface name
Nico Weber7eecf4b2013-01-09 20:25:35 +00002309
Ben Hamilton1462e842018-04-05 15:26:25 +00002310 // @interface can be followed by a lightweight generic
2311 // specialization list, then either a base class or a category.
2312 if (FormatTok->Tok.is(tok::less)) {
2313 // Unlike protocol lists, generic parameterizations support
2314 // nested angles:
2315 //
2316 // @interface Foo<ValueType : id <NSCopying, NSSecureCoding>> :
2317 // NSObject <NSCopying, NSSecureCoding>
2318 //
2319 // so we need to count how many open angles we have left.
2320 unsigned NumOpenAngles = 1;
2321 do {
2322 nextToken();
2323 // Early exit in case someone forgot a close angle.
2324 if (FormatTok->isOneOf(tok::semi, tok::l_brace) ||
2325 FormatTok->Tok.isObjCAtKeyword(tok::objc_end))
2326 break;
2327 if (FormatTok->Tok.is(tok::less))
2328 ++NumOpenAngles;
2329 else if (FormatTok->Tok.is(tok::greater)) {
2330 assert(NumOpenAngles > 0 && "'>' makes NumOpenAngles negative");
2331 --NumOpenAngles;
2332 }
2333 } while (!eof() && NumOpenAngles != 0);
2334 nextToken(); // Skip '>'.
2335 }
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002336 if (FormatTok->Tok.is(tok::colon)) {
Nico Weber7eecf4b2013-01-09 20:25:35 +00002337 nextToken();
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002338 nextToken(); // base class name
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002339 } else if (FormatTok->Tok.is(tok::l_paren))
Nico Weber7eecf4b2013-01-09 20:25:35 +00002340 // Skip category, if present.
2341 parseParens();
2342
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002343 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002344 parseObjCProtocolList();
Nico Weber7eecf4b2013-01-09 20:25:35 +00002345
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002346 if (FormatTok->Tok.is(tok::l_brace)) {
Daniel Jasperc1bc38e2015-09-29 14:57:55 +00002347 if (Style.BraceWrapping.AfterObjCDeclaration)
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002348 addUnwrappedLine();
Nico Weber9096fc02013-06-26 00:30:14 +00002349 parseBlock(/*MustBeDeclaration=*/true);
Dinesh Dwivediea3aca82014-05-02 17:01:46 +00002350 }
Nico Weber7eecf4b2013-01-09 20:25:35 +00002351
2352 // With instance variables, this puts '}' on its own line. Without instance
2353 // variables, this ends the @interface line.
2354 addUnwrappedLine();
2355
Nico Weber8696a8d2013-01-09 21:15:03 +00002356 parseObjCUntilAtEnd();
2357}
Nico Weber7eecf4b2013-01-09 20:25:35 +00002358
Nico Weberc068ff72018-01-23 17:10:25 +00002359// Returns true for the declaration/definition form of @protocol,
2360// false for the expression form.
2361bool UnwrappedLineParser::parseObjCProtocol() {
2362 assert(FormatTok->Tok.getObjCKeywordID() == tok::objc_protocol);
Nico Weber8696a8d2013-01-09 21:15:03 +00002363 nextToken();
Nico Weberc068ff72018-01-23 17:10:25 +00002364
2365 if (FormatTok->is(tok::l_paren))
2366 // The expression form of @protocol, e.g. "Protocol* p = @protocol(foo);".
2367 return false;
2368
2369 // The definition/declaration form,
2370 // @protocol Foo
2371 // - (int)someMethod;
2372 // @end
2373
Daniel Jasperd1ae3582013-03-20 12:37:50 +00002374 nextToken(); // protocol name
Nico Weber8696a8d2013-01-09 21:15:03 +00002375
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002376 if (FormatTok->Tok.is(tok::less))
Nico Weber8696a8d2013-01-09 21:15:03 +00002377 parseObjCProtocolList();
2378
2379 // Check for protocol declaration.
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002380 if (FormatTok->Tok.is(tok::semi)) {
Nico Weber8696a8d2013-01-09 21:15:03 +00002381 nextToken();
Nico Weberc068ff72018-01-23 17:10:25 +00002382 addUnwrappedLine();
2383 return true;
Nico Weber8696a8d2013-01-09 21:15:03 +00002384 }
2385
2386 addUnwrappedLine();
2387 parseObjCUntilAtEnd();
Nico Weberc068ff72018-01-23 17:10:25 +00002388 return true;
Nico Weber7eecf4b2013-01-09 20:25:35 +00002389}
2390
Daniel Jasperfca735c2015-02-19 16:14:18 +00002391void UnwrappedLineParser::parseJavaScriptEs6ImportExport() {
Martin Probst053f1aa2016-04-19 14:55:37 +00002392 bool IsImport = FormatTok->is(Keywords.kw_import);
2393 assert(IsImport || FormatTok->is(tok::kw_export));
Daniel Jasper354aa512015-02-19 16:07:32 +00002394 nextToken();
Daniel Jasperfca735c2015-02-19 16:14:18 +00002395
Daniel Jasperec05fc72015-05-11 09:14:50 +00002396 // Consume the "default" in "export default class/function".
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002397 if (FormatTok->is(tok::kw_default))
2398 nextToken();
Daniel Jasperec05fc72015-05-11 09:14:50 +00002399
Martin Probst5f8445b2016-04-24 22:05:09 +00002400 // Consume "async function", "function" and "default function", so that these
2401 // get parsed as free-standing JS functions, i.e. do not require a trailing
2402 // semicolon.
2403 if (FormatTok->is(Keywords.kw_async))
2404 nextToken();
Daniel Jasper668c7bb2015-05-11 09:03:10 +00002405 if (FormatTok->is(Keywords.kw_function)) {
2406 nextToken();
2407 return;
2408 }
2409
Martin Probst053f1aa2016-04-19 14:55:37 +00002410 // For imports, `export *`, `export {...}`, consume the rest of the line up
2411 // to the terminating `;`. For everything else, just return and continue
2412 // parsing the structural element, i.e. the declaration or expression for
2413 // `export default`.
2414 if (!IsImport && !FormatTok->isOneOf(tok::l_brace, tok::star) &&
2415 !FormatTok->isStringLiteral())
2416 return;
Daniel Jasperfca735c2015-02-19 16:14:18 +00002417
Martin Probstd40bca42017-01-09 08:56:36 +00002418 while (!eof()) {
2419 if (FormatTok->is(tok::semi))
2420 return;
Krasimir Georgiev112c2e92017-11-09 13:22:03 +00002421 if (Line->Tokens.empty()) {
Martin Probstd40bca42017-01-09 08:56:36 +00002422 // Common issue: Automatic Semicolon Insertion wrapped the line, so the
2423 // import statement should terminate.
2424 return;
2425 }
Daniel Jasperefc1a832016-01-07 08:53:35 +00002426 if (FormatTok->is(tok::l_brace)) {
2427 FormatTok->BlockKind = BK_Block;
Krasimir Georgiev26b144c2017-07-03 15:05:14 +00002428 nextToken();
Daniel Jasperefc1a832016-01-07 08:53:35 +00002429 parseBracedList();
2430 } else {
2431 nextToken();
2432 }
Daniel Jasper354aa512015-02-19 16:07:32 +00002433 }
2434}
2435
Paul Hoad5bcf99b2019-03-01 09:09:54 +00002436void UnwrappedLineParser::parseStatementMacro() {
Francois Ferrand6f40e212018-10-02 16:37:51 +00002437 nextToken();
2438 if (FormatTok->is(tok::l_paren))
2439 parseParens();
2440 if (FormatTok->is(tok::semi))
2441 nextToken();
2442 addUnwrappedLine();
2443}
2444
Daniel Jasper3b203a62013-09-05 16:05:56 +00002445LLVM_ATTRIBUTE_UNUSED static void printDebugInfo(const UnwrappedLine &Line,
2446 StringRef Prefix = "") {
Krasimir Georgiev9ad83fe2017-10-30 14:01:50 +00002447 llvm::dbgs() << Prefix << "Line(" << Line.Level
2448 << ", FSC=" << Line.FirstStartColumn << ")"
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002449 << (Line.InPPDirective ? " MACRO" : "") << ": ";
2450 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2451 E = Line.Tokens.end();
2452 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002453 llvm::dbgs() << I->Tok->Tok.getName() << "["
Manuel Klimek89628f62017-09-20 09:51:03 +00002454 << "T=" << I->Tok->Type << ", OC=" << I->Tok->OriginalColumn
2455 << "] ";
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002456 }
2457 for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
2458 E = Line.Tokens.end();
2459 I != E; ++I) {
2460 const UnwrappedLineNode &Node = *I;
2461 for (SmallVectorImpl<UnwrappedLine>::const_iterator
2462 I = Node.Children.begin(),
2463 E = Node.Children.end();
2464 I != E; ++I) {
2465 printDebugInfo(*I, "\nChild: ");
2466 }
2467 }
2468 llvm::dbgs() << "\n";
2469}
2470
Daniel Jasperf7935112012-12-03 18:12:45 +00002471void UnwrappedLineParser::addUnwrappedLine() {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002472 if (Line->Tokens.empty())
Daniel Jasper7c85fde2013-01-08 14:56:18 +00002473 return;
Nicola Zaghen3538b392018-05-15 13:30:56 +00002474 LLVM_DEBUG({
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002475 if (CurrentLines == &Lines)
2476 printDebugInfo(*Line);
Manuel Klimekab3dc002013-01-16 12:31:12 +00002477 });
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002478 CurrentLines->push_back(std::move(*Line));
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00002479 Line->Tokens.clear();
Krasimir Georgiev85c37042017-03-01 16:38:08 +00002480 Line->MatchingOpeningBlockLineIndex = UnwrappedLine::kInvalidIndex;
Krasimir Georgiev9ad83fe2017-10-30 14:01:50 +00002481 Line->FirstStartColumn = 0;
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002482 if (CurrentLines == &Lines && !PreprocessorDirectives.empty()) {
Benjamin Kramerc7551a42015-05-31 11:18:05 +00002483 CurrentLines->append(
2484 std::make_move_iterator(PreprocessorDirectives.begin()),
2485 std::make_move_iterator(PreprocessorDirectives.end()));
Manuel Klimekd3b92fa2013-01-18 14:04:34 +00002486 PreprocessorDirectives.clear();
2487 }
Manuel Klimeke411aa82017-09-20 09:29:37 +00002488 // Disconnect the current token from the last token on the previous line.
2489 FormatTok->Previous = nullptr;
Daniel Jasperf7935112012-12-03 18:12:45 +00002490}
2491
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002492bool UnwrappedLineParser::eof() const { return FormatTok->Tok.is(tok::eof); }
Daniel Jasperf7935112012-12-03 18:12:45 +00002493
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002494bool UnwrappedLineParser::isOnNewLine(const FormatToken &FormatTok) {
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002495 return (Line->InPPDirective || FormatTok.HasUnescapedNewline) &&
2496 FormatTok.NewlinesBefore > 0;
2497}
2498
Krasimir Georgiev91834222017-01-25 13:58:58 +00002499// Checks if \p FormatTok is a line comment that continues the line comment
2500// section on \p Line.
Krasimir Georgievea222a72017-05-22 10:07:56 +00002501static bool continuesLineCommentSection(const FormatToken &FormatTok,
2502 const UnwrappedLine &Line,
2503 llvm::Regex &CommentPragmasRegex) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002504 if (Line.Tokens.empty())
2505 return false;
Krasimir Georgiev84321612017-01-30 19:18:55 +00002506
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002507 StringRef IndentContent = FormatTok.TokenText;
2508 if (FormatTok.TokenText.startswith("//") ||
2509 FormatTok.TokenText.startswith("/*"))
2510 IndentContent = FormatTok.TokenText.substr(2);
2511 if (CommentPragmasRegex.match(IndentContent))
2512 return false;
2513
Krasimir Georgiev91834222017-01-25 13:58:58 +00002514 // If Line starts with a line comment, then FormatTok continues the comment
Krasimir Georgiev84321612017-01-30 19:18:55 +00002515 // section if its original column is greater or equal to the original start
Krasimir Georgiev91834222017-01-25 13:58:58 +00002516 // column of the line.
2517 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002518 // Define the min column token of a line as follows: if a line ends in '{' or
2519 // contains a '{' followed by a line comment, then the min column token is
2520 // that '{'. Otherwise, the min column token of the line is the first token of
2521 // the line.
2522 //
2523 // If Line starts with a token other than a line comment, then FormatTok
2524 // continues the comment section if its original column is greater than the
2525 // original start column of the min column token of the line.
Krasimir Georgiev91834222017-01-25 13:58:58 +00002526 //
2527 // For example, the second line comment continues the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002528 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002529 // // first line
2530 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002531 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002532 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002533 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002534 // // first line
2535 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002536 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002537 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002538 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002539 // int i; // first line
2540 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002541 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002542 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002543 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002544 // do { // first line
2545 // // second line
2546 // int i;
2547 // } while (true);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002548 //
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002549 // and:
2550 //
2551 // enum {
2552 // a, // first line
2553 // // second line
2554 // b
2555 // };
2556 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002557 // The second line comment doesn't continue the first in these cases:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002558 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002559 // // first line
2560 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002561 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002562 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002563 //
Krasimir Georgiev91834222017-01-25 13:58:58 +00002564 // int i; // first line
2565 // // second line
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002566 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002567 // and:
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002568 //
Krasimir Georgiev84321612017-01-30 19:18:55 +00002569 // do { // first line
2570 // // second line
2571 // int i;
2572 // } while (true);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002573 //
2574 // and:
2575 //
2576 // enum {
2577 // a, // first line
2578 // // second line
2579 // };
Krasimir Georgiev84321612017-01-30 19:18:55 +00002580 const FormatToken *MinColumnToken = Line.Tokens.front().Tok;
2581
2582 // Scan for '{//'. If found, use the column of '{' as a min column for line
2583 // comment section continuation.
2584 const FormatToken *PreviousToken = nullptr;
Krasimir Georgievd86c25d2017-03-10 13:09:29 +00002585 for (const UnwrappedLineNode &Node : Line.Tokens) {
Krasimir Georgiev84321612017-01-30 19:18:55 +00002586 if (PreviousToken && PreviousToken->is(tok::l_brace) &&
2587 isLineComment(*Node.Tok)) {
2588 MinColumnToken = PreviousToken;
2589 break;
2590 }
2591 PreviousToken = Node.Tok;
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002592
2593 // Grab the last newline preceding a token in this unwrapped line.
2594 if (Node.Tok->NewlinesBefore > 0) {
2595 MinColumnToken = Node.Tok;
2596 }
Krasimir Georgiev84321612017-01-30 19:18:55 +00002597 }
2598 if (PreviousToken && PreviousToken->is(tok::l_brace)) {
2599 MinColumnToken = PreviousToken;
2600 }
2601
Krasimir Georgievea222a72017-05-22 10:07:56 +00002602 return continuesLineComment(FormatTok, /*Previous=*/Line.Tokens.back().Tok,
2603 MinColumnToken);
Krasimir Georgiev91834222017-01-25 13:58:58 +00002604}
2605
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002606void UnwrappedLineParser::flushComments(bool NewlineBeforeNext) {
2607 bool JustComments = Line->Tokens.empty();
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002608 for (SmallVectorImpl<FormatToken *>::const_iterator
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002609 I = CommentsBeforeNextToken.begin(),
2610 E = CommentsBeforeNextToken.end();
2611 I != E; ++I) {
Krasimir Georgiev91834222017-01-25 13:58:58 +00002612 // Line comments that belong to the same line comment section are put on the
2613 // same line since later we might want to reflow content between them.
Krasimir Georgiev753625b2017-01-31 13:32:38 +00002614 // Additional fine-grained breaking of line comment sections is controlled
2615 // by the class BreakableLineCommentSection in case it is desirable to keep
2616 // several line comment sections in the same unwrapped line.
2617 //
2618 // FIXME: Consider putting separate line comment sections as children to the
2619 // unwrapped line instead.
Krasimir Georgiev00c5c722017-02-02 15:32:19 +00002620 (*I)->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002621 continuesLineCommentSection(**I, *Line, CommentPragmasRegex);
Krasimir Georgievb6ccd382017-02-02 14:36:50 +00002622 if (isOnNewLine(**I) && JustComments && !(*I)->ContinuesLineCommentSection)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002623 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002624 pushToken(*I);
2625 }
Daniel Jaspere60cba12015-05-13 11:35:53 +00002626 if (NewlineBeforeNext && JustComments)
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002627 addUnwrappedLine();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002628 CommentsBeforeNextToken.clear();
2629}
2630
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002631void UnwrappedLineParser::nextToken(int LevelDifference) {
Daniel Jasperf7935112012-12-03 18:12:45 +00002632 if (eof())
2633 return;
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002634 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002635 pushToken(FormatTok);
Manuel Klimek89628f62017-09-20 09:51:03 +00002636 FormatToken *Previous = FormatTok;
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00002637 if (Style.Language != FormatStyle::LK_JavaScript)
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002638 readToken(LevelDifference);
Daniel Jasper1dcbbcfc2016-03-14 19:21:36 +00002639 else
2640 readTokenWithJavaScriptASI();
Manuel Klimeke411aa82017-09-20 09:29:37 +00002641 FormatTok->Previous = Previous;
Daniel Jasperb9a49902016-01-09 15:56:28 +00002642}
2643
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002644void UnwrappedLineParser::distributeComments(
2645 const SmallVectorImpl<FormatToken *> &Comments,
2646 const FormatToken *NextTok) {
2647 // Whether or not a line comment token continues a line is controlled by
Krasimir Georgievea222a72017-05-22 10:07:56 +00002648 // the method continuesLineCommentSection, with the following caveat:
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002649 //
2650 // Define a trail of Comments to be a nonempty proper postfix of Comments such
2651 // that each comment line from the trail is aligned with the next token, if
2652 // the next token exists. If a trail exists, the beginning of the maximal
2653 // trail is marked as a start of a new comment section.
2654 //
2655 // For example in this code:
2656 //
2657 // int a; // line about a
2658 // // line 1 about b
2659 // // line 2 about b
2660 // int b;
2661 //
2662 // the two lines about b form a maximal trail, so there are two sections, the
2663 // first one consisting of the single comment "// line about a" and the
2664 // second one consisting of the next two comments.
2665 if (Comments.empty())
2666 return;
2667 bool ShouldPushCommentsInCurrentLine = true;
2668 bool HasTrailAlignedWithNextToken = false;
2669 unsigned StartOfTrailAlignedWithNextToken = 0;
2670 if (NextTok) {
2671 // We are skipping the first element intentionally.
2672 for (unsigned i = Comments.size() - 1; i > 0; --i) {
2673 if (Comments[i]->OriginalColumn == NextTok->OriginalColumn) {
2674 HasTrailAlignedWithNextToken = true;
2675 StartOfTrailAlignedWithNextToken = i;
2676 }
2677 }
2678 }
2679 for (unsigned i = 0, e = Comments.size(); i < e; ++i) {
2680 FormatToken *FormatTok = Comments[i];
Manuel Klimek89628f62017-09-20 09:51:03 +00002681 if (HasTrailAlignedWithNextToken && i == StartOfTrailAlignedWithNextToken) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002682 FormatTok->ContinuesLineCommentSection = false;
2683 } else {
2684 FormatTok->ContinuesLineCommentSection =
Krasimir Georgievea222a72017-05-22 10:07:56 +00002685 continuesLineCommentSection(*FormatTok, *Line, CommentPragmasRegex);
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002686 }
2687 if (!FormatTok->ContinuesLineCommentSection &&
2688 (isOnNewLine(*FormatTok) || FormatTok->IsFirst)) {
2689 ShouldPushCommentsInCurrentLine = false;
2690 }
2691 if (ShouldPushCommentsInCurrentLine) {
2692 pushToken(FormatTok);
2693 } else {
2694 CommentsBeforeNextToken.push_back(FormatTok);
2695 }
2696 }
2697}
2698
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002699void UnwrappedLineParser::readToken(int LevelDifference) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002700 SmallVector<FormatToken *, 1> Comments;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002701 do {
2702 FormatTok = Tokens->getNextToken();
Alexander Kornienkoc2ee9cf2014-03-13 13:59:48 +00002703 assert(FormatTok);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002704 while (!Line->InPPDirective && FormatTok->Tok.is(tok::hash) &&
2705 (FormatTok->HasUnescapedNewline || FormatTok->IsFirst)) {
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002706 distributeComments(Comments, FormatTok);
2707 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002708 // If there is an unfinished unwrapped line, we flush the preprocessor
2709 // directives only after that unwrapped line was finished later.
Daniel Jasper29d39d52015-02-08 09:34:49 +00002710 bool SwitchToPreprocessorLines = !Line->Tokens.empty();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002711 ScopedLineState BlockState(*this, SwitchToPreprocessorLines);
Krasimir Georgiev3e051052017-07-24 14:51:59 +00002712 assert((LevelDifference >= 0 ||
2713 static_cast<unsigned>(-LevelDifference) <= Line->Level) &&
2714 "LevelDifference makes Line->Level negative");
2715 Line->Level += LevelDifference;
Alexander Kornienkob1be9d62013-04-03 12:38:53 +00002716 // Comments stored before the preprocessor directive need to be output
2717 // before the preprocessor directive, at the same level as the
2718 // preprocessor directive, as we consider them to apply to the directive.
Paul Hoad701a0d72019-03-20 20:49:43 +00002719 if (Style.IndentPPDirectives == FormatStyle::PPDIS_BeforeHash &&
2720 PPBranchLevel > 0)
2721 Line->Level += PPBranchLevel;
Manuel Klimek1fcbe672014-04-11 12:27:47 +00002722 flushComments(isOnNewLine(*FormatTok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002723 parsePPDirective();
2724 }
Manuel Klimek68b03042014-04-14 09:14:11 +00002725 while (FormatTok->Type == TT_ConflictStart ||
2726 FormatTok->Type == TT_ConflictEnd ||
2727 FormatTok->Type == TT_ConflictAlternative) {
2728 if (FormatTok->Type == TT_ConflictStart) {
2729 conditionalCompilationStart(/*Unreachable=*/false);
2730 } else if (FormatTok->Type == TT_ConflictAlternative) {
2731 conditionalCompilationAlternative();
Daniel Jasperb05a81d2014-05-09 13:11:16 +00002732 } else if (FormatTok->Type == TT_ConflictEnd) {
Manuel Klimek68b03042014-04-14 09:14:11 +00002733 conditionalCompilationEnd();
2734 }
2735 FormatTok = Tokens->getNextToken();
2736 FormatTok->MustBreakBefore = true;
2737 }
Alexander Kornienkof2e02122013-05-24 18:24:24 +00002738
Francois Ferranda98a95c2017-07-28 07:56:14 +00002739 if (!PPStack.empty() && (PPStack.back().Kind == PP_Unreachable) &&
Alexander Kornienkof2e02122013-05-24 18:24:24 +00002740 !Line->InPPDirective) {
2741 continue;
2742 }
2743
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002744 if (!FormatTok->Tok.is(tok::comment)) {
2745 distributeComments(Comments, FormatTok);
2746 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002747 return;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002748 }
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002749
2750 Comments.push_back(FormatTok);
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002751 } while (!eof());
Krasimir Georgievf62f9582017-02-08 10:30:44 +00002752
2753 distributeComments(Comments, nullptr);
2754 Comments.clear();
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002755}
2756
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00002757void UnwrappedLineParser::pushToken(FormatToken *Tok) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002758 Line->Tokens.push_back(UnwrappedLineNode(Tok));
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002759 if (MustBreakBeforeNextToken) {
Daniel Jasper9fe0e8d2013-09-05 09:29:45 +00002760 Line->Tokens.back().Tok->MustBreakBefore = true;
Manuel Klimekf92f7bc2013-01-22 16:31:55 +00002761 MustBreakBeforeNextToken = false;
Manuel Klimek1abf7892013-01-04 23:34:14 +00002762 }
Daniel Jasperf7935112012-12-03 18:12:45 +00002763}
2764
Daniel Jasper8d1832e2013-01-07 13:26:07 +00002765} // end namespace format
2766} // end namespace clang