blob: 24e2b1f87ec0c416ace8eda8a6b541ba98cd13f7 [file] [log] [blame]
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements a token annotator, i.e. creates
12/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
13///
14//===----------------------------------------------------------------------===//
15
16#include "TokenAnnotator.h"
17#include "clang/Basic/SourceManager.h"
18#include "clang/Lex/Lexer.h"
19
20namespace clang {
21namespace format {
22
Nico Weberee0feec2013-02-05 16:21:00 +000023static bool isUnaryOperator(const AnnotatedToken &Tok) {
24 switch (Tok.FormatTok.Tok.getKind()) {
25 case tok::plus:
26 case tok::plusplus:
27 case tok::minus:
28 case tok::minusminus:
29 case tok::exclaim:
30 case tok::tilde:
31 case tok::kw_sizeof:
32 case tok::kw_alignof:
33 return true;
34 default:
35 return false;
36 }
37}
38
Daniel Jasper32d28ee2013-01-29 21:01:14 +000039static bool isBinaryOperator(const AnnotatedToken &Tok) {
40 // Comma is a binary operator, but does not behave as such wrt. formatting.
41 return getPrecedence(Tok) > prec::Comma;
42}
43
Daniel Jasper01786732013-02-04 07:21:18 +000044// Returns the previous token ignoring comments.
Nico Weber4ed7f3e2013-02-06 16:54:35 +000045static AnnotatedToken *getPreviousToken(AnnotatedToken &Tok) {
46 AnnotatedToken *PrevToken = Tok.Parent;
Daniel Jasper01786732013-02-04 07:21:18 +000047 while (PrevToken != NULL && PrevToken->is(tok::comment))
48 PrevToken = PrevToken->Parent;
49 return PrevToken;
50}
Nico Weber4ed7f3e2013-02-06 16:54:35 +000051static const AnnotatedToken *getPreviousToken(const AnnotatedToken &Tok) {
52 return getPreviousToken(const_cast<AnnotatedToken &>(Tok));
53}
Daniel Jasper01786732013-02-04 07:21:18 +000054
Daniel Jasper29f123b2013-02-08 15:28:42 +000055static bool isTrailingComment(AnnotatedToken *Tok) {
56 return Tok != NULL && Tok->is(tok::comment) &&
57 (Tok->Children.empty() ||
58 Tok->Children[0].FormatTok.NewlinesBefore > 0);
59}
60
Daniel Jasper01786732013-02-04 07:21:18 +000061// Returns the next token ignoring comments.
62static const AnnotatedToken *getNextToken(const AnnotatedToken &Tok) {
63 if (Tok.Children.empty())
64 return NULL;
65 const AnnotatedToken *NextToken = &Tok.Children[0];
66 while (NextToken->is(tok::comment)) {
67 if (NextToken->Children.empty())
68 return NULL;
69 NextToken = &NextToken->Children[0];
70 }
71 return NextToken;
72}
73
Alexander Kornienkoe74de282013-03-13 14:41:29 +000074static bool closesScope(const AnnotatedToken &Tok) {
75 return Tok.isOneOf(tok::r_paren, tok::r_brace, tok::r_square) ||
76 Tok.Type == TT_TemplateCloser;
77}
78
79static bool opensScope(const AnnotatedToken &Tok) {
80 return Tok.isOneOf(tok::l_paren, tok::l_brace, tok::l_square) ||
81 Tok.Type == TT_TemplateOpener;
82}
83
Daniel Jasper32d28ee2013-01-29 21:01:14 +000084/// \brief A parser that gathers additional information about tokens.
85///
/// The \c TokenAnnotator tries to match parentheses and square brackets and
/// store the parenthesis levels. It also tries to resolve matching "<" and ">"
/// into template parameter lists.
89class AnnotatingParser {
90public:
Nico Weberc2e6d2a2013-02-11 15:32:15 +000091 AnnotatingParser(SourceManager &SourceMgr, Lexer &Lex, AnnotatedLine &Line,
92 IdentifierInfo &Ident_in)
Daniel Jasper01786732013-02-04 07:21:18 +000093 : SourceMgr(SourceMgr), Lex(Lex), Line(Line), CurrentToken(&Line.First),
Nico Weberc2e6d2a2013-02-11 15:32:15 +000094 KeywordVirtualFound(false), Ident_in(Ident_in) {
Daniel Jasper923ebef2013-03-14 13:45:21 +000095 Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/ false));
Daniel Jasper32d28ee2013-01-29 21:01:14 +000096 }
97
Nico Weber95e8e462013-02-12 16:17:07 +000098private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +000099 bool parseAngle() {
100 if (CurrentToken == NULL)
101 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000102 ScopedContextCreator ContextCreator(*this, tok::less, 10);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000103 AnnotatedToken *Left = CurrentToken->Parent;
Daniel Jasper4e778092013-02-06 10:05:46 +0000104 Contexts.back().IsExpression = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000105 while (CurrentToken != NULL) {
106 if (CurrentToken->is(tok::greater)) {
107 Left->MatchingParen = CurrentToken;
108 CurrentToken->MatchingParen = Left;
109 CurrentToken->Type = TT_TemplateCloser;
110 next();
111 return true;
112 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000113 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace,
114 tok::pipepipe, tok::ampamp, tok::question,
115 tok::colon))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000116 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000117 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000118 if (!consumeToken())
119 return false;
120 }
121 return false;
122 }
123
124 bool parseParens(bool LookForDecls = false) {
125 if (CurrentToken == NULL)
126 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000127 ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
Daniel Jasper4e778092013-02-06 10:05:46 +0000128
129 // FIXME: This is a bit of a hack. Do better.
130 Contexts.back().ColonIsForRangeExpr =
131 Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
132
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000133 bool StartsObjCMethodExpr = false;
134 AnnotatedToken *Left = CurrentToken->Parent;
135 if (CurrentToken->is(tok::caret)) {
136 // ^( starts a block.
137 Left->Type = TT_ObjCBlockLParen;
138 } else if (AnnotatedToken *MaybeSel = Left->Parent) {
139 // @selector( starts a selector.
140 if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Parent &&
141 MaybeSel->Parent->is(tok::at)) {
142 StartsObjCMethodExpr = true;
143 }
144 }
145
Daniel Jasper4e778092013-02-06 10:05:46 +0000146 if (StartsObjCMethodExpr) {
147 Contexts.back().ColonIsObjCMethodExpr = true;
148 Left->Type = TT_ObjCMethodExpr;
149 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000150
151 while (CurrentToken != NULL) {
152 // LookForDecls is set when "if (" has been seen. Check for
153 // 'identifier' '*' 'identifier' followed by not '=' -- this
154 // '*' has to be a binary operator but determineStarAmpUsage() will
155 // categorize it as an unary operator, so set the right type here.
156 if (LookForDecls && !CurrentToken->Children.empty()) {
157 AnnotatedToken &Prev = *CurrentToken->Parent;
158 AnnotatedToken &Next = CurrentToken->Children[0];
159 if (Prev.Parent->is(tok::identifier) &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000160 Prev.isOneOf(tok::star, tok::amp, tok::ampamp) &&
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000161 CurrentToken->is(tok::identifier) && Next.isNot(tok::equal)) {
162 Prev.Type = TT_BinaryOperator;
163 LookForDecls = false;
164 }
165 }
166
167 if (CurrentToken->is(tok::r_paren)) {
168 Left->MatchingParen = CurrentToken;
169 CurrentToken->MatchingParen = Left;
170
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000171 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000172 CurrentToken->Type = TT_ObjCMethodExpr;
173 if (Contexts.back().FirstObjCSelectorName != NULL) {
174 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
175 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000176 }
177 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000178
179 next();
180 return true;
181 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000182 if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000183 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000184 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000185 if (!consumeToken())
186 return false;
187 }
188 return false;
189 }
190
191 bool parseSquare() {
192 if (!CurrentToken)
193 return false;
194
195 // A '[' could be an index subscript (after an indentifier or after
Nico Weber051860e2013-02-10 02:08:05 +0000196 // ')' or ']'), it could be the start of an Objective-C method
197 // expression, or it could the the start of an Objective-C array literal.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000198 AnnotatedToken *Left = CurrentToken->Parent;
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000199 AnnotatedToken *Parent = getPreviousToken(*Left);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000200 bool StartsObjCMethodExpr =
Daniel Jasper6f21a982013-03-13 07:49:51 +0000201 Contexts.back().CanBeExpression &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000202 (!Parent || Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
203 tok::kw_return, tok::kw_throw) ||
204 isUnaryOperator(*Parent) || Parent->Type == TT_ObjCForIn ||
205 Parent->Type == TT_CastRParen ||
Daniel Jasper6f21a982013-03-13 07:49:51 +0000206 getBinOpPrecedence(Parent->FormatTok.Tok.getKind(), true, true) >
Daniel Jasperf9955d32013-03-20 12:37:50 +0000207 prec::Unknown);
Daniel Jasper923ebef2013-03-14 13:45:21 +0000208 ScopedContextCreator ContextCreator(*this, tok::l_square, 10);
Daniel Jasper6f21a982013-03-13 07:49:51 +0000209 Contexts.back().IsExpression = true;
Nico Weber051860e2013-02-10 02:08:05 +0000210 bool StartsObjCArrayLiteral = Parent && Parent->is(tok::at);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000211
Daniel Jasper4e778092013-02-06 10:05:46 +0000212 if (StartsObjCMethodExpr) {
213 Contexts.back().ColonIsObjCMethodExpr = true;
214 Left->Type = TT_ObjCMethodExpr;
Nico Weber051860e2013-02-10 02:08:05 +0000215 } else if (StartsObjCArrayLiteral) {
216 Left->Type = TT_ObjCArrayLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000217 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000218
219 while (CurrentToken != NULL) {
220 if (CurrentToken->is(tok::r_square)) {
221 if (!CurrentToken->Children.empty() &&
222 CurrentToken->Children[0].is(tok::l_paren)) {
Nico Webere8a97982013-02-06 06:20:11 +0000223 // An ObjC method call is rarely followed by an open parenthesis.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000224 // FIXME: Do we incorrectly label ":" with this?
225 StartsObjCMethodExpr = false;
226 Left->Type = TT_Unknown;
227 }
Daniel Jasper01786732013-02-04 07:21:18 +0000228 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000229 CurrentToken->Type = TT_ObjCMethodExpr;
Nico Webere8a97982013-02-06 06:20:11 +0000230 // determineStarAmpUsage() thinks that '*' '[' is allocating an
231 // array of pointers, but if '[' starts a selector then '*' is a
232 // binary operator.
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000233 if (Parent != NULL && Parent->Type == TT_PointerOrReference)
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000234 Parent->Type = TT_BinaryOperator;
Nico Weber051860e2013-02-10 02:08:05 +0000235 } else if (StartsObjCArrayLiteral) {
236 CurrentToken->Type = TT_ObjCArrayLiteral;
Daniel Jasper01786732013-02-04 07:21:18 +0000237 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000238 Left->MatchingParen = CurrentToken;
239 CurrentToken->MatchingParen = Left;
Daniel Jasper4e778092013-02-06 10:05:46 +0000240 if (Contexts.back().FirstObjCSelectorName != NULL)
241 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
242 Contexts.back().LongestObjCSelectorName;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000243 next();
244 return true;
245 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000246 if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000247 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000248 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000249 if (!consumeToken())
250 return false;
251 }
252 return false;
253 }
254
255 bool parseBrace() {
256 // Lines are fine to end with '{'.
257 if (CurrentToken == NULL)
258 return true;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000259 ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000260 AnnotatedToken *Left = CurrentToken->Parent;
261 while (CurrentToken != NULL) {
262 if (CurrentToken->is(tok::r_brace)) {
263 Left->MatchingParen = CurrentToken;
264 CurrentToken->MatchingParen = Left;
265 next();
266 return true;
267 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000268 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000269 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000270 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000271 if (!consumeToken())
272 return false;
273 }
274 return true;
275 }
Daniel Jasperc4615b72013-02-20 12:56:39 +0000276
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000277 void updateParameterCount(AnnotatedToken *Left, AnnotatedToken *Current) {
278 if (Current->is(tok::comma))
279 ++Left->ParameterCount;
280 else if (Left->ParameterCount == 0 && Current->isNot(tok::comment))
281 Left->ParameterCount = 1;
282 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000283
284 bool parseConditional() {
285 while (CurrentToken != NULL) {
286 if (CurrentToken->is(tok::colon)) {
287 CurrentToken->Type = TT_ConditionalExpr;
288 next();
289 return true;
290 }
291 if (!consumeToken())
292 return false;
293 }
294 return false;
295 }
296
297 bool parseTemplateDeclaration() {
298 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
299 CurrentToken->Type = TT_TemplateOpener;
300 next();
301 if (!parseAngle())
302 return false;
Daniel Jasper34511fb2013-02-19 17:14:38 +0000303 if (CurrentToken != NULL)
304 CurrentToken->Parent->ClosesTemplateDeclaration = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000305 return true;
306 }
307 return false;
308 }
309
310 bool consumeToken() {
311 AnnotatedToken *Tok = CurrentToken;
312 next();
313 switch (Tok->FormatTok.Tok.getKind()) {
314 case tok::plus:
315 case tok::minus:
Daniel Jasper627707b2013-03-22 16:55:40 +0000316 if (Tok->Parent == NULL && Line.MustBeDeclaration)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000317 Tok->Type = TT_ObjCMethodSpecifier;
318 break;
319 case tok::colon:
Daniel Jaspercf6d76a2013-03-18 12:50:26 +0000320 if (Tok->Parent == NULL)
321 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000322 // Colons from ?: are handled in parseConditional().
Daniel Jasper923ebef2013-03-14 13:45:21 +0000323 if (Tok->Parent->is(tok::r_paren) && Contexts.size() == 1) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000324 Tok->Type = TT_CtorInitializerColon;
Daniel Jasper4e778092013-02-06 10:05:46 +0000325 } else if (Contexts.back().ColonIsObjCMethodExpr ||
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000326 Line.First.Type == TT_ObjCMethodSpecifier) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000327 Tok->Type = TT_ObjCMethodExpr;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000328 Tok->Parent->Type = TT_ObjCSelectorName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000329 if (Tok->Parent->FormatTok.TokenLength >
Daniel Jasperf9955d32013-03-20 12:37:50 +0000330 Contexts.back().LongestObjCSelectorName)
Daniel Jasper4e778092013-02-06 10:05:46 +0000331 Contexts.back().LongestObjCSelectorName =
332 Tok->Parent->FormatTok.TokenLength;
333 if (Contexts.back().FirstObjCSelectorName == NULL)
334 Contexts.back().FirstObjCSelectorName = Tok->Parent;
335 } else if (Contexts.back().ColonIsForRangeExpr) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000336 Tok->Type = TT_RangeBasedForLoopColon;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000337 } else if (Contexts.size() == 1) {
338 Tok->Type = TT_InheritanceColon;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000339 } else if (Contexts.back().ContextKind == tok::l_paren) {
340 Tok->Type = TT_InlineASMColon;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000341 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000342 break;
343 case tok::kw_if:
344 case tok::kw_while:
345 if (CurrentToken != NULL && CurrentToken->is(tok::l_paren)) {
346 next();
347 if (!parseParens(/*LookForDecls=*/ true))
348 return false;
349 }
350 break;
351 case tok::kw_for:
Daniel Jasper4e778092013-02-06 10:05:46 +0000352 Contexts.back().ColonIsForRangeExpr = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000353 next();
354 if (!parseParens())
355 return false;
356 break;
357 case tok::l_paren:
358 if (!parseParens())
359 return false;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000360 if (Line.MustBeDeclaration)
361 Line.MightBeFunctionDecl = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000362 break;
363 case tok::l_square:
364 if (!parseSquare())
365 return false;
366 break;
367 case tok::l_brace:
368 if (!parseBrace())
369 return false;
370 break;
371 case tok::less:
372 if (parseAngle())
373 Tok->Type = TT_TemplateOpener;
374 else {
375 Tok->Type = TT_BinaryOperator;
376 CurrentToken = Tok;
377 next();
378 }
379 break;
380 case tok::r_paren:
381 case tok::r_square:
382 return false;
383 case tok::r_brace:
384 // Lines can start with '}'.
385 if (Tok->Parent != NULL)
386 return false;
387 break;
388 case tok::greater:
389 Tok->Type = TT_BinaryOperator;
390 break;
391 case tok::kw_operator:
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000392 while (CurrentToken && CurrentToken->isNot(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000393 if (CurrentToken->isOneOf(tok::star, tok::amp))
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000394 CurrentToken->Type = TT_PointerOrReference;
395 consumeToken();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000396 }
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000397 if (CurrentToken)
398 CurrentToken->Type = TT_OverloadedOperatorLParen;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000399 break;
400 case tok::question:
401 parseConditional();
402 break;
403 case tok::kw_template:
404 parseTemplateDeclaration();
405 break;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000406 case tok::identifier:
407 if (Line.First.is(tok::kw_for) &&
408 Tok->FormatTok.Tok.getIdentifierInfo() == &Ident_in)
409 Tok->Type = TT_ObjCForIn;
410 break;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000411 case tok::comma:
412 if (Contexts.back().FirstStartOfName)
413 Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
414 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000415 default:
416 break;
417 }
418 return true;
419 }
420
421 void parseIncludeDirective() {
422 next();
423 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
424 next();
425 while (CurrentToken != NULL) {
426 if (CurrentToken->isNot(tok::comment) ||
427 !CurrentToken->Children.empty())
428 CurrentToken->Type = TT_ImplicitStringLiteral;
429 next();
430 }
431 } else {
432 while (CurrentToken != NULL) {
Daniel Jasper3a204412013-02-23 07:46:38 +0000433 if (CurrentToken->is(tok::string_literal))
434 // Mark these string literals as "implicit" literals, too, so that
435 // they are not split or line-wrapped.
436 CurrentToken->Type = TT_ImplicitStringLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000437 next();
438 }
439 }
440 }
441
442 void parseWarningOrError() {
443 next();
444 // We still want to format the whitespace left of the first token of the
445 // warning or error.
446 next();
447 while (CurrentToken != NULL) {
448 CurrentToken->Type = TT_ImplicitStringLiteral;
449 next();
450 }
451 }
452
453 void parsePreprocessorDirective() {
454 next();
455 if (CurrentToken == NULL)
456 return;
457 // Hashes in the middle of a line can lead to any strange token
458 // sequence.
459 if (CurrentToken->FormatTok.Tok.getIdentifierInfo() == NULL)
460 return;
461 switch (CurrentToken->FormatTok.Tok.getIdentifierInfo()->getPPKeywordID()) {
462 case tok::pp_include:
463 case tok::pp_import:
464 parseIncludeDirective();
465 break;
466 case tok::pp_error:
467 case tok::pp_warning:
468 parseWarningOrError();
469 break;
470 default:
471 break;
472 }
Daniel Jasper5b7e7b02013-02-05 09:34:14 +0000473 while (CurrentToken != NULL)
474 next();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000475 }
476
Nico Weber95e8e462013-02-12 16:17:07 +0000477public:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000478 LineType parseLine() {
479 int PeriodsAndArrows = 0;
Daniel Jasper24849712013-03-01 16:48:32 +0000480 AnnotatedToken *LastPeriodOrArrow = NULL;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000481 bool CanBeBuilderTypeStmt = true;
482 if (CurrentToken->is(tok::hash)) {
483 parsePreprocessorDirective();
484 return LT_PreprocessorDirective;
485 }
486 while (CurrentToken != NULL) {
487 if (CurrentToken->is(tok::kw_virtual))
488 KeywordVirtualFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000489 if (CurrentToken->isOneOf(tok::period, tok::arrow)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000490 ++PeriodsAndArrows;
Daniel Jasper24849712013-03-01 16:48:32 +0000491 LastPeriodOrArrow = CurrentToken;
492 }
Daniel Jasper4a544e52013-02-15 20:33:06 +0000493 AnnotatedToken *TheToken = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000494 if (!consumeToken())
495 return LT_Invalid;
Daniel Jasper4a544e52013-02-15 20:33:06 +0000496 if (getPrecedence(*TheToken) > prec::Assignment &&
Daniel Jasper82282dc2013-02-18 13:52:06 +0000497 TheToken->Type == TT_BinaryOperator)
Daniel Jasper4a544e52013-02-15 20:33:06 +0000498 CanBeBuilderTypeStmt = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000499 }
500 if (KeywordVirtualFound)
501 return LT_VirtualFunctionDecl;
502
503 // Assume a builder-type call if there are 2 or more "." and "->".
Daniel Jasper24849712013-03-01 16:48:32 +0000504 if (PeriodsAndArrows >= 2 && CanBeBuilderTypeStmt) {
505 LastPeriodOrArrow->LastInChainOfCalls = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000506 return LT_BuilderTypeCall;
Daniel Jasper24849712013-03-01 16:48:32 +0000507 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000508
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000509 if (Line.First.Type == TT_ObjCMethodSpecifier) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000510 if (Contexts.back().FirstObjCSelectorName != NULL)
511 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
512 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000513 return LT_ObjCMethodDecl;
514 }
515
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000516 return LT_Other;
517 }
518
Nico Weber95e8e462013-02-12 16:17:07 +0000519private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000520 void next() {
Daniel Jasper01786732013-02-04 07:21:18 +0000521 if (CurrentToken != NULL) {
522 determineTokenType(*CurrentToken);
Daniel Jasper4e778092013-02-06 10:05:46 +0000523 CurrentToken->BindingStrength = Contexts.back().BindingStrength;
Daniel Jasper01786732013-02-04 07:21:18 +0000524 }
525
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000526 if (CurrentToken != NULL && !CurrentToken->Children.empty())
527 CurrentToken = &CurrentToken->Children[0];
528 else
529 CurrentToken = NULL;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000530
531 // Reset token type in case we have already looked at it and then recovered
532 // from an error (e.g. failure to find the matching >).
533 if (CurrentToken != NULL)
534 CurrentToken->Type = TT_Unknown;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000535 }
536
Daniel Jasper4e778092013-02-06 10:05:46 +0000537 /// \brief A struct to hold information valid in a specific context, e.g.
538 /// a pair of parenthesis.
539 struct Context {
Daniel Jasper923ebef2013-03-14 13:45:21 +0000540 Context(tok::TokenKind ContextKind, unsigned BindingStrength,
541 bool IsExpression)
542 : ContextKind(ContextKind), BindingStrength(BindingStrength),
543 LongestObjCSelectorName(0), ColonIsForRangeExpr(false),
544 ColonIsObjCMethodExpr(false), FirstObjCSelectorName(NULL),
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000545 FirstStartOfName(NULL), IsExpression(IsExpression),
546 CanBeExpression(true) {}
Daniel Jasper01786732013-02-04 07:21:18 +0000547
Daniel Jasper923ebef2013-03-14 13:45:21 +0000548 tok::TokenKind ContextKind;
Daniel Jasper4e778092013-02-06 10:05:46 +0000549 unsigned BindingStrength;
550 unsigned LongestObjCSelectorName;
551 bool ColonIsForRangeExpr;
552 bool ColonIsObjCMethodExpr;
553 AnnotatedToken *FirstObjCSelectorName;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000554 AnnotatedToken *FirstStartOfName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000555 bool IsExpression;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000556 bool CanBeExpression;
Daniel Jasper4e778092013-02-06 10:05:46 +0000557 };
558
559 /// \brief Puts a new \c Context onto the stack \c Contexts for the lifetime
560 /// of each instance.
561 struct ScopedContextCreator {
562 AnnotatingParser &P;
563
Daniel Jasper923ebef2013-03-14 13:45:21 +0000564 ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
565 unsigned Increase)
566 : P(P) {
567 P.Contexts.push_back(
568 Context(ContextKind, P.Contexts.back().BindingStrength + Increase,
569 P.Contexts.back().IsExpression));
Daniel Jasper4e778092013-02-06 10:05:46 +0000570 }
571
572 ~ScopedContextCreator() { P.Contexts.pop_back(); }
573 };
Daniel Jasper01786732013-02-04 07:21:18 +0000574
575 void determineTokenType(AnnotatedToken &Current) {
576 if (getPrecedence(Current) == prec::Assignment) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000577 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000578 for (AnnotatedToken *Previous = Current.Parent;
579 Previous && Previous->isNot(tok::comma);
580 Previous = Previous->Parent) {
Daniel Jasper9c65b062013-02-27 11:43:50 +0000581 if (Previous->is(tok::r_square))
582 Previous = Previous->MatchingParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000583 if (Previous->Type == TT_BinaryOperator &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000584 Previous->isOneOf(tok::star, tok::amp)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000585 Previous->Type = TT_PointerOrReference;
586 }
Daniel Jasper01786732013-02-04 07:21:18 +0000587 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000588 } else if (Current.isOneOf(tok::kw_return, tok::kw_throw) ||
Nico Weber95e8e462013-02-12 16:17:07 +0000589 (Current.is(tok::l_paren) && !Line.MustBeDeclaration &&
590 (!Current.Parent || Current.Parent->isNot(tok::kw_for)))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000591 Contexts.back().IsExpression = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000592 } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
Nico Weber95e8e462013-02-12 16:17:07 +0000593 for (AnnotatedToken *Previous = Current.Parent;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000594 Previous && Previous->isOneOf(tok::star, tok::amp);
Nico Weber95e8e462013-02-12 16:17:07 +0000595 Previous = Previous->Parent)
596 Previous->Type = TT_PointerOrReference;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000597 } else if (Current.Parent &&
598 Current.Parent->Type == TT_CtorInitializerColon) {
599 Contexts.back().IsExpression = true;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000600 } else if (Current.is(tok::kw_new)) {
601 Contexts.back().CanBeExpression = false;
Nico Weber95e8e462013-02-12 16:17:07 +0000602 }
Daniel Jasper01786732013-02-04 07:21:18 +0000603
604 if (Current.Type == TT_Unknown) {
Daniel Jasper3c08a812013-02-24 18:54:32 +0000605 if (Current.Parent && Current.is(tok::identifier) &&
606 ((Current.Parent->is(tok::identifier) &&
607 Current.Parent->FormatTok.Tok.getIdentifierInfo()
608 ->getPPKeywordID() == tok::pp_not_keyword) ||
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000609 isSimpleTypeSpecifier(*Current.Parent) ||
Daniel Jasper3c08a812013-02-24 18:54:32 +0000610 Current.Parent->Type == TT_PointerOrReference ||
611 Current.Parent->Type == TT_TemplateCloser)) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000612 Contexts.back().FirstStartOfName = &Current;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000613 Current.Type = TT_StartOfName;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000614 } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000615 Current.Type =
616 determineStarAmpUsage(Current, Contexts.back().IsExpression);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000617 } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000618 Current.Type = determinePlusMinusCaretUsage(Current);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000619 } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000620 Current.Type = determineIncrementUsage(Current);
621 } else if (Current.is(tok::exclaim)) {
622 Current.Type = TT_UnaryOperator;
623 } else if (isBinaryOperator(Current)) {
624 Current.Type = TT_BinaryOperator;
625 } else if (Current.is(tok::comment)) {
626 std::string Data(Lexer::getSpelling(Current.FormatTok.Tok, SourceMgr,
627 Lex.getLangOpts()));
628 if (StringRef(Data).startswith("//"))
629 Current.Type = TT_LineComment;
630 else
631 Current.Type = TT_BlockComment;
Nico Weber37d69312013-02-13 04:13:13 +0000632 } else if (Current.is(tok::r_paren)) {
Daniel Jasper03628b82013-02-19 20:05:41 +0000633 bool ParensNotExpr = !Current.Parent ||
634 Current.Parent->Type == TT_PointerOrReference ||
Nico Weber37d69312013-02-13 04:13:13 +0000635 Current.Parent->Type == TT_TemplateCloser;
636 bool ParensCouldEndDecl =
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000637 !Current.Children.empty() &&
638 Current.Children[0].isOneOf(tok::equal, tok::semi, tok::l_brace);
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000639 bool IsSizeOfOrAlignOf =
640 Current.MatchingParen && Current.MatchingParen->Parent &&
641 Current.MatchingParen->Parent->isOneOf(tok::kw_sizeof,
642 tok::kw_alignof);
643 if (ParensNotExpr && !ParensCouldEndDecl && !IsSizeOfOrAlignOf &&
Daniel Jasper37eff832013-02-23 08:07:18 +0000644 Contexts.back().IsExpression)
Nico Weber37d69312013-02-13 04:13:13 +0000645 // FIXME: We need to get smarter and understand more cases of casts.
646 Current.Type = TT_CastRParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000647 } else if (Current.is(tok::at) && Current.Children.size()) {
648 switch (Current.Children[0].FormatTok.Tok.getObjCKeywordID()) {
649 case tok::objc_interface:
650 case tok::objc_implementation:
651 case tok::objc_protocol:
652 Current.Type = TT_ObjCDecl;
653 break;
654 case tok::objc_property:
655 Current.Type = TT_ObjCProperty;
656 break;
657 default:
658 break;
659 }
660 }
661 }
662 }
663
Daniel Jasper01786732013-02-04 07:21:18 +0000664 /// \brief Return the type of the given token assuming it is * or &.
665 TokenType
666 determineStarAmpUsage(const AnnotatedToken &Tok, bool IsExpression) {
667 const AnnotatedToken *PrevToken = getPreviousToken(Tok);
668 if (PrevToken == NULL)
669 return TT_UnaryOperator;
670
671 const AnnotatedToken *NextToken = getNextToken(Tok);
672 if (NextToken == NULL)
673 return TT_Unknown;
674
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +0000675 if (PrevToken->is(tok::l_paren) && !IsExpression)
676 return TT_PointerOrReference;
677
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000678 if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
Daniel Jasperd3cf17b2013-03-14 10:50:25 +0000679 tok::comma, tok::semi, tok::kw_return, tok::colon,
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000680 tok::equal) ||
681 PrevToken->Type == TT_BinaryOperator ||
Daniel Jasper01786732013-02-04 07:21:18 +0000682 PrevToken->Type == TT_UnaryOperator || PrevToken->Type == TT_CastRParen)
683 return TT_UnaryOperator;
684
Nico Webere8a97982013-02-06 06:20:11 +0000685 if (NextToken->is(tok::l_square))
686 return TT_PointerOrReference;
687
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000688 if (PrevToken->FormatTok.Tok.isLiteral() ||
689 PrevToken->isOneOf(tok::r_paren, tok::r_square) ||
Daniel Jasper9322aae2013-03-20 09:53:18 +0000690 NextToken->FormatTok.Tok.isLiteral() || isUnaryOperator(*NextToken))
Daniel Jasper01786732013-02-04 07:21:18 +0000691 return TT_BinaryOperator;
692
Daniel Jasper01786732013-02-04 07:21:18 +0000693 // It is very unlikely that we are going to find a pointer or reference type
694 // definition on the RHS of an assignment.
695 if (IsExpression)
696 return TT_BinaryOperator;
697
698 return TT_PointerOrReference;
699 }
700
701 TokenType determinePlusMinusCaretUsage(const AnnotatedToken &Tok) {
702 const AnnotatedToken *PrevToken = getPreviousToken(Tok);
703 if (PrevToken == NULL)
704 return TT_UnaryOperator;
705
706 // Use heuristics to recognize unary operators.
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000707 if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
708 tok::question, tok::colon, tok::kw_return,
709 tok::kw_case, tok::at, tok::l_brace))
Daniel Jasper01786732013-02-04 07:21:18 +0000710 return TT_UnaryOperator;
711
Nico Weberee0feec2013-02-05 16:21:00 +0000712 // There can't be two consecutive binary operators.
Daniel Jasper01786732013-02-04 07:21:18 +0000713 if (PrevToken->Type == TT_BinaryOperator)
714 return TT_UnaryOperator;
715
716 // Fall back to marking the token as binary operator.
717 return TT_BinaryOperator;
718 }
719
720 /// \brief Determine whether ++/-- are pre- or post-increments/-decrements.
721 TokenType determineIncrementUsage(const AnnotatedToken &Tok) {
722 const AnnotatedToken *PrevToken = getPreviousToken(Tok);
723 if (PrevToken == NULL)
724 return TT_UnaryOperator;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000725 if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
Daniel Jasper01786732013-02-04 07:21:18 +0000726 return TT_TrailingUnaryOperator;
727
728 return TT_UnaryOperator;
729 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000730
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000731 // FIXME: This is copy&pasted from Sema. Put it in a common place and remove
732 // duplication.
733 /// \brief Determine whether the token kind starts a simple-type-specifier.
734 bool isSimpleTypeSpecifier(const AnnotatedToken &Tok) const {
735 switch (Tok.FormatTok.Tok.getKind()) {
736 case tok::kw_short:
737 case tok::kw_long:
738 case tok::kw___int64:
739 case tok::kw___int128:
740 case tok::kw_signed:
741 case tok::kw_unsigned:
742 case tok::kw_void:
743 case tok::kw_char:
744 case tok::kw_int:
745 case tok::kw_half:
746 case tok::kw_float:
747 case tok::kw_double:
748 case tok::kw_wchar_t:
749 case tok::kw_bool:
750 case tok::kw___underlying_type:
751 return true;
752 case tok::annot_typename:
753 case tok::kw_char16_t:
754 case tok::kw_char32_t:
755 case tok::kw_typeof:
756 case tok::kw_decltype:
757 return Lex.getLangOpts().CPlusPlus;
758 default:
759 break;
760 }
761 return false;
762 }
763
Daniel Jasper4e778092013-02-06 10:05:46 +0000764 SmallVector<Context, 8> Contexts;
765
766 SourceManager &SourceMgr;
767 Lexer &Lex;
768 AnnotatedLine &Line;
769 AnnotatedToken *CurrentToken;
770 bool KeywordVirtualFound;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000771 IdentifierInfo &Ident_in;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000772};
773
Daniel Jasper29f123b2013-02-08 15:28:42 +0000774/// \brief Parses binary expressions by inserting fake parenthesis based on
775/// operator precedence.
776class ExpressionParser {
777public:
778 ExpressionParser(AnnotatedLine &Line) : Current(&Line.First) {}
779
780 /// \brief Parse expressions with the given operatore precedence.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000781 void parse(int Precedence = 0) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000782 if (Precedence > prec::PointerToMember || Current == NULL)
783 return;
784
785 // Skip over "return" until we can properly parse it.
786 if (Current->is(tok::kw_return))
787 next();
788
789 // Eagerly consume trailing comments.
790 while (isTrailingComment(Current)) {
791 next();
792 }
793
794 AnnotatedToken *Start = Current;
795 bool OperatorFound = false;
796
Daniel Jasper237d4c12013-02-23 21:01:55 +0000797 while (Current) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000798 // Consume operators with higher precedence.
Dmitri Gribenko6ba52aa2013-02-16 20:03:26 +0000799 parse(prec::Level(Precedence + 1));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000800
Daniel Jasper237d4c12013-02-23 21:01:55 +0000801 int CurrentPrecedence = 0;
802 if (Current) {
803 if (Current->Type == TT_ConditionalExpr)
804 CurrentPrecedence = 1 + (int) prec::Conditional;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000805 else if (Current->is(tok::semi) || Current->Type == TT_InlineASMColon ||
806 Current->Type == TT_CtorInitializerColon)
Daniel Jasper237d4c12013-02-23 21:01:55 +0000807 CurrentPrecedence = 1;
808 else if (Current->Type == TT_BinaryOperator || Current->is(tok::comma))
809 CurrentPrecedence = 1 + (int) getPrecedence(*Current);
810 }
811
Daniel Jasper29f123b2013-02-08 15:28:42 +0000812 // At the end of the line or when an operator with higher precedence is
813 // found, insert fake parenthesis and return.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000814 if (Current == NULL || closesScope(*Current) ||
815 (CurrentPrecedence != 0 && CurrentPrecedence < Precedence)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000816 if (OperatorFound) {
817 ++Start->FakeLParens;
Daniel Jasper237d4c12013-02-23 21:01:55 +0000818 if (Current)
Daniel Jasper087387a2013-02-08 16:49:27 +0000819 ++Current->Parent->FakeRParens;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000820 }
821 return;
822 }
823
824 // Consume scopes: (), [], <> and {}
825 if (opensScope(*Current)) {
Daniel Jasper237d4c12013-02-23 21:01:55 +0000826 AnnotatedToken *Left = Current;
827 while (Current && !closesScope(*Current)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000828 next();
829 parse();
830 }
Daniel Jasper237d4c12013-02-23 21:01:55 +0000831 // Remove fake parens that just duplicate the real parens.
832 if (Current && Left->Children[0].FakeLParens > 0 &&
833 Current->Parent->FakeRParens > 0) {
834 --Left->Children[0].FakeLParens;
835 --Current->Parent->FakeRParens;
836 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000837 next();
838 } else {
839 // Operator found.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000840 if (CurrentPrecedence == Precedence)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000841 OperatorFound = true;
842
843 next();
844 }
845 }
846 }
847
848private:
849 void next() {
850 if (Current != NULL)
851 Current = Current->Children.empty() ? NULL : &Current->Children[0];
852 }
853
Daniel Jasper29f123b2013-02-08 15:28:42 +0000854 AnnotatedToken *Current;
855};
856
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000857void TokenAnnotator::annotate(AnnotatedLine &Line) {
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000858 AnnotatingParser Parser(SourceMgr, Lex, Line, Ident_in);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000859 Line.Type = Parser.parseLine();
860 if (Line.Type == LT_Invalid)
861 return;
862
Daniel Jasper29f123b2013-02-08 15:28:42 +0000863 ExpressionParser ExprParser(Line);
864 ExprParser.parse();
865
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000866 if (Line.First.Type == TT_ObjCMethodSpecifier)
867 Line.Type = LT_ObjCMethodDecl;
868 else if (Line.First.Type == TT_ObjCDecl)
869 Line.Type = LT_ObjCDecl;
870 else if (Line.First.Type == TT_ObjCProperty)
871 Line.Type = LT_ObjCProperty;
872
Daniel Jasper729a7432013-02-11 12:36:37 +0000873 Line.First.SpacesRequiredBefore = 1;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000874 Line.First.MustBreakBefore = Line.First.FormatTok.MustBreakBefore;
875 Line.First.CanBreakBefore = Line.First.MustBreakBefore;
876
877 Line.First.TotalLength = Line.First.FormatTok.TokenLength;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000878}
879
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000880void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
881 if (Line.First.Children.empty())
882 return;
883 AnnotatedToken *Current = &Line.First.Children[0];
884 while (Current != NULL) {
Daniel Jasper729a7432013-02-11 12:36:37 +0000885 if (Current->Type == TT_LineComment)
886 Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
887 else
888 Current->SpacesRequiredBefore =
889 spaceRequiredBefore(Line, *Current) ? 1 : 0;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000890
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000891 if (Current->FormatTok.MustBreakBefore) {
892 Current->MustBreakBefore = true;
893 } else if (Current->Type == TT_LineComment) {
894 Current->MustBreakBefore = Current->FormatTok.NewlinesBefore > 0;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000895 } else if (isTrailingComment(Current->Parent) ||
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000896 (Current->is(tok::string_literal) &&
897 Current->Parent->is(tok::string_literal))) {
898 Current->MustBreakBefore = true;
899 } else if (Current->is(tok::lessless) && !Current->Children.empty() &&
900 Current->Parent->is(tok::string_literal) &&
901 Current->Children[0].is(tok::string_literal)) {
902 Current->MustBreakBefore = true;
903 } else {
904 Current->MustBreakBefore = false;
905 }
906 Current->CanBreakBefore =
907 Current->MustBreakBefore || canBreakBefore(Line, *Current);
908 if (Current->MustBreakBefore)
909 Current->TotalLength = Current->Parent->TotalLength + Style.ColumnLimit;
910 else
911 Current->TotalLength =
912 Current->Parent->TotalLength + Current->FormatTok.TokenLength +
Daniel Jasper729a7432013-02-11 12:36:37 +0000913 Current->SpacesRequiredBefore;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000914 // FIXME: Only calculate this if CanBreakBefore is true once static
915 // initializers etc. are sorted out.
916 // FIXME: Move magic numbers to a better place.
917 Current->SplitPenalty =
918 20 * Current->BindingStrength + splitPenalty(Line, *Current);
919
920 Current = Current->Children.empty() ? NULL : &Current->Children[0];
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000921 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000922}
923
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000924unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
925 const AnnotatedToken &Tok) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000926 const AnnotatedToken &Left = *Tok.Parent;
927 const AnnotatedToken &Right = Tok;
928
Daniel Jasper3c08a812013-02-24 18:54:32 +0000929 if (Right.Type == TT_StartOfName) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000930 if (Line.First.is(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000931 return 3;
932 else if (Line.MightBeFunctionDecl && Right.BindingStrength == 1)
933 // FIXME: Clean up hack of using BindingStrength to find top-level names.
934 return Style.PenaltyReturnTypeOnItsOwnLine;
935 else
936 return 100;
937 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000938 if (Left.is(tok::equal) && Right.is(tok::l_brace))
939 return 150;
940 if (Left.is(tok::coloncolon))
941 return 500;
942
Daniel Jasper6cabab42013-02-14 08:42:54 +0000943 if (Left.Type == TT_RangeBasedForLoopColon ||
944 Left.Type == TT_InheritanceColon)
Daniel Jasper84a1a632013-02-26 13:18:08 +0000945 return 2;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000946
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000947 if (Right.isOneOf(tok::arrow, tok::period)) {
Daniel Jasper515f65d2013-02-18 13:24:21 +0000948 if (Line.Type == LT_BuilderTypeCall)
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000949 return prec::PointerToMember;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000950 if (Left.isOneOf(tok::r_paren, tok::r_square) && Left.MatchingParen &&
951 Left.MatchingParen->ParameterCount > 0)
Daniel Jasper518ee342013-02-26 13:59:14 +0000952 return 20; // Should be smaller than breaking at a nested comma.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000953 return 150;
954 }
955
956 // In for-loops, prefer breaking at ',' and ';'.
Daniel Jasper7d812812013-02-21 15:00:29 +0000957 if (Line.First.is(tok::kw_for) && Left.is(tok::equal))
958 return 4;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000959
Daniel Jasper8159d2f2013-02-04 07:30:30 +0000960 if (Left.is(tok::semi))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000961 return 0;
Daniel Jasper8159d2f2013-02-04 07:30:30 +0000962 if (Left.is(tok::comma))
963 return 1;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000964
965 // In Objective-C method expressions, prefer breaking before "param:" over
966 // breaking after it.
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000967 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000968 return 0;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000969 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000970 return 20;
971
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000972 if (opensScope(Left))
Daniel Jasper64f09282013-03-20 13:53:11 +0000973 return Left.ParameterCount > 1 ? prec::Comma : 20;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000974
Daniel Jasper4e8a7b42013-02-06 21:04:05 +0000975 if (Right.is(tok::lessless)) {
976 if (Left.is(tok::string_literal)) {
Daniel Jasperbfa1edd2013-03-14 14:00:17 +0000977 StringRef Content = StringRef(Left.FormatTok.Tok.getLiteralData(),
978 Left.FormatTok.TokenLength);
979 Content = Content.drop_back(1).drop_front(1).trim();
980 if (Content.size() > 1 &&
981 (Content.back() == ':' || Content.back() == '='))
Daniel Jasper4e8a7b42013-02-06 21:04:05 +0000982 return 100;
983 }
Daniel Jasper01786732013-02-04 07:21:18 +0000984 return prec::Shift;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +0000985 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000986 if (Left.Type == TT_ConditionalExpr)
Daniel Jasper518ee342013-02-26 13:59:14 +0000987 return prec::Conditional;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000988 prec::Level Level = getPrecedence(Left);
989
990 if (Level != prec::Unknown)
991 return Level;
Daniel Jasper24849712013-03-01 16:48:32 +0000992
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000993 return 3;
994}
995
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000996bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
997 const AnnotatedToken &Left,
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000998 const AnnotatedToken &Right) {
999 if (Right.is(tok::hashhash))
1000 return Left.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001001 if (Left.isOneOf(tok::hashhash, tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001002 return Right.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001003 if (Right.isOneOf(tok::r_paren, tok::semi, tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001004 return false;
1005 if (Right.is(tok::less) &&
1006 (Left.is(tok::kw_template) ||
1007 (Line.Type == LT_ObjCDecl && Style.ObjCSpaceBeforeProtocolList)))
1008 return true;
1009 if (Left.is(tok::arrow) || Right.is(tok::arrow))
1010 return false;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001011 if (Left.isOneOf(tok::exclaim, tok::tilde))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001012 return false;
1013 if (Left.is(tok::at) &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001014 Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
1015 tok::numeric_constant, tok::l_paren, tok::l_brace,
1016 tok::kw_true, tok::kw_false))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001017 return false;
1018 if (Left.is(tok::coloncolon))
1019 return false;
1020 if (Right.is(tok::coloncolon))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001021 return !Left.isOneOf(tok::identifier, tok::greater, tok::l_paren);
1022 if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001023 return false;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001024 if (Right.Type == TT_PointerOrReference)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001025 return Left.FormatTok.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001026 ((Left.Type != TT_PointerOrReference) && Left.isNot(tok::l_paren) &&
1027 !Style.PointerBindsToType);
1028 if (Left.Type == TT_PointerOrReference)
Nico Weber95e8e462013-02-12 16:17:07 +00001029 return Right.FormatTok.Tok.isLiteral() ||
Daniel Jasper9322aae2013-03-20 09:53:18 +00001030 ((Right.Type != TT_PointerOrReference) &&
Daniel Jasper81d2d382013-04-01 17:13:26 +00001031 Right.isNot(tok::l_paren) && Style.PointerBindsToType &&
1032 Left.Parent && Left.Parent->isNot(tok::l_paren));
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001033 if (Right.is(tok::star) && Left.is(tok::l_paren))
1034 return false;
Nico Weber051860e2013-02-10 02:08:05 +00001035 if (Left.is(tok::l_square))
1036 return Left.Type == TT_ObjCArrayLiteral && Right.isNot(tok::r_square);
1037 if (Right.is(tok::r_square))
1038 return Right.Type == TT_ObjCArrayLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001039 if (Right.is(tok::l_square) && Right.Type != TT_ObjCMethodExpr)
1040 return false;
1041 if (Left.is(tok::period) || Right.is(tok::period))
1042 return false;
1043 if (Left.is(tok::colon))
1044 return Left.Type != TT_ObjCMethodExpr;
1045 if (Right.is(tok::colon))
1046 return Right.Type != TT_ObjCMethodExpr;
1047 if (Left.is(tok::l_paren))
1048 return false;
1049 if (Right.is(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001050 return Line.Type == LT_ObjCDecl ||
1051 Left.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
1052 tok::kw_return, tok::kw_catch, tok::kw_new,
1053 tok::kw_delete);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001054 }
1055 if (Left.is(tok::at) &&
1056 Right.FormatTok.Tok.getObjCKeywordID() != tok::objc_not_keyword)
1057 return false;
1058 if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
1059 return false;
1060 return true;
1061}
1062
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001063bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
1064 const AnnotatedToken &Tok) {
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001065 if (Tok.FormatTok.Tok.getIdentifierInfo() &&
1066 Tok.Parent->FormatTok.Tok.getIdentifierInfo())
1067 return true; // Never ever merge two identifiers.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001068 if (Line.Type == LT_ObjCMethodDecl) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001069 if (Tok.Parent->Type == TT_ObjCMethodSpecifier)
1070 return true;
1071 if (Tok.Parent->is(tok::r_paren) && Tok.is(tok::identifier))
1072 // Don't space between ')' and <id>
1073 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001074 }
1075 if (Line.Type == LT_ObjCProperty &&
1076 (Tok.is(tok::equal) || Tok.Parent->is(tok::equal)))
1077 return false;
1078
1079 if (Tok.Parent->is(tok::comma))
1080 return true;
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001081 if (Tok.is(tok::comma))
1082 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001083 if (Tok.Type == TT_CtorInitializerColon || Tok.Type == TT_ObjCBlockLParen)
1084 return true;
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001085 if (Tok.Parent->FormatTok.Tok.is(tok::kw_operator))
1086 return false;
1087 if (Tok.Type == TT_OverloadedOperatorLParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001088 return false;
1089 if (Tok.is(tok::colon))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001090 return !Line.First.isOneOf(tok::kw_case, tok::kw_default) &&
1091 !Tok.Children.empty() && Tok.Type != TT_ObjCMethodExpr;
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +00001092 if (Tok.is(tok::l_paren) && !Tok.Children.empty() &&
1093 Tok.Children[0].Type == TT_PointerOrReference &&
1094 !Tok.Children[0].Children.empty() &&
Alexander Kornienko54a38bd2013-03-20 16:41:56 +00001095 Tok.Children[0].Children[0].isNot(tok::r_paren) &&
Daniel Jasper81d2d382013-04-01 17:13:26 +00001096 Tok.Parent->isNot(tok::l_paren) &&
1097 (Tok.Parent->Type != TT_PointerOrReference || Style.PointerBindsToType))
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +00001098 return true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001099 if (Tok.Parent->Type == TT_UnaryOperator || Tok.Parent->Type == TT_CastRParen)
1100 return false;
1101 if (Tok.Type == TT_UnaryOperator)
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001102 return !Tok.Parent->isOneOf(tok::l_paren, tok::l_square, tok::at) &&
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001103 (Tok.Parent->isNot(tok::colon) ||
1104 Tok.Parent->Type != TT_ObjCMethodExpr);
1105 if (Tok.Parent->is(tok::greater) && Tok.is(tok::greater)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +00001106 return Tok.Type == TT_TemplateCloser &&
1107 Tok.Parent->Type == TT_TemplateCloser &&
1108 Style.Standard != FormatStyle::LS_Cpp11;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001109 }
Alexander Kornienko54a38bd2013-03-20 16:41:56 +00001110 if (Tok.isOneOf(tok::arrowstar, tok::periodstar) ||
1111 Tok.Parent->isOneOf(tok::arrowstar, tok::periodstar))
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001112 return false;
1113 if (Tok.Type == TT_BinaryOperator || Tok.Parent->Type == TT_BinaryOperator)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001114 return true;
1115 if (Tok.Parent->Type == TT_TemplateCloser && Tok.is(tok::l_paren))
1116 return false;
1117 if (Tok.is(tok::less) && Line.First.is(tok::hash))
1118 return true;
1119 if (Tok.Type == TT_TrailingUnaryOperator)
1120 return false;
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001121 return spaceRequiredBetween(Line, *Tok.Parent, Tok);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001122}
1123
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001124bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
1125 const AnnotatedToken &Right) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001126 const AnnotatedToken &Left = *Right.Parent;
Daniel Jaspera03ab102013-02-13 20:33:44 +00001127 if (Right.Type == TT_StartOfName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001128 return true;
1129 if (Right.is(tok::colon) && Right.Type == TT_ObjCMethodExpr)
1130 return false;
1131 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
1132 return true;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001133 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001134 return true;
1135 if (Left.ClosesTemplateDeclaration)
1136 return true;
1137 if (Right.Type == TT_ConditionalExpr || Right.is(tok::question))
1138 return true;
Daniel Jasper6cabab42013-02-14 08:42:54 +00001139 if (Right.Type == TT_RangeBasedForLoopColon ||
Daniel Jasper27b91cc2013-04-05 17:21:59 +00001140 Right.Type == TT_InheritanceColon ||
1141 Right.Type == TT_OverloadedOperatorLParen)
Daniel Jasper6cabab42013-02-14 08:42:54 +00001142 return false;
1143 if (Left.Type == TT_RangeBasedForLoopColon ||
1144 Left.Type == TT_InheritanceColon)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001145 return true;
Daniel Jasper7d812812013-02-21 15:00:29 +00001146 if (Right.Type == TT_RangeBasedForLoopColon)
1147 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001148 if (Left.Type == TT_PointerOrReference || Left.Type == TT_TemplateCloser ||
1149 Left.Type == TT_UnaryOperator || Left.Type == TT_ConditionalExpr ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001150 Left.isOneOf(tok::question, tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001151 return false;
1152 if (Left.is(tok::equal) && Line.Type == LT_VirtualFunctionDecl)
1153 return false;
Daniel Jasper8ed41002013-02-28 14:44:25 +00001154 if (Left.is(tok::l_paren) && Right.is(tok::l_paren) && Left.Parent &&
1155 Left.Parent->is(tok::kw___attribute))
1156 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001157
1158 if (Right.Type == TT_LineComment)
1159 // We rely on MustBreakBefore being set correctly here as we should not
1160 // change the "binding" behavior of a comment.
1161 return false;
1162
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001163 // Allow breaking after a trailing 'const', e.g. after a method declaration,
1164 // unless it is follow by ';', '{' or '='.
1165 if (Left.is(tok::kw_const) && Left.Parent != NULL &&
1166 Left.Parent->is(tok::r_paren))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001167 return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001168
Daniel Jasper8ef19a22013-03-14 09:50:46 +00001169 if (Right.is(tok::kw___attribute))
1170 return true;
1171
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001172 // We only break before r_brace if there was a corresponding break before
1173 // the l_brace, which is tracked by BreakBeforeClosingBrace.
Daniel Jasper8ef19a22013-03-14 09:50:46 +00001174 if (Right.isOneOf(tok::r_brace, tok::r_paren, tok::greater))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001175 return false;
Daniel Jasper3a204412013-02-23 07:46:38 +00001176 if (Left.is(tok::identifier) && Right.is(tok::string_literal))
1177 return true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001178 return (isBinaryOperator(Left) && Left.isNot(tok::lessless)) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001179 Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace) ||
1180 Right.isOneOf(tok::lessless, tok::arrow, tok::period, tok::colon) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001181 (Left.is(tok::r_paren) && Left.Type != TT_CastRParen &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001182 Right.isOneOf(tok::identifier, tok::kw___attribute)) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001183 (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
1184 (Left.is(tok::l_square) && !Right.is(tok::r_square));
1185}
1186
1187} // namespace format
1188} // namespace clang