blob: 307607aadd72df27205bbc7ecb534ce4bdeab89b [file] [log] [blame]
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements a token annotator, i.e. creates
12/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
13///
14//===----------------------------------------------------------------------===//
15
16#include "TokenAnnotator.h"
17#include "clang/Basic/SourceManager.h"
18#include "clang/Lex/Lexer.h"
19
20namespace clang {
21namespace format {
22
Nico Weberee0feec2013-02-05 16:21:00 +000023static bool isUnaryOperator(const AnnotatedToken &Tok) {
24 switch (Tok.FormatTok.Tok.getKind()) {
25 case tok::plus:
26 case tok::plusplus:
27 case tok::minus:
28 case tok::minusminus:
29 case tok::exclaim:
30 case tok::tilde:
31 case tok::kw_sizeof:
32 case tok::kw_alignof:
33 return true;
34 default:
35 return false;
36 }
37}
38
Daniel Jasper32d28ee2013-01-29 21:01:14 +000039static bool isBinaryOperator(const AnnotatedToken &Tok) {
40 // Comma is a binary operator, but does not behave as such wrt. formatting.
41 return getPrecedence(Tok) > prec::Comma;
42}
43
Daniel Jasper01786732013-02-04 07:21:18 +000044// Returns the previous token ignoring comments.
Nico Weber4ed7f3e2013-02-06 16:54:35 +000045static AnnotatedToken *getPreviousToken(AnnotatedToken &Tok) {
46 AnnotatedToken *PrevToken = Tok.Parent;
Daniel Jasper01786732013-02-04 07:21:18 +000047 while (PrevToken != NULL && PrevToken->is(tok::comment))
48 PrevToken = PrevToken->Parent;
49 return PrevToken;
50}
Nico Weber4ed7f3e2013-02-06 16:54:35 +000051static const AnnotatedToken *getPreviousToken(const AnnotatedToken &Tok) {
52 return getPreviousToken(const_cast<AnnotatedToken &>(Tok));
53}
Daniel Jasper01786732013-02-04 07:21:18 +000054
Daniel Jasper29f123b2013-02-08 15:28:42 +000055static bool isTrailingComment(AnnotatedToken *Tok) {
56 return Tok != NULL && Tok->is(tok::comment) &&
57 (Tok->Children.empty() ||
58 Tok->Children[0].FormatTok.NewlinesBefore > 0);
59}
60
Daniel Jasper01786732013-02-04 07:21:18 +000061// Returns the next token ignoring comments.
62static const AnnotatedToken *getNextToken(const AnnotatedToken &Tok) {
63 if (Tok.Children.empty())
64 return NULL;
65 const AnnotatedToken *NextToken = &Tok.Children[0];
66 while (NextToken->is(tok::comment)) {
67 if (NextToken->Children.empty())
68 return NULL;
69 NextToken = &NextToken->Children[0];
70 }
71 return NextToken;
72}
73
/// \brief A parser that gathers additional information about tokens.
///
/// The \c TokenAnnotator tries to match parentheses and square brackets and
/// store the parenthesis levels. It also tries to resolve matching "<" and ">"
/// into template parameter lists.
79class AnnotatingParser {
80public:
Nico Weberc2e6d2a2013-02-11 15:32:15 +000081 AnnotatingParser(SourceManager &SourceMgr, Lexer &Lex, AnnotatedLine &Line,
82 IdentifierInfo &Ident_in)
Daniel Jasper01786732013-02-04 07:21:18 +000083 : SourceMgr(SourceMgr), Lex(Lex), Line(Line), CurrentToken(&Line.First),
Nico Weberc2e6d2a2013-02-11 15:32:15 +000084 KeywordVirtualFound(false), Ident_in(Ident_in) {
Daniel Jasper4e778092013-02-06 10:05:46 +000085 Contexts.push_back(Context(1, /*IsExpression=*/ false));
Daniel Jasper32d28ee2013-01-29 21:01:14 +000086 }
87
Nico Weber95e8e462013-02-12 16:17:07 +000088private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +000089 bool parseAngle() {
90 if (CurrentToken == NULL)
91 return false;
Daniel Jasper4e778092013-02-06 10:05:46 +000092 ScopedContextCreator ContextCreator(*this, 10);
Daniel Jasper32d28ee2013-01-29 21:01:14 +000093 AnnotatedToken *Left = CurrentToken->Parent;
Daniel Jasper4e778092013-02-06 10:05:46 +000094 Contexts.back().IsExpression = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000095 while (CurrentToken != NULL) {
96 if (CurrentToken->is(tok::greater)) {
97 Left->MatchingParen = CurrentToken;
98 CurrentToken->MatchingParen = Left;
99 CurrentToken->Type = TT_TemplateCloser;
100 next();
101 return true;
102 }
103 if (CurrentToken->is(tok::r_paren) || CurrentToken->is(tok::r_square) ||
104 CurrentToken->is(tok::r_brace))
105 return false;
106 if (CurrentToken->is(tok::pipepipe) || CurrentToken->is(tok::ampamp) ||
107 CurrentToken->is(tok::question) || CurrentToken->is(tok::colon))
108 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000109 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000110 if (!consumeToken())
111 return false;
112 }
113 return false;
114 }
115
116 bool parseParens(bool LookForDecls = false) {
117 if (CurrentToken == NULL)
118 return false;
Daniel Jasper4e778092013-02-06 10:05:46 +0000119 ScopedContextCreator ContextCreator(*this, 1);
120
121 // FIXME: This is a bit of a hack. Do better.
122 Contexts.back().ColonIsForRangeExpr =
123 Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
124
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000125 bool StartsObjCMethodExpr = false;
126 AnnotatedToken *Left = CurrentToken->Parent;
127 if (CurrentToken->is(tok::caret)) {
128 // ^( starts a block.
129 Left->Type = TT_ObjCBlockLParen;
130 } else if (AnnotatedToken *MaybeSel = Left->Parent) {
131 // @selector( starts a selector.
132 if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Parent &&
133 MaybeSel->Parent->is(tok::at)) {
134 StartsObjCMethodExpr = true;
135 }
136 }
137
Daniel Jasper4e778092013-02-06 10:05:46 +0000138 if (StartsObjCMethodExpr) {
139 Contexts.back().ColonIsObjCMethodExpr = true;
140 Left->Type = TT_ObjCMethodExpr;
141 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000142
143 while (CurrentToken != NULL) {
144 // LookForDecls is set when "if (" has been seen. Check for
145 // 'identifier' '*' 'identifier' followed by not '=' -- this
146 // '*' has to be a binary operator but determineStarAmpUsage() will
147 // categorize it as an unary operator, so set the right type here.
148 if (LookForDecls && !CurrentToken->Children.empty()) {
149 AnnotatedToken &Prev = *CurrentToken->Parent;
150 AnnotatedToken &Next = CurrentToken->Children[0];
151 if (Prev.Parent->is(tok::identifier) &&
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000152 (Prev.is(tok::star) || Prev.is(tok::amp) || Prev.is(tok::ampamp)) &&
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000153 CurrentToken->is(tok::identifier) && Next.isNot(tok::equal)) {
154 Prev.Type = TT_BinaryOperator;
155 LookForDecls = false;
156 }
157 }
158
159 if (CurrentToken->is(tok::r_paren)) {
160 Left->MatchingParen = CurrentToken;
161 CurrentToken->MatchingParen = Left;
162
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000163 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000164 CurrentToken->Type = TT_ObjCMethodExpr;
165 if (Contexts.back().FirstObjCSelectorName != NULL) {
166 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
167 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000168 }
169 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000170
171 next();
172 return true;
173 }
174 if (CurrentToken->is(tok::r_square) || CurrentToken->is(tok::r_brace))
175 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000176 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000177 if (!consumeToken())
178 return false;
179 }
180 return false;
181 }
182
183 bool parseSquare() {
184 if (!CurrentToken)
185 return false;
Daniel Jasper4e778092013-02-06 10:05:46 +0000186 ScopedContextCreator ContextCreator(*this, 10);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000187
188 // A '[' could be an index subscript (after an indentifier or after
Nico Weber051860e2013-02-10 02:08:05 +0000189 // ')' or ']'), it could be the start of an Objective-C method
190 // expression, or it could the the start of an Objective-C array literal.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000191 AnnotatedToken *Left = CurrentToken->Parent;
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000192 AnnotatedToken *Parent = getPreviousToken(*Left);
Daniel Jasper9c65b062013-02-27 11:43:50 +0000193 Contexts.back().IsExpression = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000194 bool StartsObjCMethodExpr =
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000195 !Parent || Parent->is(tok::colon) || Parent->is(tok::l_square) ||
196 Parent->is(tok::l_paren) || Parent->is(tok::kw_return) ||
197 Parent->is(tok::kw_throw) || isUnaryOperator(*Parent) ||
Nico Weber4c2cc602013-02-13 03:48:27 +0000198 Parent->Type == TT_ObjCForIn || Parent->Type == TT_CastRParen ||
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000199 getBinOpPrecedence(Parent->FormatTok.Tok.getKind(), true, true) >
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000200 prec::Unknown;
Nico Weber051860e2013-02-10 02:08:05 +0000201 bool StartsObjCArrayLiteral = Parent && Parent->is(tok::at);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000202
Daniel Jasper4e778092013-02-06 10:05:46 +0000203 if (StartsObjCMethodExpr) {
204 Contexts.back().ColonIsObjCMethodExpr = true;
205 Left->Type = TT_ObjCMethodExpr;
Nico Weber051860e2013-02-10 02:08:05 +0000206 } else if (StartsObjCArrayLiteral) {
207 Left->Type = TT_ObjCArrayLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000208 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000209
210 while (CurrentToken != NULL) {
211 if (CurrentToken->is(tok::r_square)) {
212 if (!CurrentToken->Children.empty() &&
213 CurrentToken->Children[0].is(tok::l_paren)) {
Nico Webere8a97982013-02-06 06:20:11 +0000214 // An ObjC method call is rarely followed by an open parenthesis.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000215 // FIXME: Do we incorrectly label ":" with this?
216 StartsObjCMethodExpr = false;
217 Left->Type = TT_Unknown;
218 }
Daniel Jasper01786732013-02-04 07:21:18 +0000219 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000220 CurrentToken->Type = TT_ObjCMethodExpr;
Nico Webere8a97982013-02-06 06:20:11 +0000221 // determineStarAmpUsage() thinks that '*' '[' is allocating an
222 // array of pointers, but if '[' starts a selector then '*' is a
223 // binary operator.
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000224 if (Parent != NULL && Parent->Type == TT_PointerOrReference)
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000225 Parent->Type = TT_BinaryOperator;
Nico Weber051860e2013-02-10 02:08:05 +0000226 } else if (StartsObjCArrayLiteral) {
227 CurrentToken->Type = TT_ObjCArrayLiteral;
Daniel Jasper01786732013-02-04 07:21:18 +0000228 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000229 Left->MatchingParen = CurrentToken;
230 CurrentToken->MatchingParen = Left;
Daniel Jasper4e778092013-02-06 10:05:46 +0000231 if (Contexts.back().FirstObjCSelectorName != NULL)
232 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
233 Contexts.back().LongestObjCSelectorName;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000234 next();
235 return true;
236 }
237 if (CurrentToken->is(tok::r_paren) || CurrentToken->is(tok::r_brace))
238 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000239 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000240 if (!consumeToken())
241 return false;
242 }
243 return false;
244 }
245
246 bool parseBrace() {
247 // Lines are fine to end with '{'.
248 if (CurrentToken == NULL)
249 return true;
Daniel Jasper4e778092013-02-06 10:05:46 +0000250 ScopedContextCreator ContextCreator(*this, 1);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000251 AnnotatedToken *Left = CurrentToken->Parent;
252 while (CurrentToken != NULL) {
253 if (CurrentToken->is(tok::r_brace)) {
254 Left->MatchingParen = CurrentToken;
255 CurrentToken->MatchingParen = Left;
256 next();
257 return true;
258 }
259 if (CurrentToken->is(tok::r_paren) || CurrentToken->is(tok::r_square))
260 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000261 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000262 if (!consumeToken())
263 return false;
264 }
265 return true;
266 }
Daniel Jasperc4615b72013-02-20 12:56:39 +0000267
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000268 void updateParameterCount(AnnotatedToken *Left, AnnotatedToken *Current) {
269 if (Current->is(tok::comma))
270 ++Left->ParameterCount;
271 else if (Left->ParameterCount == 0 && Current->isNot(tok::comment))
272 Left->ParameterCount = 1;
273 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000274
275 bool parseConditional() {
276 while (CurrentToken != NULL) {
277 if (CurrentToken->is(tok::colon)) {
278 CurrentToken->Type = TT_ConditionalExpr;
279 next();
280 return true;
281 }
282 if (!consumeToken())
283 return false;
284 }
285 return false;
286 }
287
288 bool parseTemplateDeclaration() {
289 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
290 CurrentToken->Type = TT_TemplateOpener;
291 next();
292 if (!parseAngle())
293 return false;
Daniel Jasper34511fb2013-02-19 17:14:38 +0000294 if (CurrentToken != NULL)
295 CurrentToken->Parent->ClosesTemplateDeclaration = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000296 return true;
297 }
298 return false;
299 }
300
301 bool consumeToken() {
302 AnnotatedToken *Tok = CurrentToken;
303 next();
304 switch (Tok->FormatTok.Tok.getKind()) {
305 case tok::plus:
306 case tok::minus:
307 // At the start of the line, +/- specific ObjectiveC method
308 // declarations.
309 if (Tok->Parent == NULL)
310 Tok->Type = TT_ObjCMethodSpecifier;
311 break;
312 case tok::colon:
313 // Colons from ?: are handled in parseConditional().
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000314 if (Tok->Parent->is(tok::r_paren)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000315 Tok->Type = TT_CtorInitializerColon;
Daniel Jasper4e778092013-02-06 10:05:46 +0000316 } else if (Contexts.back().ColonIsObjCMethodExpr ||
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000317 Line.First.Type == TT_ObjCMethodSpecifier) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000318 Tok->Type = TT_ObjCMethodExpr;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000319 Tok->Parent->Type = TT_ObjCSelectorName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000320 if (Tok->Parent->FormatTok.TokenLength >
321 Contexts.back().LongestObjCSelectorName)
322 Contexts.back().LongestObjCSelectorName =
323 Tok->Parent->FormatTok.TokenLength;
324 if (Contexts.back().FirstObjCSelectorName == NULL)
325 Contexts.back().FirstObjCSelectorName = Tok->Parent;
326 } else if (Contexts.back().ColonIsForRangeExpr) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000327 Tok->Type = TT_RangeBasedForLoopColon;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000328 } else if (Contexts.size() == 1) {
329 Tok->Type = TT_InheritanceColon;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000330 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000331 break;
332 case tok::kw_if:
333 case tok::kw_while:
334 if (CurrentToken != NULL && CurrentToken->is(tok::l_paren)) {
335 next();
336 if (!parseParens(/*LookForDecls=*/ true))
337 return false;
338 }
339 break;
340 case tok::kw_for:
Daniel Jasper4e778092013-02-06 10:05:46 +0000341 Contexts.back().ColonIsForRangeExpr = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000342 next();
343 if (!parseParens())
344 return false;
345 break;
346 case tok::l_paren:
347 if (!parseParens())
348 return false;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000349 if (Line.MustBeDeclaration)
350 Line.MightBeFunctionDecl = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000351 break;
352 case tok::l_square:
353 if (!parseSquare())
354 return false;
355 break;
356 case tok::l_brace:
357 if (!parseBrace())
358 return false;
359 break;
360 case tok::less:
361 if (parseAngle())
362 Tok->Type = TT_TemplateOpener;
363 else {
364 Tok->Type = TT_BinaryOperator;
365 CurrentToken = Tok;
366 next();
367 }
368 break;
369 case tok::r_paren:
370 case tok::r_square:
371 return false;
372 case tok::r_brace:
373 // Lines can start with '}'.
374 if (Tok->Parent != NULL)
375 return false;
376 break;
377 case tok::greater:
378 Tok->Type = TT_BinaryOperator;
379 break;
380 case tok::kw_operator:
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000381 while (CurrentToken && CurrentToken->isNot(tok::l_paren)) {
382 if (CurrentToken->is(tok::star) || CurrentToken->is(tok::amp))
383 CurrentToken->Type = TT_PointerOrReference;
384 consumeToken();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000385 }
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000386 if (CurrentToken)
387 CurrentToken->Type = TT_OverloadedOperatorLParen;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000388 break;
389 case tok::question:
390 parseConditional();
391 break;
392 case tok::kw_template:
393 parseTemplateDeclaration();
394 break;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000395 case tok::identifier:
396 if (Line.First.is(tok::kw_for) &&
397 Tok->FormatTok.Tok.getIdentifierInfo() == &Ident_in)
398 Tok->Type = TT_ObjCForIn;
399 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000400 default:
401 break;
402 }
403 return true;
404 }
405
406 void parseIncludeDirective() {
407 next();
408 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
409 next();
410 while (CurrentToken != NULL) {
411 if (CurrentToken->isNot(tok::comment) ||
412 !CurrentToken->Children.empty())
413 CurrentToken->Type = TT_ImplicitStringLiteral;
414 next();
415 }
416 } else {
417 while (CurrentToken != NULL) {
Daniel Jasper3a204412013-02-23 07:46:38 +0000418 if (CurrentToken->is(tok::string_literal))
419 // Mark these string literals as "implicit" literals, too, so that
420 // they are not split or line-wrapped.
421 CurrentToken->Type = TT_ImplicitStringLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000422 next();
423 }
424 }
425 }
426
427 void parseWarningOrError() {
428 next();
429 // We still want to format the whitespace left of the first token of the
430 // warning or error.
431 next();
432 while (CurrentToken != NULL) {
433 CurrentToken->Type = TT_ImplicitStringLiteral;
434 next();
435 }
436 }
437
438 void parsePreprocessorDirective() {
439 next();
440 if (CurrentToken == NULL)
441 return;
442 // Hashes in the middle of a line can lead to any strange token
443 // sequence.
444 if (CurrentToken->FormatTok.Tok.getIdentifierInfo() == NULL)
445 return;
446 switch (CurrentToken->FormatTok.Tok.getIdentifierInfo()->getPPKeywordID()) {
447 case tok::pp_include:
448 case tok::pp_import:
449 parseIncludeDirective();
450 break;
451 case tok::pp_error:
452 case tok::pp_warning:
453 parseWarningOrError();
454 break;
455 default:
456 break;
457 }
Daniel Jasper5b7e7b02013-02-05 09:34:14 +0000458 while (CurrentToken != NULL)
459 next();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000460 }
461
Nico Weber95e8e462013-02-12 16:17:07 +0000462public:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000463 LineType parseLine() {
464 int PeriodsAndArrows = 0;
Daniel Jasper24849712013-03-01 16:48:32 +0000465 AnnotatedToken *LastPeriodOrArrow = NULL;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000466 bool CanBeBuilderTypeStmt = true;
467 if (CurrentToken->is(tok::hash)) {
468 parsePreprocessorDirective();
469 return LT_PreprocessorDirective;
470 }
471 while (CurrentToken != NULL) {
472 if (CurrentToken->is(tok::kw_virtual))
473 KeywordVirtualFound = true;
Daniel Jasper24849712013-03-01 16:48:32 +0000474 if (CurrentToken->is(tok::period) || CurrentToken->is(tok::arrow)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000475 ++PeriodsAndArrows;
Daniel Jasper24849712013-03-01 16:48:32 +0000476 LastPeriodOrArrow = CurrentToken;
477 }
Daniel Jasper4a544e52013-02-15 20:33:06 +0000478 AnnotatedToken *TheToken = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000479 if (!consumeToken())
480 return LT_Invalid;
Daniel Jasper4a544e52013-02-15 20:33:06 +0000481 if (getPrecedence(*TheToken) > prec::Assignment &&
Daniel Jasper82282dc2013-02-18 13:52:06 +0000482 TheToken->Type == TT_BinaryOperator)
Daniel Jasper4a544e52013-02-15 20:33:06 +0000483 CanBeBuilderTypeStmt = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000484 }
485 if (KeywordVirtualFound)
486 return LT_VirtualFunctionDecl;
487
488 // Assume a builder-type call if there are 2 or more "." and "->".
Daniel Jasper24849712013-03-01 16:48:32 +0000489 if (PeriodsAndArrows >= 2 && CanBeBuilderTypeStmt) {
490 LastPeriodOrArrow->LastInChainOfCalls = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000491 return LT_BuilderTypeCall;
Daniel Jasper24849712013-03-01 16:48:32 +0000492 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000493
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000494 if (Line.First.Type == TT_ObjCMethodSpecifier) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000495 if (Contexts.back().FirstObjCSelectorName != NULL)
496 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
497 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000498 return LT_ObjCMethodDecl;
499 }
500
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000501 return LT_Other;
502 }
503
Nico Weber95e8e462013-02-12 16:17:07 +0000504private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000505 void next() {
Daniel Jasper01786732013-02-04 07:21:18 +0000506 if (CurrentToken != NULL) {
507 determineTokenType(*CurrentToken);
Daniel Jasper4e778092013-02-06 10:05:46 +0000508 CurrentToken->BindingStrength = Contexts.back().BindingStrength;
Daniel Jasper01786732013-02-04 07:21:18 +0000509 }
510
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000511 if (CurrentToken != NULL && !CurrentToken->Children.empty())
512 CurrentToken = &CurrentToken->Children[0];
513 else
514 CurrentToken = NULL;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000515
516 // Reset token type in case we have already looked at it and then recovered
517 // from an error (e.g. failure to find the matching >).
518 if (CurrentToken != NULL)
519 CurrentToken->Type = TT_Unknown;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000520 }
521
Daniel Jasper4e778092013-02-06 10:05:46 +0000522 /// \brief A struct to hold information valid in a specific context, e.g.
523 /// a pair of parenthesis.
524 struct Context {
525 Context(unsigned BindingStrength, bool IsExpression)
526 : BindingStrength(BindingStrength), LongestObjCSelectorName(0),
527 ColonIsForRangeExpr(false), ColonIsObjCMethodExpr(false),
Daniel Jasper3c08a812013-02-24 18:54:32 +0000528 FirstObjCSelectorName(NULL), IsExpression(IsExpression) {}
Daniel Jasper01786732013-02-04 07:21:18 +0000529
Daniel Jasper4e778092013-02-06 10:05:46 +0000530 unsigned BindingStrength;
531 unsigned LongestObjCSelectorName;
532 bool ColonIsForRangeExpr;
533 bool ColonIsObjCMethodExpr;
534 AnnotatedToken *FirstObjCSelectorName;
535 bool IsExpression;
Daniel Jasper4e778092013-02-06 10:05:46 +0000536 };
537
538 /// \brief Puts a new \c Context onto the stack \c Contexts for the lifetime
539 /// of each instance.
540 struct ScopedContextCreator {
541 AnnotatingParser &P;
542
Daniel Jasperfc759082013-02-14 14:26:07 +0000543 ScopedContextCreator(AnnotatingParser &P, unsigned Increase) : P(P) {
544 P.Contexts.push_back(Context(P.Contexts.back().BindingStrength + Increase,
545 P.Contexts.back().IsExpression));
Daniel Jasper4e778092013-02-06 10:05:46 +0000546 }
547
548 ~ScopedContextCreator() { P.Contexts.pop_back(); }
549 };
Daniel Jasper01786732013-02-04 07:21:18 +0000550
551 void determineTokenType(AnnotatedToken &Current) {
552 if (getPrecedence(Current) == prec::Assignment) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000553 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000554 for (AnnotatedToken *Previous = Current.Parent;
555 Previous && Previous->isNot(tok::comma);
556 Previous = Previous->Parent) {
Daniel Jasper9c65b062013-02-27 11:43:50 +0000557 if (Previous->is(tok::r_square))
558 Previous = Previous->MatchingParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000559 if (Previous->Type == TT_BinaryOperator &&
560 (Previous->is(tok::star) || Previous->is(tok::amp))) {
561 Previous->Type = TT_PointerOrReference;
562 }
Daniel Jasper01786732013-02-04 07:21:18 +0000563 }
Nico Weber95e8e462013-02-12 16:17:07 +0000564 } else if (Current.is(tok::kw_return) || Current.is(tok::kw_throw) ||
565 (Current.is(tok::l_paren) && !Line.MustBeDeclaration &&
566 (!Current.Parent || Current.Parent->isNot(tok::kw_for)))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000567 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000568 } else if (Current.is(tok::r_paren) || Current.is(tok::greater) ||
569 Current.is(tok::comma)) {
570 for (AnnotatedToken *Previous = Current.Parent;
571 Previous && (Previous->is(tok::star) || Previous->is(tok::amp));
572 Previous = Previous->Parent)
573 Previous->Type = TT_PointerOrReference;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000574 } else if (Current.Parent &&
575 Current.Parent->Type == TT_CtorInitializerColon) {
576 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000577 }
Daniel Jasper01786732013-02-04 07:21:18 +0000578
579 if (Current.Type == TT_Unknown) {
Daniel Jasper3c08a812013-02-24 18:54:32 +0000580 if (Current.Parent && Current.is(tok::identifier) &&
581 ((Current.Parent->is(tok::identifier) &&
582 Current.Parent->FormatTok.Tok.getIdentifierInfo()
583 ->getPPKeywordID() == tok::pp_not_keyword) ||
584 Current.Parent->Type == TT_PointerOrReference ||
585 Current.Parent->Type == TT_TemplateCloser)) {
586 Current.Type = TT_StartOfName;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000587 } else if (Current.is(tok::star) || Current.is(tok::amp) ||
588 Current.is(tok::ampamp)) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000589 Current.Type =
590 determineStarAmpUsage(Current, Contexts.back().IsExpression);
Daniel Jasper01786732013-02-04 07:21:18 +0000591 } else if (Current.is(tok::minus) || Current.is(tok::plus) ||
592 Current.is(tok::caret)) {
593 Current.Type = determinePlusMinusCaretUsage(Current);
594 } else if (Current.is(tok::minusminus) || Current.is(tok::plusplus)) {
595 Current.Type = determineIncrementUsage(Current);
596 } else if (Current.is(tok::exclaim)) {
597 Current.Type = TT_UnaryOperator;
598 } else if (isBinaryOperator(Current)) {
599 Current.Type = TT_BinaryOperator;
600 } else if (Current.is(tok::comment)) {
601 std::string Data(Lexer::getSpelling(Current.FormatTok.Tok, SourceMgr,
602 Lex.getLangOpts()));
603 if (StringRef(Data).startswith("//"))
604 Current.Type = TT_LineComment;
605 else
606 Current.Type = TT_BlockComment;
Nico Weber37d69312013-02-13 04:13:13 +0000607 } else if (Current.is(tok::r_paren)) {
Daniel Jasper03628b82013-02-19 20:05:41 +0000608 bool ParensNotExpr = !Current.Parent ||
609 Current.Parent->Type == TT_PointerOrReference ||
Nico Weber37d69312013-02-13 04:13:13 +0000610 Current.Parent->Type == TT_TemplateCloser;
611 bool ParensCouldEndDecl =
612 !Current.Children.empty() && (Current.Children[0].is(tok::equal) ||
613 Current.Children[0].is(tok::semi) ||
614 Current.Children[0].is(tok::l_brace));
Daniel Jasper37eff832013-02-23 08:07:18 +0000615 if (ParensNotExpr && !ParensCouldEndDecl &&
616 Contexts.back().IsExpression)
Nico Weber37d69312013-02-13 04:13:13 +0000617 // FIXME: We need to get smarter and understand more cases of casts.
618 Current.Type = TT_CastRParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000619 } else if (Current.is(tok::at) && Current.Children.size()) {
620 switch (Current.Children[0].FormatTok.Tok.getObjCKeywordID()) {
621 case tok::objc_interface:
622 case tok::objc_implementation:
623 case tok::objc_protocol:
624 Current.Type = TT_ObjCDecl;
625 break;
626 case tok::objc_property:
627 Current.Type = TT_ObjCProperty;
628 break;
629 default:
630 break;
631 }
632 }
633 }
634 }
635
Daniel Jasper01786732013-02-04 07:21:18 +0000636 /// \brief Return the type of the given token assuming it is * or &.
637 TokenType
638 determineStarAmpUsage(const AnnotatedToken &Tok, bool IsExpression) {
639 const AnnotatedToken *PrevToken = getPreviousToken(Tok);
640 if (PrevToken == NULL)
641 return TT_UnaryOperator;
642
643 const AnnotatedToken *NextToken = getNextToken(Tok);
644 if (NextToken == NULL)
645 return TT_Unknown;
646
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +0000647 if (PrevToken->is(tok::l_paren) && !IsExpression)
648 return TT_PointerOrReference;
649
Daniel Jasper01786732013-02-04 07:21:18 +0000650 if (PrevToken->is(tok::l_paren) || PrevToken->is(tok::l_square) ||
651 PrevToken->is(tok::l_brace) || PrevToken->is(tok::comma) ||
652 PrevToken->is(tok::kw_return) || PrevToken->is(tok::colon) ||
Nico Webere8a97982013-02-06 06:20:11 +0000653 PrevToken->is(tok::equal) || PrevToken->Type == TT_BinaryOperator ||
Daniel Jasper01786732013-02-04 07:21:18 +0000654 PrevToken->Type == TT_UnaryOperator || PrevToken->Type == TT_CastRParen)
655 return TT_UnaryOperator;
656
Nico Webere8a97982013-02-06 06:20:11 +0000657 if (NextToken->is(tok::l_square))
658 return TT_PointerOrReference;
659
Daniel Jasper01786732013-02-04 07:21:18 +0000660 if (PrevToken->FormatTok.Tok.isLiteral() || PrevToken->is(tok::r_paren) ||
661 PrevToken->is(tok::r_square) || NextToken->FormatTok.Tok.isLiteral() ||
Nico Weberee0feec2013-02-05 16:21:00 +0000662 isUnaryOperator(*NextToken) || NextToken->is(tok::l_paren) ||
663 NextToken->is(tok::l_square))
Daniel Jasper01786732013-02-04 07:21:18 +0000664 return TT_BinaryOperator;
665
Daniel Jasper01786732013-02-04 07:21:18 +0000666 // It is very unlikely that we are going to find a pointer or reference type
667 // definition on the RHS of an assignment.
668 if (IsExpression)
669 return TT_BinaryOperator;
670
671 return TT_PointerOrReference;
672 }
673
674 TokenType determinePlusMinusCaretUsage(const AnnotatedToken &Tok) {
675 const AnnotatedToken *PrevToken = getPreviousToken(Tok);
676 if (PrevToken == NULL)
677 return TT_UnaryOperator;
678
679 // Use heuristics to recognize unary operators.
680 if (PrevToken->is(tok::equal) || PrevToken->is(tok::l_paren) ||
681 PrevToken->is(tok::comma) || PrevToken->is(tok::l_square) ||
682 PrevToken->is(tok::question) || PrevToken->is(tok::colon) ||
683 PrevToken->is(tok::kw_return) || PrevToken->is(tok::kw_case) ||
684 PrevToken->is(tok::at) || PrevToken->is(tok::l_brace))
685 return TT_UnaryOperator;
686
Nico Weberee0feec2013-02-05 16:21:00 +0000687 // There can't be two consecutive binary operators.
Daniel Jasper01786732013-02-04 07:21:18 +0000688 if (PrevToken->Type == TT_BinaryOperator)
689 return TT_UnaryOperator;
690
691 // Fall back to marking the token as binary operator.
692 return TT_BinaryOperator;
693 }
694
695 /// \brief Determine whether ++/-- are pre- or post-increments/-decrements.
696 TokenType determineIncrementUsage(const AnnotatedToken &Tok) {
697 const AnnotatedToken *PrevToken = getPreviousToken(Tok);
698 if (PrevToken == NULL)
699 return TT_UnaryOperator;
700 if (PrevToken->is(tok::r_paren) || PrevToken->is(tok::r_square) ||
701 PrevToken->is(tok::identifier))
702 return TT_TrailingUnaryOperator;
703
704 return TT_UnaryOperator;
705 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000706
707 SmallVector<Context, 8> Contexts;
708
709 SourceManager &SourceMgr;
710 Lexer &Lex;
711 AnnotatedLine &Line;
712 AnnotatedToken *CurrentToken;
713 bool KeywordVirtualFound;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000714 IdentifierInfo &Ident_in;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000715};
716
Daniel Jasper29f123b2013-02-08 15:28:42 +0000717/// \brief Parses binary expressions by inserting fake parenthesis based on
718/// operator precedence.
719class ExpressionParser {
720public:
721 ExpressionParser(AnnotatedLine &Line) : Current(&Line.First) {}
722
/// \brief Parse expressions with the given operator precedence.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000724 void parse(int Precedence = 0) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000725 if (Precedence > prec::PointerToMember || Current == NULL)
726 return;
727
728 // Skip over "return" until we can properly parse it.
729 if (Current->is(tok::kw_return))
730 next();
731
732 // Eagerly consume trailing comments.
733 while (isTrailingComment(Current)) {
734 next();
735 }
736
737 AnnotatedToken *Start = Current;
738 bool OperatorFound = false;
739
Daniel Jasper237d4c12013-02-23 21:01:55 +0000740 while (Current) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000741 // Consume operators with higher precedence.
Dmitri Gribenko6ba52aa2013-02-16 20:03:26 +0000742 parse(prec::Level(Precedence + 1));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000743
Daniel Jasper237d4c12013-02-23 21:01:55 +0000744 int CurrentPrecedence = 0;
745 if (Current) {
746 if (Current->Type == TT_ConditionalExpr)
747 CurrentPrecedence = 1 + (int) prec::Conditional;
748 else if (Current->is(tok::semi))
749 CurrentPrecedence = 1;
750 else if (Current->Type == TT_BinaryOperator || Current->is(tok::comma))
751 CurrentPrecedence = 1 + (int) getPrecedence(*Current);
752 }
753
Daniel Jasper29f123b2013-02-08 15:28:42 +0000754 // At the end of the line or when an operator with higher precedence is
755 // found, insert fake parenthesis and return.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000756 if (Current == NULL || closesScope(*Current) ||
757 (CurrentPrecedence != 0 && CurrentPrecedence < Precedence)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000758 if (OperatorFound) {
759 ++Start->FakeLParens;
Daniel Jasper237d4c12013-02-23 21:01:55 +0000760 if (Current)
Daniel Jasper087387a2013-02-08 16:49:27 +0000761 ++Current->Parent->FakeRParens;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000762 }
763 return;
764 }
765
766 // Consume scopes: (), [], <> and {}
767 if (opensScope(*Current)) {
Daniel Jasper237d4c12013-02-23 21:01:55 +0000768 AnnotatedToken *Left = Current;
769 while (Current && !closesScope(*Current)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000770 next();
771 parse();
772 }
Daniel Jasper237d4c12013-02-23 21:01:55 +0000773 // Remove fake parens that just duplicate the real parens.
774 if (Current && Left->Children[0].FakeLParens > 0 &&
775 Current->Parent->FakeRParens > 0) {
776 --Left->Children[0].FakeLParens;
777 --Current->Parent->FakeRParens;
778 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000779 next();
780 } else {
781 // Operator found.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000782 if (CurrentPrecedence == Precedence)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000783 OperatorFound = true;
784
785 next();
786 }
787 }
788 }
789
790private:
791 void next() {
792 if (Current != NULL)
793 Current = Current->Children.empty() ? NULL : &Current->Children[0];
794 }
795
796 bool closesScope(const AnnotatedToken &Tok) {
797 return Current->is(tok::r_paren) || Current->Type == TT_TemplateCloser ||
798 Current->is(tok::r_brace) || Current->is(tok::r_square);
799 }
800
801 bool opensScope(const AnnotatedToken &Tok) {
802 return Current->is(tok::l_paren) || Current->Type == TT_TemplateOpener ||
803 Current->is(tok::l_brace) || Current->is(tok::l_square);
804 }
805
806 AnnotatedToken *Current;
807};
808
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000809void TokenAnnotator::annotate(AnnotatedLine &Line) {
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000810 AnnotatingParser Parser(SourceMgr, Lex, Line, Ident_in);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000811 Line.Type = Parser.parseLine();
812 if (Line.Type == LT_Invalid)
813 return;
814
Daniel Jasper29f123b2013-02-08 15:28:42 +0000815 ExpressionParser ExprParser(Line);
816 ExprParser.parse();
817
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000818 if (Line.First.Type == TT_ObjCMethodSpecifier)
819 Line.Type = LT_ObjCMethodDecl;
820 else if (Line.First.Type == TT_ObjCDecl)
821 Line.Type = LT_ObjCDecl;
822 else if (Line.First.Type == TT_ObjCProperty)
823 Line.Type = LT_ObjCProperty;
824
Daniel Jasper729a7432013-02-11 12:36:37 +0000825 Line.First.SpacesRequiredBefore = 1;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000826 Line.First.MustBreakBefore = Line.First.FormatTok.MustBreakBefore;
827 Line.First.CanBreakBefore = Line.First.MustBreakBefore;
828
829 Line.First.TotalLength = Line.First.FormatTok.TokenLength;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000830}
831
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000832void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
833 if (Line.First.Children.empty())
834 return;
835 AnnotatedToken *Current = &Line.First.Children[0];
836 while (Current != NULL) {
Daniel Jasper729a7432013-02-11 12:36:37 +0000837 if (Current->Type == TT_LineComment)
838 Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
839 else
840 Current->SpacesRequiredBefore =
841 spaceRequiredBefore(Line, *Current) ? 1 : 0;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000842
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000843 if (Current->FormatTok.MustBreakBefore) {
844 Current->MustBreakBefore = true;
845 } else if (Current->Type == TT_LineComment) {
846 Current->MustBreakBefore = Current->FormatTok.NewlinesBefore > 0;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000847 } else if (isTrailingComment(Current->Parent) ||
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000848 (Current->is(tok::string_literal) &&
849 Current->Parent->is(tok::string_literal))) {
850 Current->MustBreakBefore = true;
851 } else if (Current->is(tok::lessless) && !Current->Children.empty() &&
852 Current->Parent->is(tok::string_literal) &&
853 Current->Children[0].is(tok::string_literal)) {
854 Current->MustBreakBefore = true;
855 } else {
856 Current->MustBreakBefore = false;
857 }
858 Current->CanBreakBefore =
859 Current->MustBreakBefore || canBreakBefore(Line, *Current);
860 if (Current->MustBreakBefore)
861 Current->TotalLength = Current->Parent->TotalLength + Style.ColumnLimit;
862 else
863 Current->TotalLength =
864 Current->Parent->TotalLength + Current->FormatTok.TokenLength +
Daniel Jasper729a7432013-02-11 12:36:37 +0000865 Current->SpacesRequiredBefore;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000866 // FIXME: Only calculate this if CanBreakBefore is true once static
867 // initializers etc. are sorted out.
868 // FIXME: Move magic numbers to a better place.
869 Current->SplitPenalty =
870 20 * Current->BindingStrength + splitPenalty(Line, *Current);
871
872 Current = Current->Children.empty() ? NULL : &Current->Children[0];
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000873 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000874}
875
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000876unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
877 const AnnotatedToken &Tok) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000878 const AnnotatedToken &Left = *Tok.Parent;
879 const AnnotatedToken &Right = Tok;
880
Daniel Jasper3c08a812013-02-24 18:54:32 +0000881 if (Right.Type == TT_StartOfName) {
882 if (Line.First.is(tok::kw_for))
883 return 3;
884 else if (Line.MightBeFunctionDecl && Right.BindingStrength == 1)
885 // FIXME: Clean up hack of using BindingStrength to find top-level names.
886 return Style.PenaltyReturnTypeOnItsOwnLine;
887 else
888 return 100;
889 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000890 if (Left.is(tok::equal) && Right.is(tok::l_brace))
891 return 150;
892 if (Left.is(tok::coloncolon))
893 return 500;
894
Daniel Jasper6cabab42013-02-14 08:42:54 +0000895 if (Left.Type == TT_RangeBasedForLoopColon ||
896 Left.Type == TT_InheritanceColon)
Daniel Jasper84a1a632013-02-26 13:18:08 +0000897 return 2;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000898
899 if (Right.is(tok::arrow) || Right.is(tok::period)) {
Daniel Jasper515f65d2013-02-18 13:24:21 +0000900 if (Line.Type == LT_BuilderTypeCall)
Daniel Jasper518ee342013-02-26 13:59:14 +0000901 return 5;
Daniel Jasperfc759082013-02-14 14:26:07 +0000902 if ((Left.is(tok::r_paren) || Left.is(tok::r_square)) &&
903 Left.MatchingParen && Left.MatchingParen->ParameterCount > 0)
Daniel Jasper518ee342013-02-26 13:59:14 +0000904 return 20; // Should be smaller than breaking at a nested comma.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000905 return 150;
906 }
907
908 // In for-loops, prefer breaking at ',' and ';'.
Daniel Jasper7d812812013-02-21 15:00:29 +0000909 if (Line.First.is(tok::kw_for) && Left.is(tok::equal))
910 return 4;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000911
Daniel Jasper8159d2f2013-02-04 07:30:30 +0000912 if (Left.is(tok::semi))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000913 return 0;
Daniel Jasper8159d2f2013-02-04 07:30:30 +0000914 if (Left.is(tok::comma))
915 return 1;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000916
917 // In Objective-C method expressions, prefer breaking before "param:" over
918 // breaking after it.
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000919 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000920 return 0;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000921 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000922 return 20;
923
Daniel Jasper01786732013-02-04 07:21:18 +0000924 if (Left.is(tok::l_paren) || Left.is(tok::l_square) ||
Daniel Jasper25e81b22013-02-28 15:04:12 +0000925 Left.is(tok::l_brace) || Left.Type == TT_TemplateOpener)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000926 return 20;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000927
Daniel Jasper4e8a7b42013-02-06 21:04:05 +0000928 if (Right.is(tok::lessless)) {
929 if (Left.is(tok::string_literal)) {
930 char LastChar =
931 StringRef(Left.FormatTok.Tok.getLiteralData(),
932 Left.FormatTok.TokenLength).drop_back(1).rtrim().back();
933 if (LastChar == ':' || LastChar == '=')
934 return 100;
935 }
Daniel Jasper01786732013-02-04 07:21:18 +0000936 return prec::Shift;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +0000937 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000938 if (Left.Type == TT_ConditionalExpr)
Daniel Jasper518ee342013-02-26 13:59:14 +0000939 return prec::Conditional;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000940 prec::Level Level = getPrecedence(Left);
941
942 if (Level != prec::Unknown)
943 return Level;
Daniel Jasper24849712013-03-01 16:48:32 +0000944
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000945 return 3;
946}
947
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000948bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
949 const AnnotatedToken &Left,
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000950 const AnnotatedToken &Right) {
951 if (Right.is(tok::hashhash))
952 return Left.is(tok::hash);
953 if (Left.is(tok::hashhash) || Left.is(tok::hash))
954 return Right.is(tok::hash);
955 if (Right.is(tok::r_paren) || Right.is(tok::semi) || Right.is(tok::comma))
956 return false;
957 if (Right.is(tok::less) &&
958 (Left.is(tok::kw_template) ||
959 (Line.Type == LT_ObjCDecl && Style.ObjCSpaceBeforeProtocolList)))
960 return true;
961 if (Left.is(tok::arrow) || Right.is(tok::arrow))
962 return false;
963 if (Left.is(tok::exclaim) || Left.is(tok::tilde))
964 return false;
965 if (Left.is(tok::at) &&
966 (Right.is(tok::identifier) || Right.is(tok::string_literal) ||
967 Right.is(tok::char_constant) || Right.is(tok::numeric_constant) ||
968 Right.is(tok::l_paren) || Right.is(tok::l_brace) ||
969 Right.is(tok::kw_true) || Right.is(tok::kw_false)))
970 return false;
971 if (Left.is(tok::coloncolon))
972 return false;
973 if (Right.is(tok::coloncolon))
Daniel Jasperdaf1a152013-02-07 21:08:36 +0000974 return Left.isNot(tok::identifier) && Left.isNot(tok::greater) &&
975 Left.isNot(tok::l_paren);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000976 if (Left.is(tok::less) || Right.is(tok::greater) || Right.is(tok::less))
977 return false;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000978 if (Right.Type == TT_PointerOrReference)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000979 return Left.FormatTok.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000980 ((Left.Type != TT_PointerOrReference) && Left.isNot(tok::l_paren) &&
981 !Style.PointerBindsToType);
982 if (Left.Type == TT_PointerOrReference)
Nico Weber95e8e462013-02-12 16:17:07 +0000983 return Right.FormatTok.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000984 ((Right.Type != TT_PointerOrReference) && Style.PointerBindsToType);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000985 if (Right.is(tok::star) && Left.is(tok::l_paren))
986 return false;
Nico Weber051860e2013-02-10 02:08:05 +0000987 if (Left.is(tok::l_square))
988 return Left.Type == TT_ObjCArrayLiteral && Right.isNot(tok::r_square);
989 if (Right.is(tok::r_square))
990 return Right.Type == TT_ObjCArrayLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000991 if (Right.is(tok::l_square) && Right.Type != TT_ObjCMethodExpr)
992 return false;
993 if (Left.is(tok::period) || Right.is(tok::period))
994 return false;
995 if (Left.is(tok::colon))
996 return Left.Type != TT_ObjCMethodExpr;
997 if (Right.is(tok::colon))
998 return Right.Type != TT_ObjCMethodExpr;
999 if (Left.is(tok::l_paren))
1000 return false;
1001 if (Right.is(tok::l_paren)) {
1002 return Line.Type == LT_ObjCDecl || Left.is(tok::kw_if) ||
1003 Left.is(tok::kw_for) || Left.is(tok::kw_while) ||
1004 Left.is(tok::kw_switch) || Left.is(tok::kw_return) ||
1005 Left.is(tok::kw_catch) || Left.is(tok::kw_new) ||
1006 Left.is(tok::kw_delete);
1007 }
1008 if (Left.is(tok::at) &&
1009 Right.FormatTok.Tok.getObjCKeywordID() != tok::objc_not_keyword)
1010 return false;
1011 if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
1012 return false;
1013 return true;
1014}
1015
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001016bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
1017 const AnnotatedToken &Tok) {
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001018 if (Tok.FormatTok.Tok.getIdentifierInfo() &&
1019 Tok.Parent->FormatTok.Tok.getIdentifierInfo())
1020 return true; // Never ever merge two identifiers.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001021 if (Line.Type == LT_ObjCMethodDecl) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001022 if (Tok.Parent->Type == TT_ObjCMethodSpecifier)
1023 return true;
1024 if (Tok.Parent->is(tok::r_paren) && Tok.is(tok::identifier))
1025 // Don't space between ')' and <id>
1026 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001027 }
1028 if (Line.Type == LT_ObjCProperty &&
1029 (Tok.is(tok::equal) || Tok.Parent->is(tok::equal)))
1030 return false;
1031
1032 if (Tok.Parent->is(tok::comma))
1033 return true;
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001034 if (Tok.is(tok::comma))
1035 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001036 if (Tok.Type == TT_CtorInitializerColon || Tok.Type == TT_ObjCBlockLParen)
1037 return true;
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001038 if (Tok.Parent->FormatTok.Tok.is(tok::kw_operator))
1039 return false;
1040 if (Tok.Type == TT_OverloadedOperatorLParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001041 return false;
1042 if (Tok.is(tok::colon))
Daniel Jasper4ba9bfd2013-03-12 12:26:55 +00001043 return Line.First.isNot(tok::kw_case) &&
1044 Line.First.isNot(tok::kw_default) && !Tok.Children.empty() &&
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001045 Tok.Type != TT_ObjCMethodExpr;
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +00001046 if (Tok.is(tok::l_paren) && !Tok.Children.empty() &&
1047 Tok.Children[0].Type == TT_PointerOrReference &&
1048 !Tok.Children[0].Children.empty() &&
1049 Tok.Children[0].Children[0].isNot(tok::r_paren))
1050 return true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001051 if (Tok.Parent->Type == TT_UnaryOperator || Tok.Parent->Type == TT_CastRParen)
1052 return false;
1053 if (Tok.Type == TT_UnaryOperator)
1054 return Tok.Parent->isNot(tok::l_paren) &&
1055 Tok.Parent->isNot(tok::l_square) && Tok.Parent->isNot(tok::at) &&
1056 (Tok.Parent->isNot(tok::colon) ||
1057 Tok.Parent->Type != TT_ObjCMethodExpr);
1058 if (Tok.Parent->is(tok::greater) && Tok.is(tok::greater)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +00001059 return Tok.Type == TT_TemplateCloser &&
1060 Tok.Parent->Type == TT_TemplateCloser &&
1061 Style.Standard != FormatStyle::LS_Cpp11;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001062 }
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001063 if (Tok.is(tok::arrowstar) || Tok.Parent->is(tok::arrowstar))
1064 return false;
1065 if (Tok.Type == TT_BinaryOperator || Tok.Parent->Type == TT_BinaryOperator)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001066 return true;
1067 if (Tok.Parent->Type == TT_TemplateCloser && Tok.is(tok::l_paren))
1068 return false;
1069 if (Tok.is(tok::less) && Line.First.is(tok::hash))
1070 return true;
1071 if (Tok.Type == TT_TrailingUnaryOperator)
1072 return false;
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001073 return spaceRequiredBetween(Line, *Tok.Parent, Tok);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001074}
1075
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001076bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
1077 const AnnotatedToken &Right) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001078 const AnnotatedToken &Left = *Right.Parent;
Daniel Jaspera03ab102013-02-13 20:33:44 +00001079 if (Right.Type == TT_StartOfName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001080 return true;
1081 if (Right.is(tok::colon) && Right.Type == TT_ObjCMethodExpr)
1082 return false;
1083 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
1084 return true;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001085 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001086 return true;
1087 if (Left.ClosesTemplateDeclaration)
1088 return true;
1089 if (Right.Type == TT_ConditionalExpr || Right.is(tok::question))
1090 return true;
Daniel Jasper6cabab42013-02-14 08:42:54 +00001091 if (Right.Type == TT_RangeBasedForLoopColon ||
1092 Right.Type == TT_InheritanceColon)
1093 return false;
1094 if (Left.Type == TT_RangeBasedForLoopColon ||
1095 Left.Type == TT_InheritanceColon)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001096 return true;
Daniel Jasper7d812812013-02-21 15:00:29 +00001097 if (Right.Type == TT_RangeBasedForLoopColon)
1098 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001099 if (Left.Type == TT_PointerOrReference || Left.Type == TT_TemplateCloser ||
1100 Left.Type == TT_UnaryOperator || Left.Type == TT_ConditionalExpr ||
Daniel Jasperdc2efa12013-02-15 19:24:08 +00001101 Left.is(tok::question) || Left.is(tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001102 return false;
1103 if (Left.is(tok::equal) && Line.Type == LT_VirtualFunctionDecl)
1104 return false;
Daniel Jasper8ed41002013-02-28 14:44:25 +00001105 if (Left.is(tok::l_paren) && Right.is(tok::l_paren) && Left.Parent &&
1106 Left.Parent->is(tok::kw___attribute))
1107 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001108
1109 if (Right.Type == TT_LineComment)
1110 // We rely on MustBreakBefore being set correctly here as we should not
1111 // change the "binding" behavior of a comment.
1112 return false;
1113
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001114 // Allow breaking after a trailing 'const', e.g. after a method declaration,
1115 // unless it is follow by ';', '{' or '='.
1116 if (Left.is(tok::kw_const) && Left.Parent != NULL &&
1117 Left.Parent->is(tok::r_paren))
1118 return Right.isNot(tok::l_brace) && Right.isNot(tok::semi) &&
1119 Right.isNot(tok::equal);
1120
1121 // We only break before r_brace if there was a corresponding break before
1122 // the l_brace, which is tracked by BreakBeforeClosingBrace.
1123 if (Right.is(tok::r_brace))
1124 return false;
1125
1126 if (Right.is(tok::r_paren) || Right.is(tok::greater))
1127 return false;
Daniel Jasper3a204412013-02-23 07:46:38 +00001128 if (Left.is(tok::identifier) && Right.is(tok::string_literal))
1129 return true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001130 return (isBinaryOperator(Left) && Left.isNot(tok::lessless)) ||
1131 Left.is(tok::comma) || Right.is(tok::lessless) ||
1132 Right.is(tok::arrow) || Right.is(tok::period) ||
1133 Right.is(tok::colon) || Left.is(tok::coloncolon) ||
1134 Left.is(tok::semi) || Left.is(tok::l_brace) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001135 (Left.is(tok::r_paren) && Left.Type != TT_CastRParen &&
Daniel Jasper8ed41002013-02-28 14:44:25 +00001136 (Right.is(tok::identifier) || Right.is(tok::kw___attribute))) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001137 (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
1138 (Left.is(tok::l_square) && !Right.is(tok::r_square));
1139}
1140
1141} // namespace format
1142} // namespace clang