blob: 418025a7735b1153bef6abc43891a057ce2b6dd0 [file] [log] [blame]
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements a token annotator, i.e. creates
12/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
13///
14//===----------------------------------------------------------------------===//
15
16#include "TokenAnnotator.h"
17#include "clang/Basic/SourceManager.h"
Daniel Jasperbf71ba22013-04-08 20:33:42 +000018#include "llvm/Support/Debug.h"
Daniel Jasper32d28ee2013-01-29 21:01:14 +000019
20namespace clang {
21namespace format {
22
Craig Topper14e66492013-07-01 04:03:19 +000023namespace {
24
/// \brief A parser that gathers additional information about tokens.
///
/// The \c TokenAnnotator tries to match parentheses and square brackets and
/// to store the parenthesis levels. It also tries to resolve matching "<" and
/// ">" into template parameter lists.
30class AnnotatingParser {
31public:
Alexander Kornienko00895102013-06-05 14:09:10 +000032 AnnotatingParser(AnnotatedLine &Line, IdentifierInfo &Ident_in)
33 : Line(Line), CurrentToken(Line.First), KeywordVirtualFound(false),
34 NameFound(false), Ident_in(Ident_in) {
Nico Weber27268772013-06-26 00:30:14 +000035 Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/false));
Daniel Jasper32d28ee2013-01-29 21:01:14 +000036 }
37
Nico Weber95e8e462013-02-12 16:17:07 +000038private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +000039 bool parseAngle() {
40 if (CurrentToken == NULL)
41 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000042 ScopedContextCreator ContextCreator(*this, tok::less, 10);
Manuel Klimekb3987012013-05-29 14:47:47 +000043 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +000044 Contexts.back().IsExpression = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000045 while (CurrentToken != NULL) {
46 if (CurrentToken->is(tok::greater)) {
47 Left->MatchingParen = CurrentToken;
48 CurrentToken->MatchingParen = Left;
49 CurrentToken->Type = TT_TemplateCloser;
50 next();
51 return true;
52 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +000053 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace,
Daniel Jasper5d823e32013-05-15 13:46:48 +000054 tok::question, tok::colon))
55 return false;
Daniel Jasper0348be02013-06-01 18:56:00 +000056 // If a && or || is found and interpreted as a binary operator, this set
Daniel Jasper15f33f02013-06-03 16:16:41 +000057 // of angles is likely part of something like "a < b && c > d". If the
Daniel Jasper0348be02013-06-01 18:56:00 +000058 // angles are inside an expression, the ||/&& might also be a binary
59 // operator that was misinterpreted because we are parsing template
60 // parameters.
61 // FIXME: This is getting out of hand, write a decent parser.
Manuel Klimekb3987012013-05-29 14:47:47 +000062 if (CurrentToken->Previous->isOneOf(tok::pipepipe, tok::ampamp) &&
Daniel Jasper0348be02013-06-01 18:56:00 +000063 (CurrentToken->Previous->Type == TT_BinaryOperator ||
64 Contexts[Contexts.size() - 2].IsExpression) &&
Manuel Klimekb3987012013-05-29 14:47:47 +000065 Line.First->isNot(tok::kw_template))
Daniel Jasper32d28ee2013-01-29 21:01:14 +000066 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +000067 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +000068 if (!consumeToken())
69 return false;
70 }
71 return false;
72 }
73
74 bool parseParens(bool LookForDecls = false) {
75 if (CurrentToken == NULL)
76 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000077 ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
Daniel Jasper4e778092013-02-06 10:05:46 +000078
79 // FIXME: This is a bit of a hack. Do better.
80 Contexts.back().ColonIsForRangeExpr =
81 Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
82
Daniel Jasper32d28ee2013-01-29 21:01:14 +000083 bool StartsObjCMethodExpr = false;
Manuel Klimekb3987012013-05-29 14:47:47 +000084 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000085 if (CurrentToken->is(tok::caret)) {
86 // ^( starts a block.
87 Left->Type = TT_ObjCBlockLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +000088 } else if (FormatToken *MaybeSel = Left->Previous) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000089 // @selector( starts a selector.
Manuel Klimekb3987012013-05-29 14:47:47 +000090 if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Previous &&
91 MaybeSel->Previous->is(tok::at)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000092 StartsObjCMethodExpr = true;
93 }
94 }
95
Daniel Jasper4e778092013-02-06 10:05:46 +000096 if (StartsObjCMethodExpr) {
97 Contexts.back().ColonIsObjCMethodExpr = true;
98 Left->Type = TT_ObjCMethodExpr;
99 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000100
Daniel Jasper431f5912013-05-28 08:33:00 +0000101 bool MightBeFunctionType = CurrentToken->is(tok::star);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000102 while (CurrentToken != NULL) {
103 // LookForDecls is set when "if (" has been seen. Check for
104 // 'identifier' '*' 'identifier' followed by not '=' -- this
105 // '*' has to be a binary operator but determineStarAmpUsage() will
106 // categorize it as an unary operator, so set the right type here.
Manuel Klimekb3987012013-05-29 14:47:47 +0000107 if (LookForDecls && CurrentToken->Next) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000108 FormatToken *Prev = CurrentToken->getPreviousNonComment();
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000109 if (Prev) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000110 FormatToken *PrevPrev = Prev->getPreviousNonComment();
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000111 FormatToken *Next = CurrentToken->Next;
112 if (PrevPrev && PrevPrev->is(tok::identifier) &&
113 Prev->isOneOf(tok::star, tok::amp, tok::ampamp) &&
114 CurrentToken->is(tok::identifier) && Next->isNot(tok::equal)) {
115 Prev->Type = TT_BinaryOperator;
116 LookForDecls = false;
117 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000118 }
119 }
120
121 if (CurrentToken->is(tok::r_paren)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000122 if (MightBeFunctionType && CurrentToken->Next &&
123 CurrentToken->Next->isOneOf(tok::l_paren, tok::l_square))
Daniel Jasper431f5912013-05-28 08:33:00 +0000124 Left->Type = TT_FunctionTypeLParen;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000125 Left->MatchingParen = CurrentToken;
126 CurrentToken->MatchingParen = Left;
127
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000128 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000129 CurrentToken->Type = TT_ObjCMethodExpr;
130 if (Contexts.back().FirstObjCSelectorName != NULL) {
131 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
132 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000133 }
134 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000135
136 next();
137 return true;
138 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000139 if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000140 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +0000141 if (CurrentToken->Previous->Type == TT_PointerOrReference &&
142 CurrentToken->Previous->Previous->isOneOf(tok::l_paren,
143 tok::coloncolon))
Daniel Jasper431f5912013-05-28 08:33:00 +0000144 MightBeFunctionType = true;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000145 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000146 if (!consumeToken())
147 return false;
148 }
149 return false;
150 }
151
152 bool parseSquare() {
153 if (!CurrentToken)
154 return false;
155
Alexander Kornienkod71b15b2013-06-17 13:19:53 +0000156 // A '[' could be an index subscript (after an identifier or after
Nico Weber051860e2013-02-10 02:08:05 +0000157 // ')' or ']'), it could be the start of an Objective-C method
158 // expression, or it could the the start of an Objective-C array literal.
Manuel Klimekb3987012013-05-29 14:47:47 +0000159 FormatToken *Left = CurrentToken->Previous;
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000160 FormatToken *Parent = Left->getPreviousNonComment();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000161 bool StartsObjCMethodExpr =
Daniel Jasper6f21a982013-03-13 07:49:51 +0000162 Contexts.back().CanBeExpression &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000163 (!Parent || Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
164 tok::kw_return, tok::kw_throw) ||
Daniel Jasperac3223e2013-04-10 09:49:49 +0000165 Parent->isUnaryOperator() || Parent->Type == TT_ObjCForIn ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000166 Parent->Type == TT_CastRParen ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000167 getBinOpPrecedence(Parent->Tok.getKind(), true, true) > prec::Unknown);
Daniel Jasper923ebef2013-03-14 13:45:21 +0000168 ScopedContextCreator ContextCreator(*this, tok::l_square, 10);
Daniel Jasper6f21a982013-03-13 07:49:51 +0000169 Contexts.back().IsExpression = true;
Nico Weber051860e2013-02-10 02:08:05 +0000170 bool StartsObjCArrayLiteral = Parent && Parent->is(tok::at);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000171
Daniel Jasper4e778092013-02-06 10:05:46 +0000172 if (StartsObjCMethodExpr) {
173 Contexts.back().ColonIsObjCMethodExpr = true;
174 Left->Type = TT_ObjCMethodExpr;
Nico Weber051860e2013-02-10 02:08:05 +0000175 } else if (StartsObjCArrayLiteral) {
176 Left->Type = TT_ObjCArrayLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000177 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000178
179 while (CurrentToken != NULL) {
180 if (CurrentToken->is(tok::r_square)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000181 if (CurrentToken->Next && CurrentToken->Next->is(tok::l_paren)) {
Nico Webere8a97982013-02-06 06:20:11 +0000182 // An ObjC method call is rarely followed by an open parenthesis.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000183 // FIXME: Do we incorrectly label ":" with this?
184 StartsObjCMethodExpr = false;
185 Left->Type = TT_Unknown;
186 }
Daniel Jasper01786732013-02-04 07:21:18 +0000187 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000188 CurrentToken->Type = TT_ObjCMethodExpr;
Nico Webere8a97982013-02-06 06:20:11 +0000189 // determineStarAmpUsage() thinks that '*' '[' is allocating an
190 // array of pointers, but if '[' starts a selector then '*' is a
191 // binary operator.
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000192 if (Parent != NULL && Parent->Type == TT_PointerOrReference)
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000193 Parent->Type = TT_BinaryOperator;
Nico Weber051860e2013-02-10 02:08:05 +0000194 } else if (StartsObjCArrayLiteral) {
195 CurrentToken->Type = TT_ObjCArrayLiteral;
Daniel Jasper01786732013-02-04 07:21:18 +0000196 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000197 Left->MatchingParen = CurrentToken;
198 CurrentToken->MatchingParen = Left;
Daniel Jasper4e778092013-02-06 10:05:46 +0000199 if (Contexts.back().FirstObjCSelectorName != NULL)
200 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
201 Contexts.back().LongestObjCSelectorName;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000202 next();
203 return true;
204 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000205 if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000206 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000207 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000208 if (!consumeToken())
209 return false;
210 }
211 return false;
212 }
213
214 bool parseBrace() {
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000215 if (CurrentToken != NULL) {
216 ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
Manuel Klimekb3987012013-05-29 14:47:47 +0000217 FormatToken *Left = CurrentToken->Previous;
Nico Weberf2ff8122013-05-26 05:39:26 +0000218
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000219 FormatToken *Parent = Left->getPreviousNonComment();
Nico Weberf2ff8122013-05-26 05:39:26 +0000220 bool StartsObjCDictLiteral = Parent && Parent->is(tok::at);
221 if (StartsObjCDictLiteral) {
222 Contexts.back().ColonIsObjCDictLiteral = true;
223 Left->Type = TT_ObjCDictLiteral;
224 }
225
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000226 while (CurrentToken != NULL) {
227 if (CurrentToken->is(tok::r_brace)) {
Nico Weberf2ff8122013-05-26 05:39:26 +0000228 if (StartsObjCDictLiteral)
229 CurrentToken->Type = TT_ObjCDictLiteral;
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000230 Left->MatchingParen = CurrentToken;
231 CurrentToken->MatchingParen = Left;
232 next();
233 return true;
234 }
235 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
236 return false;
237 updateParameterCount(Left, CurrentToken);
238 if (!consumeToken())
239 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000240 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000241 }
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000242 // No closing "}" found, this probably starts a definition.
243 Line.StartsDefinition = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000244 return true;
245 }
Daniel Jasperc4615b72013-02-20 12:56:39 +0000246
Manuel Klimekb3987012013-05-29 14:47:47 +0000247 void updateParameterCount(FormatToken *Left, FormatToken *Current) {
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000248 if (Current->is(tok::comma))
249 ++Left->ParameterCount;
250 else if (Left->ParameterCount == 0 && Current->isNot(tok::comment))
251 Left->ParameterCount = 1;
252 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000253
254 bool parseConditional() {
255 while (CurrentToken != NULL) {
256 if (CurrentToken->is(tok::colon)) {
257 CurrentToken->Type = TT_ConditionalExpr;
258 next();
259 return true;
260 }
261 if (!consumeToken())
262 return false;
263 }
264 return false;
265 }
266
267 bool parseTemplateDeclaration() {
268 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
269 CurrentToken->Type = TT_TemplateOpener;
270 next();
271 if (!parseAngle())
272 return false;
Daniel Jasper34511fb2013-02-19 17:14:38 +0000273 if (CurrentToken != NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000274 CurrentToken->Previous->ClosesTemplateDeclaration = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000275 return true;
276 }
277 return false;
278 }
279
280 bool consumeToken() {
Manuel Klimekb3987012013-05-29 14:47:47 +0000281 FormatToken *Tok = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000282 next();
Manuel Klimekb3987012013-05-29 14:47:47 +0000283 switch (Tok->Tok.getKind()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000284 case tok::plus:
285 case tok::minus:
Manuel Klimekb3987012013-05-29 14:47:47 +0000286 if (Tok->Previous == NULL && Line.MustBeDeclaration)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000287 Tok->Type = TT_ObjCMethodSpecifier;
288 break;
289 case tok::colon:
Manuel Klimekb3987012013-05-29 14:47:47 +0000290 if (Tok->Previous == NULL)
Daniel Jaspercf6d76a2013-03-18 12:50:26 +0000291 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000292 // Colons from ?: are handled in parseConditional().
Manuel Klimekb3987012013-05-29 14:47:47 +0000293 if (Tok->Previous->is(tok::r_paren) && Contexts.size() == 1) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000294 Tok->Type = TT_CtorInitializerColon;
Nico Weberf2ff8122013-05-26 05:39:26 +0000295 } else if (Contexts.back().ColonIsObjCDictLiteral) {
296 Tok->Type = TT_ObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000297 } else if (Contexts.back().ColonIsObjCMethodExpr ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000298 Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000299 Tok->Type = TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000300 Tok->Previous->Type = TT_ObjCSelectorName;
Alexander Kornienko00895102013-06-05 14:09:10 +0000301 if (Tok->Previous->CodePointCount >
302 Contexts.back().LongestObjCSelectorName) {
303 Contexts.back().LongestObjCSelectorName =
304 Tok->Previous->CodePointCount;
305 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000306 if (Contexts.back().FirstObjCSelectorName == NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000307 Contexts.back().FirstObjCSelectorName = Tok->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +0000308 } else if (Contexts.back().ColonIsForRangeExpr) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000309 Tok->Type = TT_RangeBasedForLoopColon;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000310 } else if (Contexts.size() == 1) {
311 Tok->Type = TT_InheritanceColon;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000312 } else if (Contexts.back().ContextKind == tok::l_paren) {
313 Tok->Type = TT_InlineASMColon;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000314 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000315 break;
316 case tok::kw_if:
317 case tok::kw_while:
318 if (CurrentToken != NULL && CurrentToken->is(tok::l_paren)) {
319 next();
Nico Weber27268772013-06-26 00:30:14 +0000320 if (!parseParens(/*LookForDecls=*/true))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000321 return false;
322 }
323 break;
324 case tok::kw_for:
Daniel Jasper4e778092013-02-06 10:05:46 +0000325 Contexts.back().ColonIsForRangeExpr = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000326 next();
327 if (!parseParens())
328 return false;
329 break;
330 case tok::l_paren:
331 if (!parseParens())
332 return false;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000333 if (Line.MustBeDeclaration && NameFound && !Contexts.back().IsExpression)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000334 Line.MightBeFunctionDecl = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000335 break;
336 case tok::l_square:
337 if (!parseSquare())
338 return false;
339 break;
340 case tok::l_brace:
341 if (!parseBrace())
342 return false;
343 break;
344 case tok::less:
345 if (parseAngle())
346 Tok->Type = TT_TemplateOpener;
347 else {
348 Tok->Type = TT_BinaryOperator;
349 CurrentToken = Tok;
350 next();
351 }
352 break;
353 case tok::r_paren:
354 case tok::r_square:
355 return false;
356 case tok::r_brace:
357 // Lines can start with '}'.
Manuel Klimekb3987012013-05-29 14:47:47 +0000358 if (Tok->Previous != NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000359 return false;
360 break;
361 case tok::greater:
362 Tok->Type = TT_BinaryOperator;
363 break;
364 case tok::kw_operator:
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000365 while (CurrentToken && CurrentToken->isNot(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000366 if (CurrentToken->isOneOf(tok::star, tok::amp))
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000367 CurrentToken->Type = TT_PointerOrReference;
368 consumeToken();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000369 }
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000370 if (CurrentToken) {
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000371 CurrentToken->Type = TT_OverloadedOperatorLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000372 if (CurrentToken->Previous->Type == TT_BinaryOperator)
373 CurrentToken->Previous->Type = TT_OverloadedOperator;
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000374 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000375 break;
376 case tok::question:
377 parseConditional();
378 break;
379 case tok::kw_template:
380 parseTemplateDeclaration();
381 break;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000382 case tok::identifier:
Manuel Klimekb3987012013-05-29 14:47:47 +0000383 if (Line.First->is(tok::kw_for) &&
384 Tok->Tok.getIdentifierInfo() == &Ident_in)
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000385 Tok->Type = TT_ObjCForIn;
386 break;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000387 case tok::comma:
388 if (Contexts.back().FirstStartOfName)
389 Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
390 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000391 default:
392 break;
393 }
394 return true;
395 }
396
397 void parseIncludeDirective() {
398 next();
399 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
400 next();
401 while (CurrentToken != NULL) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000402 if (CurrentToken->isNot(tok::comment) || CurrentToken->Next)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000403 CurrentToken->Type = TT_ImplicitStringLiteral;
404 next();
405 }
406 } else {
407 while (CurrentToken != NULL) {
Daniel Jasper3a204412013-02-23 07:46:38 +0000408 if (CurrentToken->is(tok::string_literal))
409 // Mark these string literals as "implicit" literals, too, so that
410 // they are not split or line-wrapped.
411 CurrentToken->Type = TT_ImplicitStringLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000412 next();
413 }
414 }
415 }
416
417 void parseWarningOrError() {
418 next();
419 // We still want to format the whitespace left of the first token of the
420 // warning or error.
421 next();
422 while (CurrentToken != NULL) {
423 CurrentToken->Type = TT_ImplicitStringLiteral;
424 next();
425 }
426 }
427
428 void parsePreprocessorDirective() {
429 next();
430 if (CurrentToken == NULL)
431 return;
432 // Hashes in the middle of a line can lead to any strange token
433 // sequence.
Manuel Klimekb3987012013-05-29 14:47:47 +0000434 if (CurrentToken->Tok.getIdentifierInfo() == NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000435 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000436 switch (CurrentToken->Tok.getIdentifierInfo()->getPPKeywordID()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000437 case tok::pp_include:
438 case tok::pp_import:
439 parseIncludeDirective();
440 break;
441 case tok::pp_error:
442 case tok::pp_warning:
443 parseWarningOrError();
444 break;
Daniel Jasperaae7bad2013-04-23 13:54:04 +0000445 case tok::pp_if:
446 case tok::pp_elif:
447 parseLine();
448 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000449 default:
450 break;
451 }
Daniel Jasper5b7e7b02013-02-05 09:34:14 +0000452 while (CurrentToken != NULL)
453 next();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000454 }
455
Nico Weber95e8e462013-02-12 16:17:07 +0000456public:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000457 LineType parseLine() {
458 int PeriodsAndArrows = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000459 FormatToken *LastPeriodOrArrow = NULL;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000460 bool CanBeBuilderTypeStmt = true;
461 if (CurrentToken->is(tok::hash)) {
462 parsePreprocessorDirective();
463 return LT_PreprocessorDirective;
464 }
465 while (CurrentToken != NULL) {
466 if (CurrentToken->is(tok::kw_virtual))
467 KeywordVirtualFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000468 if (CurrentToken->isOneOf(tok::period, tok::arrow)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000469 ++PeriodsAndArrows;
Daniel Jasper24849712013-03-01 16:48:32 +0000470 LastPeriodOrArrow = CurrentToken;
471 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000472 FormatToken *TheToken = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000473 if (!consumeToken())
474 return LT_Invalid;
Manuel Klimekb3987012013-05-29 14:47:47 +0000475 if (TheToken->getPrecedence() > prec::Assignment &&
Daniel Jasper82282dc2013-02-18 13:52:06 +0000476 TheToken->Type == TT_BinaryOperator)
Daniel Jasper4a544e52013-02-15 20:33:06 +0000477 CanBeBuilderTypeStmt = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000478 }
479 if (KeywordVirtualFound)
480 return LT_VirtualFunctionDecl;
481
482 // Assume a builder-type call if there are 2 or more "." and "->".
Daniel Jasper24849712013-03-01 16:48:32 +0000483 if (PeriodsAndArrows >= 2 && CanBeBuilderTypeStmt) {
484 LastPeriodOrArrow->LastInChainOfCalls = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000485 return LT_BuilderTypeCall;
Daniel Jasper24849712013-03-01 16:48:32 +0000486 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000487
Manuel Klimekb3987012013-05-29 14:47:47 +0000488 if (Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000489 if (Contexts.back().FirstObjCSelectorName != NULL)
490 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
491 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000492 return LT_ObjCMethodDecl;
493 }
494
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000495 return LT_Other;
496 }
497
Nico Weber95e8e462013-02-12 16:17:07 +0000498private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000499 void next() {
Daniel Jasper01786732013-02-04 07:21:18 +0000500 if (CurrentToken != NULL) {
501 determineTokenType(*CurrentToken);
Daniel Jasper4e778092013-02-06 10:05:46 +0000502 CurrentToken->BindingStrength = Contexts.back().BindingStrength;
Daniel Jasper01786732013-02-04 07:21:18 +0000503 }
504
Manuel Klimekb3987012013-05-29 14:47:47 +0000505 if (CurrentToken != NULL)
506 CurrentToken = CurrentToken->Next;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000507
508 // Reset token type in case we have already looked at it and then recovered
509 // from an error (e.g. failure to find the matching >).
510 if (CurrentToken != NULL)
511 CurrentToken->Type = TT_Unknown;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000512 }
513
Daniel Jasper4e778092013-02-06 10:05:46 +0000514 /// \brief A struct to hold information valid in a specific context, e.g.
515 /// a pair of parenthesis.
516 struct Context {
Daniel Jasper923ebef2013-03-14 13:45:21 +0000517 Context(tok::TokenKind ContextKind, unsigned BindingStrength,
518 bool IsExpression)
519 : ContextKind(ContextKind), BindingStrength(BindingStrength),
520 LongestObjCSelectorName(0), ColonIsForRangeExpr(false),
Nico Weberf2ff8122013-05-26 05:39:26 +0000521 ColonIsObjCDictLiteral(false), ColonIsObjCMethodExpr(false),
522 FirstObjCSelectorName(NULL), FirstStartOfName(NULL),
523 IsExpression(IsExpression), CanBeExpression(true) {}
Daniel Jasper01786732013-02-04 07:21:18 +0000524
Daniel Jasper923ebef2013-03-14 13:45:21 +0000525 tok::TokenKind ContextKind;
Daniel Jasper4e778092013-02-06 10:05:46 +0000526 unsigned BindingStrength;
527 unsigned LongestObjCSelectorName;
528 bool ColonIsForRangeExpr;
Nico Weberf2ff8122013-05-26 05:39:26 +0000529 bool ColonIsObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000530 bool ColonIsObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000531 FormatToken *FirstObjCSelectorName;
532 FormatToken *FirstStartOfName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000533 bool IsExpression;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000534 bool CanBeExpression;
Daniel Jasper4e778092013-02-06 10:05:46 +0000535 };
536
537 /// \brief Puts a new \c Context onto the stack \c Contexts for the lifetime
538 /// of each instance.
539 struct ScopedContextCreator {
540 AnnotatingParser &P;
541
Daniel Jasper923ebef2013-03-14 13:45:21 +0000542 ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
543 unsigned Increase)
544 : P(P) {
545 P.Contexts.push_back(
546 Context(ContextKind, P.Contexts.back().BindingStrength + Increase,
547 P.Contexts.back().IsExpression));
Daniel Jasper4e778092013-02-06 10:05:46 +0000548 }
549
550 ~ScopedContextCreator() { P.Contexts.pop_back(); }
551 };
Daniel Jasper01786732013-02-04 07:21:18 +0000552
Manuel Klimekb3987012013-05-29 14:47:47 +0000553 void determineTokenType(FormatToken &Current) {
554 if (Current.getPrecedence() == prec::Assignment &&
555 (!Current.Previous || Current.Previous->isNot(tok::kw_operator))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000556 Contexts.back().IsExpression = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000557 for (FormatToken *Previous = Current.Previous;
Nico Weber95e8e462013-02-12 16:17:07 +0000558 Previous && Previous->isNot(tok::comma);
Manuel Klimekb3987012013-05-29 14:47:47 +0000559 Previous = Previous->Previous) {
Daniel Jasper9c65b062013-02-27 11:43:50 +0000560 if (Previous->is(tok::r_square))
561 Previous = Previous->MatchingParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000562 if (Previous->Type == TT_BinaryOperator &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000563 Previous->isOneOf(tok::star, tok::amp)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000564 Previous->Type = TT_PointerOrReference;
565 }
Daniel Jasper01786732013-02-04 07:21:18 +0000566 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000567 } else if (Current.isOneOf(tok::kw_return, tok::kw_throw) ||
Nico Weber95e8e462013-02-12 16:17:07 +0000568 (Current.is(tok::l_paren) && !Line.MustBeDeclaration &&
Daniel Jasper378d93d2013-05-13 07:14:40 +0000569 !Line.InPPDirective &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000570 (!Current.Previous || Current.Previous->isNot(tok::kw_for)))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000571 Contexts.back().IsExpression = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000572 } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000573 for (FormatToken *Previous = Current.Previous;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000574 Previous && Previous->isOneOf(tok::star, tok::amp);
Manuel Klimekb3987012013-05-29 14:47:47 +0000575 Previous = Previous->Previous)
Nico Weber95e8e462013-02-12 16:17:07 +0000576 Previous->Type = TT_PointerOrReference;
Manuel Klimekb3987012013-05-29 14:47:47 +0000577 } else if (Current.Previous &&
578 Current.Previous->Type == TT_CtorInitializerColon) {
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000579 Contexts.back().IsExpression = true;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000580 } else if (Current.is(tok::kw_new)) {
581 Contexts.back().CanBeExpression = false;
Daniel Jasper16a69ef2013-05-03 14:41:24 +0000582 } else if (Current.is(tok::semi)) {
583 // This should be the condition or increment in a for-loop.
584 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000585 }
Daniel Jasper01786732013-02-04 07:21:18 +0000586
587 if (Current.Type == TT_Unknown) {
Daniel Jasper6ac431c2013-07-02 09:47:29 +0000588 if (isStartOfName(Current)) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000589 Contexts.back().FirstStartOfName = &Current;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000590 Current.Type = TT_StartOfName;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000591 NameFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000592 } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000593 Current.Type =
594 determineStarAmpUsage(Current, Contexts.back().IsExpression);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000595 } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000596 Current.Type = determinePlusMinusCaretUsage(Current);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000597 } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000598 Current.Type = determineIncrementUsage(Current);
599 } else if (Current.is(tok::exclaim)) {
600 Current.Type = TT_UnaryOperator;
Daniel Jasperac3223e2013-04-10 09:49:49 +0000601 } else if (Current.isBinaryOperator()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000602 Current.Type = TT_BinaryOperator;
603 } else if (Current.is(tok::comment)) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000604 if (Current.TokenText.startswith("//"))
Daniel Jasper01786732013-02-04 07:21:18 +0000605 Current.Type = TT_LineComment;
606 else
607 Current.Type = TT_BlockComment;
Nico Weber37d69312013-02-13 04:13:13 +0000608 } else if (Current.is(tok::r_paren)) {
Daniel Jasperb8b42952013-05-31 16:14:28 +0000609 FormatToken *LeftOfParens = NULL;
610 if (Current.MatchingParen)
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000611 LeftOfParens = Current.MatchingParen->getPreviousNonComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000612 bool IsCast = false;
613 bool ParensAreEmpty = Current.Previous == Current.MatchingParen;
614 bool ParensAreType = !Current.Previous ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000615 Current.Previous->Type == TT_PointerOrReference ||
Daniel Jasperb8b42952013-05-31 16:14:28 +0000616 Current.Previous->Type == TT_TemplateCloser ||
617 isSimpleTypeSpecifier(*Current.Previous);
Nico Weber37d69312013-02-13 04:13:13 +0000618 bool ParensCouldEndDecl =
Manuel Klimekb3987012013-05-29 14:47:47 +0000619 Current.Next &&
620 Current.Next->isOneOf(tok::equal, tok::semi, tok::l_brace);
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000621 bool IsSizeOfOrAlignOf =
Daniel Jasperb8b42952013-05-31 16:14:28 +0000622 LeftOfParens &&
623 LeftOfParens->isOneOf(tok::kw_sizeof, tok::kw_alignof);
624 if (ParensAreType && !ParensCouldEndDecl && !IsSizeOfOrAlignOf &&
Daniel Jasper37eff832013-02-23 08:07:18 +0000625 Contexts.back().IsExpression)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000626 IsCast = true;
627 if (Current.Next &&
Daniel Jasperff1a2e52013-06-06 08:20:20 +0000628 Current.Next->isNot(tok::string_literal) &&
Daniel Jasperb8b42952013-05-31 16:14:28 +0000629 (Current.Next->Tok.isLiteral() ||
630 Current.Next->isOneOf(tok::kw_sizeof, tok::kw_alignof)))
631 IsCast = true;
632 // If there is an identifier after the (), it is likely a cast, unless
633 // there is also an identifier before the ().
Daniel Jasperff1a2e52013-06-06 08:20:20 +0000634 if (LeftOfParens && (LeftOfParens->Tok.getIdentifierInfo() == NULL ||
635 LeftOfParens->is(tok::kw_return)) &&
Nico Weber465e8612013-06-25 00:55:57 +0000636 LeftOfParens->Type != TT_TemplateCloser && Current.Next &&
637 Current.Next->is(tok::identifier))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000638 IsCast = true;
639 if (IsCast && !ParensAreEmpty)
Nico Weber37d69312013-02-13 04:13:13 +0000640 Current.Type = TT_CastRParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000641 } else if (Current.is(tok::at) && Current.Next) {
642 switch (Current.Next->Tok.getObjCKeywordID()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000643 case tok::objc_interface:
644 case tok::objc_implementation:
645 case tok::objc_protocol:
646 Current.Type = TT_ObjCDecl;
647 break;
648 case tok::objc_property:
649 Current.Type = TT_ObjCProperty;
650 break;
651 default:
652 break;
653 }
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000654 } else if (Current.is(tok::period)) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000655 FormatToken *PreviousNoComment = Current.getPreviousNonComment();
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000656 if (PreviousNoComment &&
657 PreviousNoComment->isOneOf(tok::comma, tok::l_brace))
658 Current.Type = TT_DesignatedInitializerPeriod;
Daniel Jasper01786732013-02-04 07:21:18 +0000659 }
660 }
661 }
662
Daniel Jasper6ac431c2013-07-02 09:47:29 +0000663 /// \brief Take a guess at whether \p Tok starts a name of a function or
664 /// variable declaration.
665 ///
666 /// This is a heuristic based on whether \p Tok is an identifier following
667 /// something that is likely a type.
668 bool isStartOfName(const FormatToken &Tok) {
669 if (Tok.isNot(tok::identifier) || Tok.Previous == NULL)
670 return false;
671
672 // Skip "const" as it does not have an influence on whether this is a name.
673 FormatToken *PreviousNotConst = Tok.Previous;
674 while (PreviousNotConst != NULL && PreviousNotConst->is(tok::kw_const))
675 PreviousNotConst = PreviousNotConst->Previous;
676
677 if (PreviousNotConst == NULL)
678 return false;
679
680 bool IsPPKeyword =
681 PreviousNotConst->is(tok::identifier) && PreviousNotConst->Previous &&
682 PreviousNotConst->Previous->is(tok::hash);
683
684 return (!IsPPKeyword && PreviousNotConst->is(tok::identifier)) ||
685 PreviousNotConst->Type == TT_PointerOrReference ||
686 PreviousNotConst->Type == TT_TemplateCloser ||
687 isSimpleTypeSpecifier(*PreviousNotConst);
688 }
689
Daniel Jasper01786732013-02-04 07:21:18 +0000690 /// \brief Return the type of the given token assuming it is * or &.
Manuel Klimekb3987012013-05-29 14:47:47 +0000691 TokenType determineStarAmpUsage(const FormatToken &Tok, bool IsExpression) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000692 const FormatToken *PrevToken = Tok.getPreviousNonComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000693 if (PrevToken == NULL)
694 return TT_UnaryOperator;
695
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000696 const FormatToken *NextToken = Tok.getNextNonComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000697 if (NextToken == NULL)
698 return TT_Unknown;
699
Daniel Jasper431f5912013-05-28 08:33:00 +0000700 if (PrevToken->is(tok::coloncolon) ||
701 (PrevToken->is(tok::l_paren) && !IsExpression))
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +0000702 return TT_PointerOrReference;
703
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000704 if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
Daniel Jasperd3cf17b2013-03-14 10:50:25 +0000705 tok::comma, tok::semi, tok::kw_return, tok::colon,
Daniel Jasperdbef71e2013-05-07 14:17:18 +0000706 tok::equal, tok::kw_delete) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000707 PrevToken->Type == TT_BinaryOperator ||
Daniel Jasper01786732013-02-04 07:21:18 +0000708 PrevToken->Type == TT_UnaryOperator || PrevToken->Type == TT_CastRParen)
709 return TT_UnaryOperator;
710
Nico Webere8a97982013-02-06 06:20:11 +0000711 if (NextToken->is(tok::l_square))
712 return TT_PointerOrReference;
713
Manuel Klimekb3987012013-05-29 14:47:47 +0000714 if (PrevToken->Tok.isLiteral() ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000715 PrevToken->isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000716 NextToken->Tok.isLiteral() || NextToken->isUnaryOperator())
Daniel Jasper01786732013-02-04 07:21:18 +0000717 return TT_BinaryOperator;
718
Daniel Jasper01786732013-02-04 07:21:18 +0000719 // It is very unlikely that we are going to find a pointer or reference type
720 // definition on the RHS of an assignment.
721 if (IsExpression)
722 return TT_BinaryOperator;
723
724 return TT_PointerOrReference;
725 }
726
Manuel Klimekb3987012013-05-29 14:47:47 +0000727 TokenType determinePlusMinusCaretUsage(const FormatToken &Tok) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000728 const FormatToken *PrevToken = Tok.getPreviousNonComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000729 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000730 return TT_UnaryOperator;
731
732 // Use heuristics to recognize unary operators.
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000733 if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
734 tok::question, tok::colon, tok::kw_return,
735 tok::kw_case, tok::at, tok::l_brace))
Daniel Jasper01786732013-02-04 07:21:18 +0000736 return TT_UnaryOperator;
737
Nico Weberee0feec2013-02-05 16:21:00 +0000738 // There can't be two consecutive binary operators.
Daniel Jasper01786732013-02-04 07:21:18 +0000739 if (PrevToken->Type == TT_BinaryOperator)
740 return TT_UnaryOperator;
741
742 // Fall back to marking the token as binary operator.
743 return TT_BinaryOperator;
744 }
745
746 /// \brief Determine whether ++/-- are pre- or post-increments/-decrements.
Manuel Klimekb3987012013-05-29 14:47:47 +0000747 TokenType determineIncrementUsage(const FormatToken &Tok) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000748 const FormatToken *PrevToken = Tok.getPreviousNonComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000749 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000750 return TT_UnaryOperator;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000751 if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
Daniel Jasper01786732013-02-04 07:21:18 +0000752 return TT_TrailingUnaryOperator;
753
754 return TT_UnaryOperator;
755 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000756
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000757 // FIXME: This is copy&pasted from Sema. Put it in a common place and remove
758 // duplication.
759 /// \brief Determine whether the token kind starts a simple-type-specifier.
Manuel Klimekb3987012013-05-29 14:47:47 +0000760 bool isSimpleTypeSpecifier(const FormatToken &Tok) const {
761 switch (Tok.Tok.getKind()) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000762 case tok::kw_short:
763 case tok::kw_long:
764 case tok::kw___int64:
765 case tok::kw___int128:
766 case tok::kw_signed:
767 case tok::kw_unsigned:
768 case tok::kw_void:
769 case tok::kw_char:
770 case tok::kw_int:
771 case tok::kw_half:
772 case tok::kw_float:
773 case tok::kw_double:
774 case tok::kw_wchar_t:
775 case tok::kw_bool:
776 case tok::kw___underlying_type:
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000777 case tok::annot_typename:
778 case tok::kw_char16_t:
779 case tok::kw_char32_t:
780 case tok::kw_typeof:
781 case tok::kw_decltype:
Alexander Kornienko00895102013-06-05 14:09:10 +0000782 return true;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000783 default:
Alexander Kornienko00895102013-06-05 14:09:10 +0000784 return false;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000785 }
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000786 }
787
Daniel Jasper4e778092013-02-06 10:05:46 +0000788 SmallVector<Context, 8> Contexts;
789
Daniel Jasper4e778092013-02-06 10:05:46 +0000790 AnnotatedLine &Line;
Manuel Klimekb3987012013-05-29 14:47:47 +0000791 FormatToken *CurrentToken;
Daniel Jasper4e778092013-02-06 10:05:46 +0000792 bool KeywordVirtualFound;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000793 bool NameFound;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000794 IdentifierInfo &Ident_in;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000795};
796
Daniel Jasper29f123b2013-02-08 15:28:42 +0000797/// \brief Parses binary expressions by inserting fake parenthesis based on
798/// operator precedence.
799class ExpressionParser {
800public:
Daniel Jasper9acb8b42013-06-06 09:11:58 +0000801 ExpressionParser(AnnotatedLine &Line) : Current(Line.First) {
802 // Skip leading "}", e.g. in "} else if (...) {".
803 if (Current->is(tok::r_brace))
804 next();
805 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000806
807 /// \brief Parse expressions with the given operatore precedence.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000808 void parse(int Precedence = 0) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000809 // Conditional expressions need to be parsed separately for proper nesting.
810 if (Precedence == prec::Conditional + 1) {
811 parseConditionalExpr();
812 return;
813 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000814 if (Precedence > prec::PointerToMember || Current == NULL)
815 return;
816
Manuel Klimekb3987012013-05-29 14:47:47 +0000817 FormatToken *Start = Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000818 bool OperatorFound = false;
819
Daniel Jasper237d4c12013-02-23 21:01:55 +0000820 while (Current) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000821 // Consume operators with higher precedence.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000822 parse(Precedence + 1);
Daniel Jasper29f123b2013-02-08 15:28:42 +0000823
Daniel Jasper237d4c12013-02-23 21:01:55 +0000824 int CurrentPrecedence = 0;
825 if (Current) {
826 if (Current->Type == TT_ConditionalExpr)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000827 CurrentPrecedence = 1 + (int)prec::Conditional;
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000828 else if (Current->is(tok::semi) || Current->Type == TT_InlineASMColon)
Daniel Jasper237d4c12013-02-23 21:01:55 +0000829 CurrentPrecedence = 1;
830 else if (Current->Type == TT_BinaryOperator || Current->is(tok::comma))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000831 CurrentPrecedence = 1 + (int)Current->getPrecedence();
Daniel Jasper237d4c12013-02-23 21:01:55 +0000832 }
833
Daniel Jasper29f123b2013-02-08 15:28:42 +0000834 // At the end of the line or when an operator with higher precedence is
835 // found, insert fake parenthesis and return.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000836 if (Current == NULL || Current->closesScope() ||
Daniel Jasper237d4c12013-02-23 21:01:55 +0000837 (CurrentPrecedence != 0 && CurrentPrecedence < Precedence)) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000838 if (OperatorFound)
839 addFakeParenthesis(Start, prec::Level(Precedence - 1));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000840 return;
841 }
842
843 // Consume scopes: (), [], <> and {}
Daniel Jasperac3223e2013-04-10 09:49:49 +0000844 if (Current->opensScope()) {
845 while (Current && !Current->closesScope()) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000846 next();
847 parse();
848 }
849 next();
850 } else {
851 // Operator found.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000852 if (CurrentPrecedence == Precedence)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000853 OperatorFound = true;
854
855 next();
856 }
857 }
858 }
859
860private:
Daniel Jasperc01897c2013-05-31 14:56:12 +0000861 void addFakeParenthesis(FormatToken *Start, prec::Level Precedence) {
862 Start->FakeLParens.push_back(Precedence);
863 if (Current)
864 ++Current->Previous->FakeRParens;
865 }
866
867 void parseConditionalExpr() {
868 FormatToken *Start = Current;
869 parse(prec::LogicalOr + 1);
870 if (!Current || !Current->is(tok::question))
871 return;
872 next();
873 parse(prec::LogicalOr + 1);
874 if (!Current || Current->Type != TT_ConditionalExpr)
875 return;
876 next();
877 parseConditionalExpr();
878 addFakeParenthesis(Start, prec::Conditional);
879 }
880
Daniel Jasper29f123b2013-02-08 15:28:42 +0000881 void next() {
Alexander Kornienkod71b15b2013-06-17 13:19:53 +0000882 if (Current)
883 Current = Current->Next;
884 while (Current && Current->isTrailingComment())
Manuel Klimekb3987012013-05-29 14:47:47 +0000885 Current = Current->Next;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000886 }
887
Manuel Klimekb3987012013-05-29 14:47:47 +0000888 FormatToken *Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000889};
890
Craig Topper14e66492013-07-01 04:03:19 +0000891} // end anonymous namespace
892
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000893void TokenAnnotator::annotate(AnnotatedLine &Line) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000894 AnnotatingParser Parser(Line, Ident_in);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000895 Line.Type = Parser.parseLine();
896 if (Line.Type == LT_Invalid)
897 return;
898
Daniel Jasper29f123b2013-02-08 15:28:42 +0000899 ExpressionParser ExprParser(Line);
900 ExprParser.parse();
901
Manuel Klimekb3987012013-05-29 14:47:47 +0000902 if (Line.First->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000903 Line.Type = LT_ObjCMethodDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000904 else if (Line.First->Type == TT_ObjCDecl)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000905 Line.Type = LT_ObjCDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000906 else if (Line.First->Type == TT_ObjCProperty)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000907 Line.Type = LT_ObjCProperty;
908
Manuel Klimekb3987012013-05-29 14:47:47 +0000909 Line.First->SpacesRequiredBefore = 1;
910 Line.First->CanBreakBefore = Line.First->MustBreakBefore;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000911}
912
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000913void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000914 Line.First->TotalLength = Line.First->CodePointCount;
Manuel Klimekb3987012013-05-29 14:47:47 +0000915 if (!Line.First->Next)
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000916 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000917 FormatToken *Current = Line.First->Next;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000918 while (Current != NULL) {
Daniel Jasper729a7432013-02-11 12:36:37 +0000919 if (Current->Type == TT_LineComment)
920 Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
921 else
922 Current->SpacesRequiredBefore =
923 spaceRequiredBefore(Line, *Current) ? 1 : 0;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000924
Manuel Klimekb3987012013-05-29 14:47:47 +0000925 if (Current->MustBreakBefore) {
Alexander Kornienkoe3f11972013-06-12 19:04:12 +0000926 } else if (Current->is(tok::comment)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000927 Current->MustBreakBefore = Current->NewlinesBefore > 0;
928 } else if (Current->Previous->isTrailingComment() ||
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000929 (Current->is(tok::string_literal) &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000930 Current->Previous->is(tok::string_literal))) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000931 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000932 } else if (Current->is(tok::lessless) && Current->Next &&
933 Current->Previous->is(tok::string_literal) &&
934 Current->Next->is(tok::string_literal)) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000935 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000936 } else if (Current->Previous->ClosesTemplateDeclaration &&
Daniel Jasperbbc87762013-05-29 12:07:31 +0000937 Style.AlwaysBreakTemplateDeclarations) {
938 Current->MustBreakBefore = true;
Alexander Kornienko56312022013-07-04 12:02:44 +0000939 } else if (Style.AlwaysBreakBeforeMultilineStrings &&
940 Current->is(tok::string_literal) &&
941 Current->Previous->isNot(tok::lessless) &&
942 Current->Previous->Type != TT_InlineASMColon &&
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000943 Current->getNextNonComment() &&
944 Current->getNextNonComment()->is(tok::string_literal)) {
Alexander Kornienko56312022013-07-04 12:02:44 +0000945 Current->MustBreakBefore = true;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000946 } else {
947 Current->MustBreakBefore = false;
948 }
949 Current->CanBreakBefore =
950 Current->MustBreakBefore || canBreakBefore(Line, *Current);
951 if (Current->MustBreakBefore)
Manuel Klimekb3987012013-05-29 14:47:47 +0000952 Current->TotalLength = Current->Previous->TotalLength + Style.ColumnLimit;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000953 else
954 Current->TotalLength =
Alexander Kornienko00895102013-06-05 14:09:10 +0000955 Current->Previous->TotalLength + Current->CodePointCount +
Daniel Jasper729a7432013-02-11 12:36:37 +0000956 Current->SpacesRequiredBefore;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000957 // FIXME: Only calculate this if CanBreakBefore is true once static
958 // initializers etc. are sorted out.
959 // FIXME: Move magic numbers to a better place.
960 Current->SplitPenalty =
961 20 * Current->BindingStrength + splitPenalty(Line, *Current);
962
Manuel Klimekb3987012013-05-29 14:47:47 +0000963 Current = Current->Next;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000964 }
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000965
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000966 calculateUnbreakableTailLengths(Line);
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000967 DEBUG({
968 printDebugInfo(Line);
969 });
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000970}
971
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000972void TokenAnnotator::calculateUnbreakableTailLengths(AnnotatedLine &Line) {
973 unsigned UnbreakableTailLength = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000974 FormatToken *Current = Line.Last;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000975 while (Current != NULL) {
976 Current->UnbreakableTailLength = UnbreakableTailLength;
977 if (Current->CanBreakBefore ||
978 Current->isOneOf(tok::comment, tok::string_literal)) {
979 UnbreakableTailLength = 0;
980 } else {
981 UnbreakableTailLength +=
Alexander Kornienko00895102013-06-05 14:09:10 +0000982 Current->CodePointCount + Current->SpacesRequiredBefore;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000983 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000984 Current = Current->Previous;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000985 }
986}
987
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000988unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +0000989 const FormatToken &Tok) {
990 const FormatToken &Left = *Tok.Previous;
991 const FormatToken &Right = Tok;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000992
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000993 if (Left.is(tok::semi))
994 return 0;
995 if (Left.is(tok::comma))
996 return 1;
997
Daniel Jasper3c08a812013-02-24 18:54:32 +0000998 if (Right.Type == TT_StartOfName) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000999 if (Line.First->is(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
Daniel Jasper3c08a812013-02-24 18:54:32 +00001000 return 3;
1001 else if (Line.MightBeFunctionDecl && Right.BindingStrength == 1)
1002 // FIXME: Clean up hack of using BindingStrength to find top-level names.
1003 return Style.PenaltyReturnTypeOnItsOwnLine;
1004 else
Daniel Jasper1407bee2013-04-11 14:29:13 +00001005 return 200;
Daniel Jasper3c08a812013-02-24 18:54:32 +00001006 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001007 if (Left.is(tok::equal) && Right.is(tok::l_brace))
1008 return 150;
1009 if (Left.is(tok::coloncolon))
1010 return 500;
Daniel Jasper6b119d62013-04-05 17:22:09 +00001011 if (Left.isOneOf(tok::kw_class, tok::kw_struct))
1012 return 5000;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001013
Daniel Jasper6cabab42013-02-14 08:42:54 +00001014 if (Left.Type == TT_RangeBasedForLoopColon ||
1015 Left.Type == TT_InheritanceColon)
Daniel Jasper84a1a632013-02-26 13:18:08 +00001016 return 2;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001017
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001018 if (Right.isOneOf(tok::arrow, tok::period) &&
1019 Right.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper515f65d2013-02-18 13:24:21 +00001020 if (Line.Type == LT_BuilderTypeCall)
Daniel Jasper6a365aa2013-03-13 17:13:53 +00001021 return prec::PointerToMember;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001022 if (Left.isOneOf(tok::r_paren, tok::r_square) && Left.MatchingParen &&
1023 Left.MatchingParen->ParameterCount > 0)
Daniel Jasper518ee342013-02-26 13:59:14 +00001024 return 20; // Should be smaller than breaking at a nested comma.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001025 return 150;
1026 }
1027
Daniel Jasper5ad72bb2013-05-22 08:28:26 +00001028 // Breaking before a trailing 'const' is bad.
1029 if (Left.is(tok::r_paren) && Right.is(tok::kw_const))
1030 return 150;
1031
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001032 // In for-loops, prefer breaking at ',' and ';'.
Manuel Klimekb3987012013-05-29 14:47:47 +00001033 if (Line.First->is(tok::kw_for) && Left.is(tok::equal))
Daniel Jasper7d812812013-02-21 15:00:29 +00001034 return 4;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001035
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001036 // In Objective-C method expressions, prefer breaking before "param:" over
1037 // breaking after it.
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001038 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001039 return 0;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001040 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001041 return 20;
1042
Daniel Jasper1407bee2013-04-11 14:29:13 +00001043 if (Left.is(tok::l_paren) && Line.MightBeFunctionDecl)
1044 return 100;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001045 if (Left.opensScope())
Daniel Jasper64f09282013-03-20 13:53:11 +00001046 return Left.ParameterCount > 1 ? prec::Comma : 20;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001047
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001048 if (Right.is(tok::lessless)) {
1049 if (Left.is(tok::string_literal)) {
Alexander Kornienko00895102013-06-05 14:09:10 +00001050 StringRef Content = Left.TokenText;
Daniel Jasperbfa1edd2013-03-14 14:00:17 +00001051 Content = Content.drop_back(1).drop_front(1).trim();
1052 if (Content.size() > 1 &&
1053 (Content.back() == ':' || Content.back() == '='))
Daniel Jasper6e6efa72013-05-22 09:13:26 +00001054 return 20;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001055 }
Daniel Jasper01786732013-02-04 07:21:18 +00001056 return prec::Shift;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001057 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001058 if (Left.Type == TT_ConditionalExpr)
Daniel Jasper518ee342013-02-26 13:59:14 +00001059 return prec::Conditional;
Manuel Klimekb3987012013-05-29 14:47:47 +00001060 prec::Level Level = Left.getPrecedence();
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001061
1062 if (Level != prec::Unknown)
1063 return Level;
Daniel Jasper24849712013-03-01 16:48:32 +00001064
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001065 return 3;
1066}
1067
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001068bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001069 const FormatToken &Left,
1070 const FormatToken &Right) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001071 if (Right.is(tok::hashhash))
1072 return Left.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001073 if (Left.isOneOf(tok::hashhash, tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001074 return Right.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001075 if (Right.isOneOf(tok::r_paren, tok::semi, tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001076 return false;
1077 if (Right.is(tok::less) &&
1078 (Left.is(tok::kw_template) ||
1079 (Line.Type == LT_ObjCDecl && Style.ObjCSpaceBeforeProtocolList)))
1080 return true;
1081 if (Left.is(tok::arrow) || Right.is(tok::arrow))
1082 return false;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001083 if (Left.isOneOf(tok::exclaim, tok::tilde))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001084 return false;
1085 if (Left.is(tok::at) &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001086 Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
1087 tok::numeric_constant, tok::l_paren, tok::l_brace,
1088 tok::kw_true, tok::kw_false))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001089 return false;
1090 if (Left.is(tok::coloncolon))
1091 return false;
1092 if (Right.is(tok::coloncolon))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001093 return !Left.isOneOf(tok::identifier, tok::greater, tok::l_paren);
1094 if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001095 return false;
Daniel Jasperc47d7f12013-07-01 09:47:25 +00001096 if (Right.is(tok::ellipsis))
1097 return false;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001098 if (Right.Type == TT_PointerOrReference)
Manuel Klimekb3987012013-05-29 14:47:47 +00001099 return Left.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001100 ((Left.Type != TT_PointerOrReference) && Left.isNot(tok::l_paren) &&
1101 !Style.PointerBindsToType);
Daniel Jasper3ff4a2f2013-05-28 15:27:10 +00001102 if (Right.Type == TT_FunctionTypeLParen && Left.isNot(tok::l_paren) &&
Daniel Jasper395228f2013-05-08 14:58:20 +00001103 (Left.Type != TT_PointerOrReference || Style.PointerBindsToType))
1104 return true;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001105 if (Left.Type == TT_PointerOrReference)
Daniel Jasper3a1847e2013-07-01 09:34:09 +00001106 return Right.Tok.isLiteral() || Right.Type == TT_BlockComment ||
Daniel Jasper9322aae2013-03-20 09:53:18 +00001107 ((Right.Type != TT_PointerOrReference) &&
Daniel Jasper81d2d382013-04-01 17:13:26 +00001108 Right.isNot(tok::l_paren) && Style.PointerBindsToType &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001109 Left.Previous &&
1110 !Left.Previous->isOneOf(tok::l_paren, tok::coloncolon));
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001111 if (Right.is(tok::star) && Left.is(tok::l_paren))
1112 return false;
Nico Weber051860e2013-02-10 02:08:05 +00001113 if (Left.is(tok::l_square))
1114 return Left.Type == TT_ObjCArrayLiteral && Right.isNot(tok::r_square);
1115 if (Right.is(tok::r_square))
1116 return Right.Type == TT_ObjCArrayLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001117 if (Right.is(tok::l_square) && Right.Type != TT_ObjCMethodExpr)
1118 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001119 if (Left.is(tok::colon))
1120 return Left.Type != TT_ObjCMethodExpr;
1121 if (Right.is(tok::colon))
1122 return Right.Type != TT_ObjCMethodExpr;
1123 if (Left.is(tok::l_paren))
1124 return false;
1125 if (Right.is(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001126 return Line.Type == LT_ObjCDecl ||
1127 Left.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
1128 tok::kw_return, tok::kw_catch, tok::kw_new,
Daniel Jasper454cb702013-05-03 14:50:50 +00001129 tok::kw_delete, tok::semi);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001130 }
Manuel Klimekb3987012013-05-29 14:47:47 +00001131 if (Left.is(tok::at) && Right.Tok.getObjCKeywordID() != tok::objc_not_keyword)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001132 return false;
1133 if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
Daniel Jasper2424eef2013-05-23 10:15:45 +00001134 return false; // No spaces in "{}".
1135 if (Left.is(tok::l_brace) || Right.is(tok::r_brace))
1136 return Style.SpacesInBracedLists;
Daniel Jasper1bee0732013-05-23 18:05:18 +00001137 if (Right.Type == TT_UnaryOperator)
1138 return !Left.isOneOf(tok::l_paren, tok::l_square, tok::at) &&
1139 (Left.isNot(tok::colon) || Left.Type != TT_ObjCMethodExpr);
Daniel Jasperce933562013-05-23 21:35:49 +00001140 if (Left.isOneOf(tok::identifier, tok::greater, tok::r_square) &&
Alexander Kornienko0bdc6432013-07-04 14:47:51 +00001141 Right.is(tok::l_brace) && Right.getNextNonComment())
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001142 return false;
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001143 if (Left.is(tok::period) || Right.is(tok::period))
1144 return false;
Nico Weber861576b2013-06-26 00:15:19 +00001145 if (Left.Type == TT_BlockComment && Left.TokenText.endswith("=*/"))
1146 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001147 return true;
1148}
1149
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001150bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001151 const FormatToken &Tok) {
1152 if (Tok.Tok.getIdentifierInfo() && Tok.Previous->Tok.getIdentifierInfo())
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001153 return true; // Never ever merge two identifiers.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001154 if (Line.Type == LT_ObjCMethodDecl) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001155 if (Tok.Previous->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001156 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001157 if (Tok.Previous->is(tok::r_paren) && Tok.is(tok::identifier))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001158 // Don't space between ')' and <id>
1159 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001160 }
1161 if (Line.Type == LT_ObjCProperty &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001162 (Tok.is(tok::equal) || Tok.Previous->is(tok::equal)))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001163 return false;
1164
Manuel Klimekb3987012013-05-29 14:47:47 +00001165 if (Tok.Previous->is(tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001166 return true;
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001167 if (Tok.is(tok::comma))
1168 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001169 if (Tok.Type == TT_CtorInitializerColon || Tok.Type == TT_ObjCBlockLParen)
1170 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001171 if (Tok.Previous->Tok.is(tok::kw_operator))
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001172 return false;
1173 if (Tok.Type == TT_OverloadedOperatorLParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001174 return false;
1175 if (Tok.is(tok::colon))
Manuel Klimekb3987012013-05-29 14:47:47 +00001176 return !Line.First->isOneOf(tok::kw_case, tok::kw_default) &&
Alexander Kornienko0bdc6432013-07-04 14:47:51 +00001177 Tok.getNextNonComment() != NULL && Tok.Type != TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +00001178 if (Tok.Previous->Type == TT_UnaryOperator ||
1179 Tok.Previous->Type == TT_CastRParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001180 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001181 if (Tok.Previous->is(tok::greater) && Tok.is(tok::greater)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +00001182 return Tok.Type == TT_TemplateCloser &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001183 Tok.Previous->Type == TT_TemplateCloser &&
Daniel Jasper29f123b2013-02-08 15:28:42 +00001184 Style.Standard != FormatStyle::LS_Cpp11;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001185 }
Alexander Kornienko54a38bd2013-03-20 16:41:56 +00001186 if (Tok.isOneOf(tok::arrowstar, tok::periodstar) ||
Manuel Klimekb3987012013-05-29 14:47:47 +00001187 Tok.Previous->isOneOf(tok::arrowstar, tok::periodstar))
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001188 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001189 if (Tok.Type == TT_BinaryOperator || Tok.Previous->Type == TT_BinaryOperator)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001190 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001191 if (Tok.Previous->Type == TT_TemplateCloser && Tok.is(tok::l_paren))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001192 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001193 if (Tok.is(tok::less) && Line.First->is(tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001194 return true;
1195 if (Tok.Type == TT_TrailingUnaryOperator)
1196 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001197 return spaceRequiredBetween(Line, *Tok.Previous, Tok);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001198}
1199
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001200bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001201 const FormatToken &Right) {
1202 const FormatToken &Left = *Right.Previous;
Daniel Jaspera03ab102013-02-13 20:33:44 +00001203 if (Right.Type == TT_StartOfName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001204 return true;
Nico Weberf2ff8122013-05-26 05:39:26 +00001205 if (Right.is(tok::colon) &&
1206 (Right.Type == TT_ObjCDictLiteral || Right.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001207 return false;
Nico Weberf2ff8122013-05-26 05:39:26 +00001208 if (Left.is(tok::colon) &&
1209 (Left.Type == TT_ObjCDictLiteral || Left.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001210 return true;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001211 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001212 return true;
1213 if (Left.ClosesTemplateDeclaration)
1214 return true;
1215 if (Right.Type == TT_ConditionalExpr || Right.is(tok::question))
1216 return true;
Daniel Jasper6cabab42013-02-14 08:42:54 +00001217 if (Right.Type == TT_RangeBasedForLoopColon ||
Daniel Jasper27b91cc2013-04-05 17:21:59 +00001218 Right.Type == TT_OverloadedOperatorLParen)
Daniel Jasper6cabab42013-02-14 08:42:54 +00001219 return false;
Daniel Jasperc194c952013-05-06 06:45:09 +00001220 if (Left.Type == TT_RangeBasedForLoopColon)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001221 return true;
Daniel Jasper7d812812013-02-21 15:00:29 +00001222 if (Right.Type == TT_RangeBasedForLoopColon)
1223 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001224 if (Left.Type == TT_PointerOrReference || Left.Type == TT_TemplateCloser ||
1225 Left.Type == TT_UnaryOperator || Left.Type == TT_ConditionalExpr ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001226 Left.isOneOf(tok::question, tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001227 return false;
1228 if (Left.is(tok::equal) && Line.Type == LT_VirtualFunctionDecl)
1229 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001230 if (Left.is(tok::l_paren) && Right.is(tok::l_paren) && Left.Previous &&
1231 Left.Previous->is(tok::kw___attribute))
Daniel Jasper8ed41002013-02-28 14:44:25 +00001232 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001233
Daniel Jasper65d2c382013-06-06 16:08:57 +00001234 if (Right.isTrailingComment())
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001235 // We rely on MustBreakBefore being set correctly here as we should not
1236 // change the "binding" behavior of a comment.
1237 return false;
1238
Daniel Jasper5ad72bb2013-05-22 08:28:26 +00001239 // We only break before r_brace if there was a corresponding break before
1240 // the l_brace, which is tracked by BreakBeforeClosingBrace.
1241 if (Right.isOneOf(tok::r_brace, tok::r_paren, tok::greater))
1242 return false;
1243
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001244 // Allow breaking after a trailing 'const', e.g. after a method declaration,
1245 // unless it is follow by ';', '{' or '='.
Manuel Klimekb3987012013-05-29 14:47:47 +00001246 if (Left.is(tok::kw_const) && Left.Previous != NULL &&
1247 Left.Previous->is(tok::r_paren))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001248 return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001249
Daniel Jasper8ef19a22013-03-14 09:50:46 +00001250 if (Right.is(tok::kw___attribute))
1251 return true;
1252
Daniel Jasper3a204412013-02-23 07:46:38 +00001253 if (Left.is(tok::identifier) && Right.is(tok::string_literal))
1254 return true;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001255 return (Left.isBinaryOperator() && Left.isNot(tok::lessless)) ||
Daniel Jasper6b119d62013-04-05 17:22:09 +00001256 Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace,
1257 tok::kw_class, tok::kw_struct) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001258 Right.isOneOf(tok::lessless, tok::arrow, tok::period, tok::colon) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001259 (Left.is(tok::r_paren) && Left.Type != TT_CastRParen &&
Daniel Jaspere033e872013-05-21 09:16:31 +00001260 Right.isOneOf(tok::identifier, tok::kw_const, tok::kw___attribute)) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001261 (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
1262 (Left.is(tok::l_square) && !Right.is(tok::r_square));
1263}
1264
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001265void TokenAnnotator::printDebugInfo(const AnnotatedLine &Line) {
1266 llvm::errs() << "AnnotatedTokens:\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001267 const FormatToken *Tok = Line.First;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001268 while (Tok) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001269 llvm::errs() << " M=" << Tok->MustBreakBefore
1270 << " C=" << Tok->CanBreakBefore << " T=" << Tok->Type << " S="
1271 << Tok->SpacesRequiredBefore << " P=" << Tok->SplitPenalty
1272 << " Name=" << Tok->Tok.getName() << " FakeLParens=";
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001273 for (unsigned i = 0, e = Tok->FakeLParens.size(); i != e; ++i)
1274 llvm::errs() << Tok->FakeLParens[i] << "/";
1275 llvm::errs() << " FakeRParens=" << Tok->FakeRParens << "\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001276 Tok = Tok->Next;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001277 }
1278 llvm::errs() << "----\n";
1279}
1280
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001281} // namespace format
1282} // namespace clang