blob: fc53681394e68f8daf58dc755c5e560f93e48847 [file] [log] [blame]
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements a token annotator, i.e. creates
12/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
13///
14//===----------------------------------------------------------------------===//
15
16#include "TokenAnnotator.h"
17#include "clang/Basic/SourceManager.h"
Daniel Jasperbf71ba22013-04-08 20:33:42 +000018#include "llvm/Support/Debug.h"
Daniel Jasper32d28ee2013-01-29 21:01:14 +000019
20namespace clang {
21namespace format {
22
/// \brief A parser that gathers additional information about tokens.
///
/// The \c TokenAnnotator tries to match parentheses and square brackets and
/// to store the parenthesis levels. It also tries to resolve matching "<" and
/// ">" into template parameter lists.
28class AnnotatingParser {
29public:
Alexander Kornienko00895102013-06-05 14:09:10 +000030 AnnotatingParser(AnnotatedLine &Line, IdentifierInfo &Ident_in)
31 : Line(Line), CurrentToken(Line.First), KeywordVirtualFound(false),
32 NameFound(false), Ident_in(Ident_in) {
Daniel Jasper923ebef2013-03-14 13:45:21 +000033 Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/ false));
Daniel Jasper32d28ee2013-01-29 21:01:14 +000034 }
35
Nico Weber95e8e462013-02-12 16:17:07 +000036private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +000037 bool parseAngle() {
38 if (CurrentToken == NULL)
39 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000040 ScopedContextCreator ContextCreator(*this, tok::less, 10);
Manuel Klimekb3987012013-05-29 14:47:47 +000041 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +000042 Contexts.back().IsExpression = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000043 while (CurrentToken != NULL) {
44 if (CurrentToken->is(tok::greater)) {
45 Left->MatchingParen = CurrentToken;
46 CurrentToken->MatchingParen = Left;
47 CurrentToken->Type = TT_TemplateCloser;
48 next();
49 return true;
50 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +000051 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace,
Daniel Jasper5d823e32013-05-15 13:46:48 +000052 tok::question, tok::colon))
53 return false;
Daniel Jasper0348be02013-06-01 18:56:00 +000054 // If a && or || is found and interpreted as a binary operator, this set
Daniel Jasper15f33f02013-06-03 16:16:41 +000055 // of angles is likely part of something like "a < b && c > d". If the
Daniel Jasper0348be02013-06-01 18:56:00 +000056 // angles are inside an expression, the ||/&& might also be a binary
57 // operator that was misinterpreted because we are parsing template
58 // parameters.
59 // FIXME: This is getting out of hand, write a decent parser.
Manuel Klimekb3987012013-05-29 14:47:47 +000060 if (CurrentToken->Previous->isOneOf(tok::pipepipe, tok::ampamp) &&
Daniel Jasper0348be02013-06-01 18:56:00 +000061 (CurrentToken->Previous->Type == TT_BinaryOperator ||
62 Contexts[Contexts.size() - 2].IsExpression) &&
Manuel Klimekb3987012013-05-29 14:47:47 +000063 Line.First->isNot(tok::kw_template))
Daniel Jasper32d28ee2013-01-29 21:01:14 +000064 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +000065 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +000066 if (!consumeToken())
67 return false;
68 }
69 return false;
70 }
71
72 bool parseParens(bool LookForDecls = false) {
73 if (CurrentToken == NULL)
74 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000075 ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
Daniel Jasper4e778092013-02-06 10:05:46 +000076
77 // FIXME: This is a bit of a hack. Do better.
78 Contexts.back().ColonIsForRangeExpr =
79 Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
80
Daniel Jasper32d28ee2013-01-29 21:01:14 +000081 bool StartsObjCMethodExpr = false;
Manuel Klimekb3987012013-05-29 14:47:47 +000082 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000083 if (CurrentToken->is(tok::caret)) {
84 // ^( starts a block.
85 Left->Type = TT_ObjCBlockLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +000086 } else if (FormatToken *MaybeSel = Left->Previous) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000087 // @selector( starts a selector.
Manuel Klimekb3987012013-05-29 14:47:47 +000088 if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Previous &&
89 MaybeSel->Previous->is(tok::at)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000090 StartsObjCMethodExpr = true;
91 }
92 }
93
Daniel Jasper4e778092013-02-06 10:05:46 +000094 if (StartsObjCMethodExpr) {
95 Contexts.back().ColonIsObjCMethodExpr = true;
96 Left->Type = TT_ObjCMethodExpr;
97 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +000098
Daniel Jasper431f5912013-05-28 08:33:00 +000099 bool MightBeFunctionType = CurrentToken->is(tok::star);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000100 while (CurrentToken != NULL) {
101 // LookForDecls is set when "if (" has been seen. Check for
102 // 'identifier' '*' 'identifier' followed by not '=' -- this
103 // '*' has to be a binary operator but determineStarAmpUsage() will
104 // categorize it as an unary operator, so set the right type here.
Manuel Klimekb3987012013-05-29 14:47:47 +0000105 if (LookForDecls && CurrentToken->Next) {
106 FormatToken *Prev = CurrentToken->Previous;
107 FormatToken *Next = CurrentToken->Next;
108 if (Prev->Previous->is(tok::identifier) &&
109 Prev->isOneOf(tok::star, tok::amp, tok::ampamp) &&
110 CurrentToken->is(tok::identifier) && Next->isNot(tok::equal)) {
111 Prev->Type = TT_BinaryOperator;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000112 LookForDecls = false;
113 }
114 }
115
116 if (CurrentToken->is(tok::r_paren)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000117 if (MightBeFunctionType && CurrentToken->Next &&
118 CurrentToken->Next->isOneOf(tok::l_paren, tok::l_square))
Daniel Jasper431f5912013-05-28 08:33:00 +0000119 Left->Type = TT_FunctionTypeLParen;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000120 Left->MatchingParen = CurrentToken;
121 CurrentToken->MatchingParen = Left;
122
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000123 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000124 CurrentToken->Type = TT_ObjCMethodExpr;
125 if (Contexts.back().FirstObjCSelectorName != NULL) {
126 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
127 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000128 }
129 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000130
131 next();
132 return true;
133 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000134 if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000135 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +0000136 if (CurrentToken->Previous->Type == TT_PointerOrReference &&
137 CurrentToken->Previous->Previous->isOneOf(tok::l_paren,
138 tok::coloncolon))
Daniel Jasper431f5912013-05-28 08:33:00 +0000139 MightBeFunctionType = true;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000140 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000141 if (!consumeToken())
142 return false;
143 }
144 return false;
145 }
146
147 bool parseSquare() {
148 if (!CurrentToken)
149 return false;
150
151 // A '[' could be an index subscript (after an indentifier or after
Nico Weber051860e2013-02-10 02:08:05 +0000152 // ')' or ']'), it could be the start of an Objective-C method
153 // expression, or it could the the start of an Objective-C array literal.
Manuel Klimekb3987012013-05-29 14:47:47 +0000154 FormatToken *Left = CurrentToken->Previous;
155 FormatToken *Parent = Left->getPreviousNoneComment();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000156 bool StartsObjCMethodExpr =
Daniel Jasper6f21a982013-03-13 07:49:51 +0000157 Contexts.back().CanBeExpression &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000158 (!Parent || Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
159 tok::kw_return, tok::kw_throw) ||
Daniel Jasperac3223e2013-04-10 09:49:49 +0000160 Parent->isUnaryOperator() || Parent->Type == TT_ObjCForIn ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000161 Parent->Type == TT_CastRParen ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000162 getBinOpPrecedence(Parent->Tok.getKind(), true, true) > prec::Unknown);
Daniel Jasper923ebef2013-03-14 13:45:21 +0000163 ScopedContextCreator ContextCreator(*this, tok::l_square, 10);
Daniel Jasper6f21a982013-03-13 07:49:51 +0000164 Contexts.back().IsExpression = true;
Nico Weber051860e2013-02-10 02:08:05 +0000165 bool StartsObjCArrayLiteral = Parent && Parent->is(tok::at);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000166
Daniel Jasper4e778092013-02-06 10:05:46 +0000167 if (StartsObjCMethodExpr) {
168 Contexts.back().ColonIsObjCMethodExpr = true;
169 Left->Type = TT_ObjCMethodExpr;
Nico Weber051860e2013-02-10 02:08:05 +0000170 } else if (StartsObjCArrayLiteral) {
171 Left->Type = TT_ObjCArrayLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000172 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000173
174 while (CurrentToken != NULL) {
175 if (CurrentToken->is(tok::r_square)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000176 if (CurrentToken->Next && CurrentToken->Next->is(tok::l_paren)) {
Nico Webere8a97982013-02-06 06:20:11 +0000177 // An ObjC method call is rarely followed by an open parenthesis.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000178 // FIXME: Do we incorrectly label ":" with this?
179 StartsObjCMethodExpr = false;
180 Left->Type = TT_Unknown;
181 }
Daniel Jasper01786732013-02-04 07:21:18 +0000182 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000183 CurrentToken->Type = TT_ObjCMethodExpr;
Nico Webere8a97982013-02-06 06:20:11 +0000184 // determineStarAmpUsage() thinks that '*' '[' is allocating an
185 // array of pointers, but if '[' starts a selector then '*' is a
186 // binary operator.
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000187 if (Parent != NULL && Parent->Type == TT_PointerOrReference)
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000188 Parent->Type = TT_BinaryOperator;
Nico Weber051860e2013-02-10 02:08:05 +0000189 } else if (StartsObjCArrayLiteral) {
190 CurrentToken->Type = TT_ObjCArrayLiteral;
Daniel Jasper01786732013-02-04 07:21:18 +0000191 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000192 Left->MatchingParen = CurrentToken;
193 CurrentToken->MatchingParen = Left;
Daniel Jasper4e778092013-02-06 10:05:46 +0000194 if (Contexts.back().FirstObjCSelectorName != NULL)
195 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
196 Contexts.back().LongestObjCSelectorName;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000197 next();
198 return true;
199 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000200 if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000201 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000202 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000203 if (!consumeToken())
204 return false;
205 }
206 return false;
207 }
208
209 bool parseBrace() {
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000210 if (CurrentToken != NULL) {
211 ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
Manuel Klimekb3987012013-05-29 14:47:47 +0000212 FormatToken *Left = CurrentToken->Previous;
Nico Weberf2ff8122013-05-26 05:39:26 +0000213
Manuel Klimekb3987012013-05-29 14:47:47 +0000214 FormatToken *Parent = Left->getPreviousNoneComment();
Nico Weberf2ff8122013-05-26 05:39:26 +0000215 bool StartsObjCDictLiteral = Parent && Parent->is(tok::at);
216 if (StartsObjCDictLiteral) {
217 Contexts.back().ColonIsObjCDictLiteral = true;
218 Left->Type = TT_ObjCDictLiteral;
219 }
220
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000221 while (CurrentToken != NULL) {
222 if (CurrentToken->is(tok::r_brace)) {
Nico Weberf2ff8122013-05-26 05:39:26 +0000223 if (StartsObjCDictLiteral)
224 CurrentToken->Type = TT_ObjCDictLiteral;
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000225 Left->MatchingParen = CurrentToken;
226 CurrentToken->MatchingParen = Left;
227 next();
228 return true;
229 }
230 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
231 return false;
232 updateParameterCount(Left, CurrentToken);
233 if (!consumeToken())
234 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000235 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000236 }
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000237 // No closing "}" found, this probably starts a definition.
238 Line.StartsDefinition = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000239 return true;
240 }
Daniel Jasperc4615b72013-02-20 12:56:39 +0000241
Manuel Klimekb3987012013-05-29 14:47:47 +0000242 void updateParameterCount(FormatToken *Left, FormatToken *Current) {
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000243 if (Current->is(tok::comma))
244 ++Left->ParameterCount;
245 else if (Left->ParameterCount == 0 && Current->isNot(tok::comment))
246 Left->ParameterCount = 1;
247 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000248
249 bool parseConditional() {
250 while (CurrentToken != NULL) {
251 if (CurrentToken->is(tok::colon)) {
252 CurrentToken->Type = TT_ConditionalExpr;
253 next();
254 return true;
255 }
256 if (!consumeToken())
257 return false;
258 }
259 return false;
260 }
261
262 bool parseTemplateDeclaration() {
263 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
264 CurrentToken->Type = TT_TemplateOpener;
265 next();
266 if (!parseAngle())
267 return false;
Daniel Jasper34511fb2013-02-19 17:14:38 +0000268 if (CurrentToken != NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000269 CurrentToken->Previous->ClosesTemplateDeclaration = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000270 return true;
271 }
272 return false;
273 }
274
275 bool consumeToken() {
Manuel Klimekb3987012013-05-29 14:47:47 +0000276 FormatToken *Tok = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000277 next();
Manuel Klimekb3987012013-05-29 14:47:47 +0000278 switch (Tok->Tok.getKind()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000279 case tok::plus:
280 case tok::minus:
Manuel Klimekb3987012013-05-29 14:47:47 +0000281 if (Tok->Previous == NULL && Line.MustBeDeclaration)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000282 Tok->Type = TT_ObjCMethodSpecifier;
283 break;
284 case tok::colon:
Manuel Klimekb3987012013-05-29 14:47:47 +0000285 if (Tok->Previous == NULL)
Daniel Jaspercf6d76a2013-03-18 12:50:26 +0000286 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000287 // Colons from ?: are handled in parseConditional().
Manuel Klimekb3987012013-05-29 14:47:47 +0000288 if (Tok->Previous->is(tok::r_paren) && Contexts.size() == 1) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000289 Tok->Type = TT_CtorInitializerColon;
Nico Weberf2ff8122013-05-26 05:39:26 +0000290 } else if (Contexts.back().ColonIsObjCDictLiteral) {
291 Tok->Type = TT_ObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000292 } else if (Contexts.back().ColonIsObjCMethodExpr ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000293 Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000294 Tok->Type = TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000295 Tok->Previous->Type = TT_ObjCSelectorName;
Alexander Kornienko00895102013-06-05 14:09:10 +0000296 if (Tok->Previous->CodePointCount >
297 Contexts.back().LongestObjCSelectorName) {
298 Contexts.back().LongestObjCSelectorName =
299 Tok->Previous->CodePointCount;
300 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000301 if (Contexts.back().FirstObjCSelectorName == NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000302 Contexts.back().FirstObjCSelectorName = Tok->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +0000303 } else if (Contexts.back().ColonIsForRangeExpr) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000304 Tok->Type = TT_RangeBasedForLoopColon;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000305 } else if (Contexts.size() == 1) {
306 Tok->Type = TT_InheritanceColon;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000307 } else if (Contexts.back().ContextKind == tok::l_paren) {
308 Tok->Type = TT_InlineASMColon;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000309 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000310 break;
311 case tok::kw_if:
312 case tok::kw_while:
313 if (CurrentToken != NULL && CurrentToken->is(tok::l_paren)) {
314 next();
315 if (!parseParens(/*LookForDecls=*/ true))
316 return false;
317 }
318 break;
319 case tok::kw_for:
Daniel Jasper4e778092013-02-06 10:05:46 +0000320 Contexts.back().ColonIsForRangeExpr = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000321 next();
322 if (!parseParens())
323 return false;
324 break;
325 case tok::l_paren:
326 if (!parseParens())
327 return false;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000328 if (Line.MustBeDeclaration && NameFound && !Contexts.back().IsExpression)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000329 Line.MightBeFunctionDecl = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000330 break;
331 case tok::l_square:
332 if (!parseSquare())
333 return false;
334 break;
335 case tok::l_brace:
336 if (!parseBrace())
337 return false;
338 break;
339 case tok::less:
340 if (parseAngle())
341 Tok->Type = TT_TemplateOpener;
342 else {
343 Tok->Type = TT_BinaryOperator;
344 CurrentToken = Tok;
345 next();
346 }
347 break;
348 case tok::r_paren:
349 case tok::r_square:
350 return false;
351 case tok::r_brace:
352 // Lines can start with '}'.
Manuel Klimekb3987012013-05-29 14:47:47 +0000353 if (Tok->Previous != NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000354 return false;
355 break;
356 case tok::greater:
357 Tok->Type = TT_BinaryOperator;
358 break;
359 case tok::kw_operator:
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000360 while (CurrentToken && CurrentToken->isNot(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000361 if (CurrentToken->isOneOf(tok::star, tok::amp))
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000362 CurrentToken->Type = TT_PointerOrReference;
363 consumeToken();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000364 }
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000365 if (CurrentToken) {
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000366 CurrentToken->Type = TT_OverloadedOperatorLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000367 if (CurrentToken->Previous->Type == TT_BinaryOperator)
368 CurrentToken->Previous->Type = TT_OverloadedOperator;
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000369 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000370 break;
371 case tok::question:
372 parseConditional();
373 break;
374 case tok::kw_template:
375 parseTemplateDeclaration();
376 break;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000377 case tok::identifier:
Manuel Klimekb3987012013-05-29 14:47:47 +0000378 if (Line.First->is(tok::kw_for) &&
379 Tok->Tok.getIdentifierInfo() == &Ident_in)
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000380 Tok->Type = TT_ObjCForIn;
381 break;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000382 case tok::comma:
383 if (Contexts.back().FirstStartOfName)
384 Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
385 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000386 default:
387 break;
388 }
389 return true;
390 }
391
392 void parseIncludeDirective() {
393 next();
394 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
395 next();
396 while (CurrentToken != NULL) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000397 if (CurrentToken->isNot(tok::comment) || CurrentToken->Next)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000398 CurrentToken->Type = TT_ImplicitStringLiteral;
399 next();
400 }
401 } else {
402 while (CurrentToken != NULL) {
Daniel Jasper3a204412013-02-23 07:46:38 +0000403 if (CurrentToken->is(tok::string_literal))
404 // Mark these string literals as "implicit" literals, too, so that
405 // they are not split or line-wrapped.
406 CurrentToken->Type = TT_ImplicitStringLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000407 next();
408 }
409 }
410 }
411
412 void parseWarningOrError() {
413 next();
414 // We still want to format the whitespace left of the first token of the
415 // warning or error.
416 next();
417 while (CurrentToken != NULL) {
418 CurrentToken->Type = TT_ImplicitStringLiteral;
419 next();
420 }
421 }
422
423 void parsePreprocessorDirective() {
424 next();
425 if (CurrentToken == NULL)
426 return;
427 // Hashes in the middle of a line can lead to any strange token
428 // sequence.
Manuel Klimekb3987012013-05-29 14:47:47 +0000429 if (CurrentToken->Tok.getIdentifierInfo() == NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000430 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000431 switch (CurrentToken->Tok.getIdentifierInfo()->getPPKeywordID()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000432 case tok::pp_include:
433 case tok::pp_import:
434 parseIncludeDirective();
435 break;
436 case tok::pp_error:
437 case tok::pp_warning:
438 parseWarningOrError();
439 break;
Daniel Jasperaae7bad2013-04-23 13:54:04 +0000440 case tok::pp_if:
441 case tok::pp_elif:
442 parseLine();
443 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000444 default:
445 break;
446 }
Daniel Jasper5b7e7b02013-02-05 09:34:14 +0000447 while (CurrentToken != NULL)
448 next();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000449 }
450
Nico Weber95e8e462013-02-12 16:17:07 +0000451public:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000452 LineType parseLine() {
453 int PeriodsAndArrows = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000454 FormatToken *LastPeriodOrArrow = NULL;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000455 bool CanBeBuilderTypeStmt = true;
456 if (CurrentToken->is(tok::hash)) {
457 parsePreprocessorDirective();
458 return LT_PreprocessorDirective;
459 }
460 while (CurrentToken != NULL) {
461 if (CurrentToken->is(tok::kw_virtual))
462 KeywordVirtualFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000463 if (CurrentToken->isOneOf(tok::period, tok::arrow)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000464 ++PeriodsAndArrows;
Daniel Jasper24849712013-03-01 16:48:32 +0000465 LastPeriodOrArrow = CurrentToken;
466 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000467 FormatToken *TheToken = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000468 if (!consumeToken())
469 return LT_Invalid;
Manuel Klimekb3987012013-05-29 14:47:47 +0000470 if (TheToken->getPrecedence() > prec::Assignment &&
Daniel Jasper82282dc2013-02-18 13:52:06 +0000471 TheToken->Type == TT_BinaryOperator)
Daniel Jasper4a544e52013-02-15 20:33:06 +0000472 CanBeBuilderTypeStmt = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000473 }
474 if (KeywordVirtualFound)
475 return LT_VirtualFunctionDecl;
476
477 // Assume a builder-type call if there are 2 or more "." and "->".
Daniel Jasper24849712013-03-01 16:48:32 +0000478 if (PeriodsAndArrows >= 2 && CanBeBuilderTypeStmt) {
479 LastPeriodOrArrow->LastInChainOfCalls = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000480 return LT_BuilderTypeCall;
Daniel Jasper24849712013-03-01 16:48:32 +0000481 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000482
Manuel Klimekb3987012013-05-29 14:47:47 +0000483 if (Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000484 if (Contexts.back().FirstObjCSelectorName != NULL)
485 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
486 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000487 return LT_ObjCMethodDecl;
488 }
489
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000490 return LT_Other;
491 }
492
Nico Weber95e8e462013-02-12 16:17:07 +0000493private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000494 void next() {
Daniel Jasper01786732013-02-04 07:21:18 +0000495 if (CurrentToken != NULL) {
496 determineTokenType(*CurrentToken);
Daniel Jasper4e778092013-02-06 10:05:46 +0000497 CurrentToken->BindingStrength = Contexts.back().BindingStrength;
Daniel Jasper01786732013-02-04 07:21:18 +0000498 }
499
Manuel Klimekb3987012013-05-29 14:47:47 +0000500 if (CurrentToken != NULL)
501 CurrentToken = CurrentToken->Next;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000502
503 // Reset token type in case we have already looked at it and then recovered
504 // from an error (e.g. failure to find the matching >).
505 if (CurrentToken != NULL)
506 CurrentToken->Type = TT_Unknown;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000507 }
508
Daniel Jasper4e778092013-02-06 10:05:46 +0000509 /// \brief A struct to hold information valid in a specific context, e.g.
510 /// a pair of parenthesis.
511 struct Context {
Daniel Jasper923ebef2013-03-14 13:45:21 +0000512 Context(tok::TokenKind ContextKind, unsigned BindingStrength,
513 bool IsExpression)
514 : ContextKind(ContextKind), BindingStrength(BindingStrength),
515 LongestObjCSelectorName(0), ColonIsForRangeExpr(false),
Nico Weberf2ff8122013-05-26 05:39:26 +0000516 ColonIsObjCDictLiteral(false), ColonIsObjCMethodExpr(false),
517 FirstObjCSelectorName(NULL), FirstStartOfName(NULL),
518 IsExpression(IsExpression), CanBeExpression(true) {}
Daniel Jasper01786732013-02-04 07:21:18 +0000519
Daniel Jasper923ebef2013-03-14 13:45:21 +0000520 tok::TokenKind ContextKind;
Daniel Jasper4e778092013-02-06 10:05:46 +0000521 unsigned BindingStrength;
522 unsigned LongestObjCSelectorName;
523 bool ColonIsForRangeExpr;
Nico Weberf2ff8122013-05-26 05:39:26 +0000524 bool ColonIsObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000525 bool ColonIsObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000526 FormatToken *FirstObjCSelectorName;
527 FormatToken *FirstStartOfName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000528 bool IsExpression;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000529 bool CanBeExpression;
Daniel Jasper4e778092013-02-06 10:05:46 +0000530 };
531
532 /// \brief Puts a new \c Context onto the stack \c Contexts for the lifetime
533 /// of each instance.
534 struct ScopedContextCreator {
535 AnnotatingParser &P;
536
Daniel Jasper923ebef2013-03-14 13:45:21 +0000537 ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
538 unsigned Increase)
539 : P(P) {
540 P.Contexts.push_back(
541 Context(ContextKind, P.Contexts.back().BindingStrength + Increase,
542 P.Contexts.back().IsExpression));
Daniel Jasper4e778092013-02-06 10:05:46 +0000543 }
544
545 ~ScopedContextCreator() { P.Contexts.pop_back(); }
546 };
Daniel Jasper01786732013-02-04 07:21:18 +0000547
Manuel Klimekb3987012013-05-29 14:47:47 +0000548 void determineTokenType(FormatToken &Current) {
549 if (Current.getPrecedence() == prec::Assignment &&
550 (!Current.Previous || Current.Previous->isNot(tok::kw_operator))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000551 Contexts.back().IsExpression = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000552 for (FormatToken *Previous = Current.Previous;
Nico Weber95e8e462013-02-12 16:17:07 +0000553 Previous && Previous->isNot(tok::comma);
Manuel Klimekb3987012013-05-29 14:47:47 +0000554 Previous = Previous->Previous) {
Daniel Jasper9c65b062013-02-27 11:43:50 +0000555 if (Previous->is(tok::r_square))
556 Previous = Previous->MatchingParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000557 if (Previous->Type == TT_BinaryOperator &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000558 Previous->isOneOf(tok::star, tok::amp)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000559 Previous->Type = TT_PointerOrReference;
560 }
Daniel Jasper01786732013-02-04 07:21:18 +0000561 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000562 } else if (Current.isOneOf(tok::kw_return, tok::kw_throw) ||
Nico Weber95e8e462013-02-12 16:17:07 +0000563 (Current.is(tok::l_paren) && !Line.MustBeDeclaration &&
Daniel Jasper378d93d2013-05-13 07:14:40 +0000564 !Line.InPPDirective &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000565 (!Current.Previous || Current.Previous->isNot(tok::kw_for)))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000566 Contexts.back().IsExpression = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000567 } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000568 for (FormatToken *Previous = Current.Previous;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000569 Previous && Previous->isOneOf(tok::star, tok::amp);
Manuel Klimekb3987012013-05-29 14:47:47 +0000570 Previous = Previous->Previous)
Nico Weber95e8e462013-02-12 16:17:07 +0000571 Previous->Type = TT_PointerOrReference;
Manuel Klimekb3987012013-05-29 14:47:47 +0000572 } else if (Current.Previous &&
573 Current.Previous->Type == TT_CtorInitializerColon) {
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000574 Contexts.back().IsExpression = true;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000575 } else if (Current.is(tok::kw_new)) {
576 Contexts.back().CanBeExpression = false;
Daniel Jasper16a69ef2013-05-03 14:41:24 +0000577 } else if (Current.is(tok::semi)) {
578 // This should be the condition or increment in a for-loop.
579 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000580 }
Daniel Jasper01786732013-02-04 07:21:18 +0000581
582 if (Current.Type == TT_Unknown) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000583 if (Current.Previous && Current.is(tok::identifier) &&
584 ((Current.Previous->is(tok::identifier) &&
585 Current.Previous->Tok.getIdentifierInfo()->getPPKeywordID() ==
Daniel Jasper11e13802013-05-08 14:12:04 +0000586 tok::pp_not_keyword) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000587 isSimpleTypeSpecifier(*Current.Previous) ||
588 Current.Previous->Type == TT_PointerOrReference ||
589 Current.Previous->Type == TT_TemplateCloser)) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000590 Contexts.back().FirstStartOfName = &Current;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000591 Current.Type = TT_StartOfName;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000592 NameFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000593 } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000594 Current.Type =
595 determineStarAmpUsage(Current, Contexts.back().IsExpression);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000596 } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000597 Current.Type = determinePlusMinusCaretUsage(Current);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000598 } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000599 Current.Type = determineIncrementUsage(Current);
600 } else if (Current.is(tok::exclaim)) {
601 Current.Type = TT_UnaryOperator;
Daniel Jasperac3223e2013-04-10 09:49:49 +0000602 } else if (Current.isBinaryOperator()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000603 Current.Type = TT_BinaryOperator;
604 } else if (Current.is(tok::comment)) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000605 if (Current.TokenText.startswith("//"))
Daniel Jasper01786732013-02-04 07:21:18 +0000606 Current.Type = TT_LineComment;
607 else
608 Current.Type = TT_BlockComment;
Nico Weber37d69312013-02-13 04:13:13 +0000609 } else if (Current.is(tok::r_paren)) {
Daniel Jasperb8b42952013-05-31 16:14:28 +0000610 FormatToken *LeftOfParens = NULL;
611 if (Current.MatchingParen)
612 LeftOfParens = Current.MatchingParen->getPreviousNoneComment();
613 bool IsCast = false;
614 bool ParensAreEmpty = Current.Previous == Current.MatchingParen;
615 bool ParensAreType = !Current.Previous ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000616 Current.Previous->Type == TT_PointerOrReference ||
Daniel Jasperb8b42952013-05-31 16:14:28 +0000617 Current.Previous->Type == TT_TemplateCloser ||
618 isSimpleTypeSpecifier(*Current.Previous);
Nico Weber37d69312013-02-13 04:13:13 +0000619 bool ParensCouldEndDecl =
Manuel Klimekb3987012013-05-29 14:47:47 +0000620 Current.Next &&
621 Current.Next->isOneOf(tok::equal, tok::semi, tok::l_brace);
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000622 bool IsSizeOfOrAlignOf =
Daniel Jasperb8b42952013-05-31 16:14:28 +0000623 LeftOfParens &&
624 LeftOfParens->isOneOf(tok::kw_sizeof, tok::kw_alignof);
625 if (ParensAreType && !ParensCouldEndDecl && !IsSizeOfOrAlignOf &&
Daniel Jasper37eff832013-02-23 08:07:18 +0000626 Contexts.back().IsExpression)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000627 IsCast = true;
628 if (Current.Next &&
Daniel Jasperff1a2e52013-06-06 08:20:20 +0000629 Current.Next->isNot(tok::string_literal) &&
Daniel Jasperb8b42952013-05-31 16:14:28 +0000630 (Current.Next->Tok.isLiteral() ||
631 Current.Next->isOneOf(tok::kw_sizeof, tok::kw_alignof)))
632 IsCast = true;
633 // If there is an identifier after the (), it is likely a cast, unless
634 // there is also an identifier before the ().
Daniel Jasperff1a2e52013-06-06 08:20:20 +0000635 if (LeftOfParens && (LeftOfParens->Tok.getIdentifierInfo() == NULL ||
636 LeftOfParens->is(tok::kw_return)) &&
637 LeftOfParens->Type != TT_TemplateCloser &&
Daniel Jasperb8b42952013-05-31 16:14:28 +0000638 LeftOfParens->Type != TT_ObjCMethodExpr && Current.Next &&
639 (Current.Next->is(tok::identifier)))
640 IsCast = true;
641 if (IsCast && !ParensAreEmpty)
Nico Weber37d69312013-02-13 04:13:13 +0000642 Current.Type = TT_CastRParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000643 } else if (Current.is(tok::at) && Current.Next) {
644 switch (Current.Next->Tok.getObjCKeywordID()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000645 case tok::objc_interface:
646 case tok::objc_implementation:
647 case tok::objc_protocol:
648 Current.Type = TT_ObjCDecl;
649 break;
650 case tok::objc_property:
651 Current.Type = TT_ObjCProperty;
652 break;
653 default:
654 break;
655 }
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000656 } else if (Current.is(tok::period)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000657 FormatToken *PreviousNoComment = Current.getPreviousNoneComment();
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000658 if (PreviousNoComment &&
659 PreviousNoComment->isOneOf(tok::comma, tok::l_brace))
660 Current.Type = TT_DesignatedInitializerPeriod;
Daniel Jasper01786732013-02-04 07:21:18 +0000661 }
662 }
663 }
664
Daniel Jasper01786732013-02-04 07:21:18 +0000665 /// \brief Return the type of the given token assuming it is * or &.
Manuel Klimekb3987012013-05-29 14:47:47 +0000666 TokenType determineStarAmpUsage(const FormatToken &Tok, bool IsExpression) {
667 const FormatToken *PrevToken = Tok.getPreviousNoneComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000668 if (PrevToken == NULL)
669 return TT_UnaryOperator;
670
Manuel Klimekb3987012013-05-29 14:47:47 +0000671 const FormatToken *NextToken = Tok.getNextNoneComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000672 if (NextToken == NULL)
673 return TT_Unknown;
674
Daniel Jasper431f5912013-05-28 08:33:00 +0000675 if (PrevToken->is(tok::coloncolon) ||
676 (PrevToken->is(tok::l_paren) && !IsExpression))
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +0000677 return TT_PointerOrReference;
678
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000679 if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
Daniel Jasperd3cf17b2013-03-14 10:50:25 +0000680 tok::comma, tok::semi, tok::kw_return, tok::colon,
Daniel Jasperdbef71e2013-05-07 14:17:18 +0000681 tok::equal, tok::kw_delete) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000682 PrevToken->Type == TT_BinaryOperator ||
Daniel Jasper01786732013-02-04 07:21:18 +0000683 PrevToken->Type == TT_UnaryOperator || PrevToken->Type == TT_CastRParen)
684 return TT_UnaryOperator;
685
Nico Webere8a97982013-02-06 06:20:11 +0000686 if (NextToken->is(tok::l_square))
687 return TT_PointerOrReference;
688
Manuel Klimekb3987012013-05-29 14:47:47 +0000689 if (PrevToken->Tok.isLiteral() ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000690 PrevToken->isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000691 NextToken->Tok.isLiteral() || NextToken->isUnaryOperator())
Daniel Jasper01786732013-02-04 07:21:18 +0000692 return TT_BinaryOperator;
693
Daniel Jasper01786732013-02-04 07:21:18 +0000694 // It is very unlikely that we are going to find a pointer or reference type
695 // definition on the RHS of an assignment.
696 if (IsExpression)
697 return TT_BinaryOperator;
698
699 return TT_PointerOrReference;
700 }
701
Manuel Klimekb3987012013-05-29 14:47:47 +0000702 TokenType determinePlusMinusCaretUsage(const FormatToken &Tok) {
703 const FormatToken *PrevToken = Tok.getPreviousNoneComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000704 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000705 return TT_UnaryOperator;
706
707 // Use heuristics to recognize unary operators.
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000708 if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
709 tok::question, tok::colon, tok::kw_return,
710 tok::kw_case, tok::at, tok::l_brace))
Daniel Jasper01786732013-02-04 07:21:18 +0000711 return TT_UnaryOperator;
712
Nico Weberee0feec2013-02-05 16:21:00 +0000713 // There can't be two consecutive binary operators.
Daniel Jasper01786732013-02-04 07:21:18 +0000714 if (PrevToken->Type == TT_BinaryOperator)
715 return TT_UnaryOperator;
716
717 // Fall back to marking the token as binary operator.
718 return TT_BinaryOperator;
719 }
720
721 /// \brief Determine whether ++/-- are pre- or post-increments/-decrements.
Manuel Klimekb3987012013-05-29 14:47:47 +0000722 TokenType determineIncrementUsage(const FormatToken &Tok) {
723 const FormatToken *PrevToken = Tok.getPreviousNoneComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000724 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000725 return TT_UnaryOperator;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000726 if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
Daniel Jasper01786732013-02-04 07:21:18 +0000727 return TT_TrailingUnaryOperator;
728
729 return TT_UnaryOperator;
730 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000731
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000732 // FIXME: This is copy&pasted from Sema. Put it in a common place and remove
733 // duplication.
734 /// \brief Determine whether the token kind starts a simple-type-specifier.
Manuel Klimekb3987012013-05-29 14:47:47 +0000735 bool isSimpleTypeSpecifier(const FormatToken &Tok) const {
736 switch (Tok.Tok.getKind()) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000737 case tok::kw_short:
738 case tok::kw_long:
739 case tok::kw___int64:
740 case tok::kw___int128:
741 case tok::kw_signed:
742 case tok::kw_unsigned:
743 case tok::kw_void:
744 case tok::kw_char:
745 case tok::kw_int:
746 case tok::kw_half:
747 case tok::kw_float:
748 case tok::kw_double:
749 case tok::kw_wchar_t:
750 case tok::kw_bool:
751 case tok::kw___underlying_type:
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000752 case tok::annot_typename:
753 case tok::kw_char16_t:
754 case tok::kw_char32_t:
755 case tok::kw_typeof:
756 case tok::kw_decltype:
Alexander Kornienko00895102013-06-05 14:09:10 +0000757 return true;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000758 default:
Alexander Kornienko00895102013-06-05 14:09:10 +0000759 return false;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000760 }
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000761 }
762
Daniel Jasper4e778092013-02-06 10:05:46 +0000763 SmallVector<Context, 8> Contexts;
764
Daniel Jasper4e778092013-02-06 10:05:46 +0000765 AnnotatedLine &Line;
Manuel Klimekb3987012013-05-29 14:47:47 +0000766 FormatToken *CurrentToken;
Daniel Jasper4e778092013-02-06 10:05:46 +0000767 bool KeywordVirtualFound;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000768 bool NameFound;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000769 IdentifierInfo &Ident_in;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000770};
771
Daniel Jasper29f123b2013-02-08 15:28:42 +0000772/// \brief Parses binary expressions by inserting fake parenthesis based on
773/// operator precedence.
774class ExpressionParser {
775public:
Manuel Klimekb3987012013-05-29 14:47:47 +0000776 ExpressionParser(AnnotatedLine &Line) : Current(Line.First) {}
Daniel Jasper29f123b2013-02-08 15:28:42 +0000777
778 /// \brief Parse expressions with the given operatore precedence.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000779 void parse(int Precedence = 0) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000780 // Conditional expressions need to be parsed separately for proper nesting.
781 if (Precedence == prec::Conditional + 1) {
782 parseConditionalExpr();
783 return;
784 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000785 if (Precedence > prec::PointerToMember || Current == NULL)
786 return;
787
Daniel Jasper29f123b2013-02-08 15:28:42 +0000788 // Eagerly consume trailing comments.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000789 while (Current && Current->isTrailingComment()) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000790 next();
791 }
792
Manuel Klimekb3987012013-05-29 14:47:47 +0000793 FormatToken *Start = Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000794 bool OperatorFound = false;
795
Daniel Jasper237d4c12013-02-23 21:01:55 +0000796 while (Current) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000797 // Consume operators with higher precedence.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000798 parse(Precedence + 1);
Daniel Jasper29f123b2013-02-08 15:28:42 +0000799
Daniel Jasper237d4c12013-02-23 21:01:55 +0000800 int CurrentPrecedence = 0;
801 if (Current) {
802 if (Current->Type == TT_ConditionalExpr)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000803 CurrentPrecedence = 1 + (int)prec::Conditional;
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000804 else if (Current->is(tok::semi) || Current->Type == TT_InlineASMColon)
Daniel Jasper237d4c12013-02-23 21:01:55 +0000805 CurrentPrecedence = 1;
806 else if (Current->Type == TT_BinaryOperator || Current->is(tok::comma))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000807 CurrentPrecedence = 1 + (int)Current->getPrecedence();
Daniel Jasper237d4c12013-02-23 21:01:55 +0000808 }
809
Daniel Jasper29f123b2013-02-08 15:28:42 +0000810 // At the end of the line or when an operator with higher precedence is
811 // found, insert fake parenthesis and return.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000812 if (Current == NULL || Current->closesScope() ||
Daniel Jasper237d4c12013-02-23 21:01:55 +0000813 (CurrentPrecedence != 0 && CurrentPrecedence < Precedence)) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000814 if (OperatorFound)
815 addFakeParenthesis(Start, prec::Level(Precedence - 1));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000816 return;
817 }
818
819 // Consume scopes: (), [], <> and {}
Daniel Jasperac3223e2013-04-10 09:49:49 +0000820 if (Current->opensScope()) {
821 while (Current && !Current->closesScope()) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000822 next();
823 parse();
824 }
825 next();
826 } else {
827 // Operator found.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000828 if (CurrentPrecedence == Precedence)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000829 OperatorFound = true;
830
831 next();
832 }
833 }
834 }
835
836private:
Daniel Jasperc01897c2013-05-31 14:56:12 +0000837 void addFakeParenthesis(FormatToken *Start, prec::Level Precedence) {
838 Start->FakeLParens.push_back(Precedence);
839 if (Current)
840 ++Current->Previous->FakeRParens;
841 }
842
843 void parseConditionalExpr() {
844 FormatToken *Start = Current;
845 parse(prec::LogicalOr + 1);
846 if (!Current || !Current->is(tok::question))
847 return;
848 next();
849 parse(prec::LogicalOr + 1);
850 if (!Current || Current->Type != TT_ConditionalExpr)
851 return;
852 next();
853 parseConditionalExpr();
854 addFakeParenthesis(Start, prec::Conditional);
855 }
856
Daniel Jasper29f123b2013-02-08 15:28:42 +0000857 void next() {
858 if (Current != NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000859 Current = Current->Next;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000860 }
861
Manuel Klimekb3987012013-05-29 14:47:47 +0000862 FormatToken *Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000863};
864
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000865void TokenAnnotator::annotate(AnnotatedLine &Line) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000866 AnnotatingParser Parser(Line, Ident_in);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000867 Line.Type = Parser.parseLine();
868 if (Line.Type == LT_Invalid)
869 return;
870
Daniel Jasper29f123b2013-02-08 15:28:42 +0000871 ExpressionParser ExprParser(Line);
872 ExprParser.parse();
873
Manuel Klimekb3987012013-05-29 14:47:47 +0000874 if (Line.First->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000875 Line.Type = LT_ObjCMethodDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000876 else if (Line.First->Type == TT_ObjCDecl)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000877 Line.Type = LT_ObjCDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000878 else if (Line.First->Type == TT_ObjCProperty)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000879 Line.Type = LT_ObjCProperty;
880
Manuel Klimekb3987012013-05-29 14:47:47 +0000881 Line.First->SpacesRequiredBefore = 1;
882 Line.First->CanBreakBefore = Line.First->MustBreakBefore;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000883}
884
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000885void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000886 Line.First->TotalLength = Line.First->CodePointCount;
Manuel Klimekb3987012013-05-29 14:47:47 +0000887 if (!Line.First->Next)
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000888 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000889 FormatToken *Current = Line.First->Next;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000890 while (Current != NULL) {
Daniel Jasper729a7432013-02-11 12:36:37 +0000891 if (Current->Type == TT_LineComment)
892 Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
893 else
894 Current->SpacesRequiredBefore =
895 spaceRequiredBefore(Line, *Current) ? 1 : 0;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000896
Manuel Klimekb3987012013-05-29 14:47:47 +0000897 if (Current->MustBreakBefore) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000898 } else if (Current->Type == TT_LineComment) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000899 Current->MustBreakBefore = Current->NewlinesBefore > 0;
900 } else if (Current->Previous->isTrailingComment() ||
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000901 (Current->is(tok::string_literal) &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000902 Current->Previous->is(tok::string_literal))) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000903 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000904 } else if (Current->is(tok::lessless) && Current->Next &&
905 Current->Previous->is(tok::string_literal) &&
906 Current->Next->is(tok::string_literal)) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000907 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000908 } else if (Current->Previous->ClosesTemplateDeclaration &&
Daniel Jasperbbc87762013-05-29 12:07:31 +0000909 Style.AlwaysBreakTemplateDeclarations) {
910 Current->MustBreakBefore = true;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000911 } else {
912 Current->MustBreakBefore = false;
913 }
914 Current->CanBreakBefore =
915 Current->MustBreakBefore || canBreakBefore(Line, *Current);
916 if (Current->MustBreakBefore)
Manuel Klimekb3987012013-05-29 14:47:47 +0000917 Current->TotalLength = Current->Previous->TotalLength + Style.ColumnLimit;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000918 else
919 Current->TotalLength =
Alexander Kornienko00895102013-06-05 14:09:10 +0000920 Current->Previous->TotalLength + Current->CodePointCount +
Daniel Jasper729a7432013-02-11 12:36:37 +0000921 Current->SpacesRequiredBefore;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000922 // FIXME: Only calculate this if CanBreakBefore is true once static
923 // initializers etc. are sorted out.
924 // FIXME: Move magic numbers to a better place.
925 Current->SplitPenalty =
926 20 * Current->BindingStrength + splitPenalty(Line, *Current);
927
Manuel Klimekb3987012013-05-29 14:47:47 +0000928 Current = Current->Next;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000929 }
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000930
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000931 calculateUnbreakableTailLengths(Line);
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000932 DEBUG({
933 printDebugInfo(Line);
934 });
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000935}
936
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000937void TokenAnnotator::calculateUnbreakableTailLengths(AnnotatedLine &Line) {
938 unsigned UnbreakableTailLength = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000939 FormatToken *Current = Line.Last;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000940 while (Current != NULL) {
941 Current->UnbreakableTailLength = UnbreakableTailLength;
942 if (Current->CanBreakBefore ||
943 Current->isOneOf(tok::comment, tok::string_literal)) {
944 UnbreakableTailLength = 0;
945 } else {
946 UnbreakableTailLength +=
Alexander Kornienko00895102013-06-05 14:09:10 +0000947 Current->CodePointCount + Current->SpacesRequiredBefore;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000948 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000949 Current = Current->Previous;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000950 }
951}
952
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000953unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +0000954 const FormatToken &Tok) {
955 const FormatToken &Left = *Tok.Previous;
956 const FormatToken &Right = Tok;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000957
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000958 if (Left.is(tok::semi))
959 return 0;
960 if (Left.is(tok::comma))
961 return 1;
962
Daniel Jasper3c08a812013-02-24 18:54:32 +0000963 if (Right.Type == TT_StartOfName) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000964 if (Line.First->is(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000965 return 3;
966 else if (Line.MightBeFunctionDecl && Right.BindingStrength == 1)
967 // FIXME: Clean up hack of using BindingStrength to find top-level names.
968 return Style.PenaltyReturnTypeOnItsOwnLine;
969 else
Daniel Jasper1407bee2013-04-11 14:29:13 +0000970 return 200;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000971 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000972 if (Left.is(tok::equal) && Right.is(tok::l_brace))
973 return 150;
974 if (Left.is(tok::coloncolon))
975 return 500;
Daniel Jasper6b119d62013-04-05 17:22:09 +0000976 if (Left.isOneOf(tok::kw_class, tok::kw_struct))
977 return 5000;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000978
Daniel Jasper6cabab42013-02-14 08:42:54 +0000979 if (Left.Type == TT_RangeBasedForLoopColon ||
980 Left.Type == TT_InheritanceColon)
Daniel Jasper84a1a632013-02-26 13:18:08 +0000981 return 2;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000982
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000983 if (Right.isOneOf(tok::arrow, tok::period) &&
984 Right.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper515f65d2013-02-18 13:24:21 +0000985 if (Line.Type == LT_BuilderTypeCall)
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000986 return prec::PointerToMember;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000987 if (Left.isOneOf(tok::r_paren, tok::r_square) && Left.MatchingParen &&
988 Left.MatchingParen->ParameterCount > 0)
Daniel Jasper518ee342013-02-26 13:59:14 +0000989 return 20; // Should be smaller than breaking at a nested comma.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000990 return 150;
991 }
992
Daniel Jasper5ad72bb2013-05-22 08:28:26 +0000993 // Breaking before a trailing 'const' is bad.
994 if (Left.is(tok::r_paren) && Right.is(tok::kw_const))
995 return 150;
996
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000997 // In for-loops, prefer breaking at ',' and ';'.
Manuel Klimekb3987012013-05-29 14:47:47 +0000998 if (Line.First->is(tok::kw_for) && Left.is(tok::equal))
Daniel Jasper7d812812013-02-21 15:00:29 +0000999 return 4;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001000
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001001 // In Objective-C method expressions, prefer breaking before "param:" over
1002 // breaking after it.
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001003 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001004 return 0;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001005 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001006 return 20;
1007
Daniel Jasper1407bee2013-04-11 14:29:13 +00001008 if (Left.is(tok::l_paren) && Line.MightBeFunctionDecl)
1009 return 100;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001010 if (Left.opensScope())
Daniel Jasper64f09282013-03-20 13:53:11 +00001011 return Left.ParameterCount > 1 ? prec::Comma : 20;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001012
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001013 if (Right.is(tok::lessless)) {
1014 if (Left.is(tok::string_literal)) {
Alexander Kornienko00895102013-06-05 14:09:10 +00001015 StringRef Content = Left.TokenText;
Daniel Jasperbfa1edd2013-03-14 14:00:17 +00001016 Content = Content.drop_back(1).drop_front(1).trim();
1017 if (Content.size() > 1 &&
1018 (Content.back() == ':' || Content.back() == '='))
Daniel Jasper6e6efa72013-05-22 09:13:26 +00001019 return 20;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001020 }
Daniel Jasper01786732013-02-04 07:21:18 +00001021 return prec::Shift;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001022 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001023 if (Left.Type == TT_ConditionalExpr)
Daniel Jasper518ee342013-02-26 13:59:14 +00001024 return prec::Conditional;
Manuel Klimekb3987012013-05-29 14:47:47 +00001025 prec::Level Level = Left.getPrecedence();
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001026
1027 if (Level != prec::Unknown)
1028 return Level;
Daniel Jasper24849712013-03-01 16:48:32 +00001029
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001030 return 3;
1031}
1032
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001033bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001034 const FormatToken &Left,
1035 const FormatToken &Right) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001036 if (Right.is(tok::hashhash))
1037 return Left.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001038 if (Left.isOneOf(tok::hashhash, tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001039 return Right.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001040 if (Right.isOneOf(tok::r_paren, tok::semi, tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001041 return false;
1042 if (Right.is(tok::less) &&
1043 (Left.is(tok::kw_template) ||
1044 (Line.Type == LT_ObjCDecl && Style.ObjCSpaceBeforeProtocolList)))
1045 return true;
1046 if (Left.is(tok::arrow) || Right.is(tok::arrow))
1047 return false;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001048 if (Left.isOneOf(tok::exclaim, tok::tilde))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001049 return false;
1050 if (Left.is(tok::at) &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001051 Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
1052 tok::numeric_constant, tok::l_paren, tok::l_brace,
1053 tok::kw_true, tok::kw_false))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001054 return false;
1055 if (Left.is(tok::coloncolon))
1056 return false;
1057 if (Right.is(tok::coloncolon))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001058 return !Left.isOneOf(tok::identifier, tok::greater, tok::l_paren);
1059 if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001060 return false;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001061 if (Right.Type == TT_PointerOrReference)
Manuel Klimekb3987012013-05-29 14:47:47 +00001062 return Left.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001063 ((Left.Type != TT_PointerOrReference) && Left.isNot(tok::l_paren) &&
1064 !Style.PointerBindsToType);
Daniel Jasper3ff4a2f2013-05-28 15:27:10 +00001065 if (Right.Type == TT_FunctionTypeLParen && Left.isNot(tok::l_paren) &&
Daniel Jasper395228f2013-05-08 14:58:20 +00001066 (Left.Type != TT_PointerOrReference || Style.PointerBindsToType))
1067 return true;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001068 if (Left.Type == TT_PointerOrReference)
Manuel Klimekb3987012013-05-29 14:47:47 +00001069 return Right.Tok.isLiteral() ||
Daniel Jasper9322aae2013-03-20 09:53:18 +00001070 ((Right.Type != TT_PointerOrReference) &&
Daniel Jasper81d2d382013-04-01 17:13:26 +00001071 Right.isNot(tok::l_paren) && Style.PointerBindsToType &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001072 Left.Previous &&
1073 !Left.Previous->isOneOf(tok::l_paren, tok::coloncolon));
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001074 if (Right.is(tok::star) && Left.is(tok::l_paren))
1075 return false;
Nico Weber051860e2013-02-10 02:08:05 +00001076 if (Left.is(tok::l_square))
1077 return Left.Type == TT_ObjCArrayLiteral && Right.isNot(tok::r_square);
1078 if (Right.is(tok::r_square))
1079 return Right.Type == TT_ObjCArrayLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001080 if (Right.is(tok::l_square) && Right.Type != TT_ObjCMethodExpr)
1081 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001082 if (Left.is(tok::colon))
1083 return Left.Type != TT_ObjCMethodExpr;
1084 if (Right.is(tok::colon))
1085 return Right.Type != TT_ObjCMethodExpr;
1086 if (Left.is(tok::l_paren))
1087 return false;
1088 if (Right.is(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001089 return Line.Type == LT_ObjCDecl ||
1090 Left.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
1091 tok::kw_return, tok::kw_catch, tok::kw_new,
Daniel Jasper454cb702013-05-03 14:50:50 +00001092 tok::kw_delete, tok::semi);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001093 }
Manuel Klimekb3987012013-05-29 14:47:47 +00001094 if (Left.is(tok::at) && Right.Tok.getObjCKeywordID() != tok::objc_not_keyword)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001095 return false;
1096 if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
Daniel Jasper2424eef2013-05-23 10:15:45 +00001097 return false; // No spaces in "{}".
1098 if (Left.is(tok::l_brace) || Right.is(tok::r_brace))
1099 return Style.SpacesInBracedLists;
Daniel Jasper1bee0732013-05-23 18:05:18 +00001100 if (Right.Type == TT_UnaryOperator)
1101 return !Left.isOneOf(tok::l_paren, tok::l_square, tok::at) &&
1102 (Left.isNot(tok::colon) || Left.Type != TT_ObjCMethodExpr);
Daniel Jasperce933562013-05-23 21:35:49 +00001103 if (Left.isOneOf(tok::identifier, tok::greater, tok::r_square) &&
1104 Right.is(tok::l_brace) && Right.getNextNoneComment())
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001105 return false;
Daniel Jasperf0220182013-05-06 06:35:44 +00001106 if (Right.is(tok::ellipsis))
1107 return false;
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001108 if (Left.is(tok::period) || Right.is(tok::period))
1109 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001110 return true;
1111}
1112
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001113bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001114 const FormatToken &Tok) {
1115 if (Tok.Tok.getIdentifierInfo() && Tok.Previous->Tok.getIdentifierInfo())
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001116 return true; // Never ever merge two identifiers.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001117 if (Line.Type == LT_ObjCMethodDecl) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001118 if (Tok.Previous->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001119 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001120 if (Tok.Previous->is(tok::r_paren) && Tok.is(tok::identifier))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001121 // Don't space between ')' and <id>
1122 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001123 }
1124 if (Line.Type == LT_ObjCProperty &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001125 (Tok.is(tok::equal) || Tok.Previous->is(tok::equal)))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001126 return false;
1127
Manuel Klimekb3987012013-05-29 14:47:47 +00001128 if (Tok.Previous->is(tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001129 return true;
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001130 if (Tok.is(tok::comma))
1131 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001132 if (Tok.Type == TT_CtorInitializerColon || Tok.Type == TT_ObjCBlockLParen)
1133 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001134 if (Tok.Previous->Tok.is(tok::kw_operator))
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001135 return false;
1136 if (Tok.Type == TT_OverloadedOperatorLParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001137 return false;
1138 if (Tok.is(tok::colon))
Manuel Klimekb3987012013-05-29 14:47:47 +00001139 return !Line.First->isOneOf(tok::kw_case, tok::kw_default) &&
Daniel Jasperac3223e2013-04-10 09:49:49 +00001140 Tok.getNextNoneComment() != NULL && Tok.Type != TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +00001141 if (Tok.Previous->Type == TT_UnaryOperator ||
1142 Tok.Previous->Type == TT_CastRParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001143 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001144 if (Tok.Previous->is(tok::greater) && Tok.is(tok::greater)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +00001145 return Tok.Type == TT_TemplateCloser &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001146 Tok.Previous->Type == TT_TemplateCloser &&
Daniel Jasper29f123b2013-02-08 15:28:42 +00001147 Style.Standard != FormatStyle::LS_Cpp11;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001148 }
Alexander Kornienko54a38bd2013-03-20 16:41:56 +00001149 if (Tok.isOneOf(tok::arrowstar, tok::periodstar) ||
Manuel Klimekb3987012013-05-29 14:47:47 +00001150 Tok.Previous->isOneOf(tok::arrowstar, tok::periodstar))
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001151 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001152 if (Tok.Type == TT_BinaryOperator || Tok.Previous->Type == TT_BinaryOperator)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001153 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001154 if (Tok.Previous->Type == TT_TemplateCloser && Tok.is(tok::l_paren))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001155 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001156 if (Tok.is(tok::less) && Line.First->is(tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001157 return true;
1158 if (Tok.Type == TT_TrailingUnaryOperator)
1159 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001160 return spaceRequiredBetween(Line, *Tok.Previous, Tok);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001161}
1162
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001163bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001164 const FormatToken &Right) {
1165 const FormatToken &Left = *Right.Previous;
Daniel Jaspera03ab102013-02-13 20:33:44 +00001166 if (Right.Type == TT_StartOfName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001167 return true;
Nico Weberf2ff8122013-05-26 05:39:26 +00001168 if (Right.is(tok::colon) &&
1169 (Right.Type == TT_ObjCDictLiteral || Right.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001170 return false;
Nico Weberf2ff8122013-05-26 05:39:26 +00001171 if (Left.is(tok::colon) &&
1172 (Left.Type == TT_ObjCDictLiteral || Left.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001173 return true;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001174 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001175 return true;
1176 if (Left.ClosesTemplateDeclaration)
1177 return true;
1178 if (Right.Type == TT_ConditionalExpr || Right.is(tok::question))
1179 return true;
Daniel Jasper6cabab42013-02-14 08:42:54 +00001180 if (Right.Type == TT_RangeBasedForLoopColon ||
Daniel Jasper27b91cc2013-04-05 17:21:59 +00001181 Right.Type == TT_OverloadedOperatorLParen)
Daniel Jasper6cabab42013-02-14 08:42:54 +00001182 return false;
Daniel Jasperc194c952013-05-06 06:45:09 +00001183 if (Left.Type == TT_RangeBasedForLoopColon)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001184 return true;
Daniel Jasper7d812812013-02-21 15:00:29 +00001185 if (Right.Type == TT_RangeBasedForLoopColon)
1186 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001187 if (Left.Type == TT_PointerOrReference || Left.Type == TT_TemplateCloser ||
1188 Left.Type == TT_UnaryOperator || Left.Type == TT_ConditionalExpr ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001189 Left.isOneOf(tok::question, tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001190 return false;
1191 if (Left.is(tok::equal) && Line.Type == LT_VirtualFunctionDecl)
1192 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001193 if (Left.is(tok::l_paren) && Right.is(tok::l_paren) && Left.Previous &&
1194 Left.Previous->is(tok::kw___attribute))
Daniel Jasper8ed41002013-02-28 14:44:25 +00001195 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001196
1197 if (Right.Type == TT_LineComment)
1198 // We rely on MustBreakBefore being set correctly here as we should not
1199 // change the "binding" behavior of a comment.
1200 return false;
1201
Daniel Jasper5ad72bb2013-05-22 08:28:26 +00001202 // We only break before r_brace if there was a corresponding break before
1203 // the l_brace, which is tracked by BreakBeforeClosingBrace.
1204 if (Right.isOneOf(tok::r_brace, tok::r_paren, tok::greater))
1205 return false;
1206
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001207 // Allow breaking after a trailing 'const', e.g. after a method declaration,
1208 // unless it is follow by ';', '{' or '='.
Manuel Klimekb3987012013-05-29 14:47:47 +00001209 if (Left.is(tok::kw_const) && Left.Previous != NULL &&
1210 Left.Previous->is(tok::r_paren))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001211 return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001212
Daniel Jasper8ef19a22013-03-14 09:50:46 +00001213 if (Right.is(tok::kw___attribute))
1214 return true;
1215
Daniel Jasper3a204412013-02-23 07:46:38 +00001216 if (Left.is(tok::identifier) && Right.is(tok::string_literal))
1217 return true;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001218 return (Left.isBinaryOperator() && Left.isNot(tok::lessless)) ||
Daniel Jasper6b119d62013-04-05 17:22:09 +00001219 Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace,
1220 tok::kw_class, tok::kw_struct) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001221 Right.isOneOf(tok::lessless, tok::arrow, tok::period, tok::colon) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001222 (Left.is(tok::r_paren) && Left.Type != TT_CastRParen &&
Daniel Jaspere033e872013-05-21 09:16:31 +00001223 Right.isOneOf(tok::identifier, tok::kw_const, tok::kw___attribute)) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001224 (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
1225 (Left.is(tok::l_square) && !Right.is(tok::r_square));
1226}
1227
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001228void TokenAnnotator::printDebugInfo(const AnnotatedLine &Line) {
1229 llvm::errs() << "AnnotatedTokens:\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001230 const FormatToken *Tok = Line.First;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001231 while (Tok) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001232 llvm::errs() << " M=" << Tok->MustBreakBefore
1233 << " C=" << Tok->CanBreakBefore << " T=" << Tok->Type << " S="
1234 << Tok->SpacesRequiredBefore << " P=" << Tok->SplitPenalty
1235 << " Name=" << Tok->Tok.getName() << " FakeLParens=";
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001236 for (unsigned i = 0, e = Tok->FakeLParens.size(); i != e; ++i)
1237 llvm::errs() << Tok->FakeLParens[i] << "/";
1238 llvm::errs() << " FakeRParens=" << Tok->FakeRParens << "\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001239 Tok = Tok->Next;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001240 }
1241 llvm::errs() << "----\n";
1242}
1243
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001244} // namespace format
1245} // namespace clang