blob: 83dea841b5ec7c5041431513c6e735ebe26182a7 [file] [log] [blame]
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements a token annotator, i.e. creates
12/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
13///
14//===----------------------------------------------------------------------===//
15
16#include "TokenAnnotator.h"
17#include "clang/Basic/SourceManager.h"
18#include "clang/Lex/Lexer.h"
Daniel Jasperbf71ba22013-04-08 20:33:42 +000019#include "llvm/Support/Debug.h"
Daniel Jasper32d28ee2013-01-29 21:01:14 +000020
21namespace clang {
22namespace format {
23
/// \brief A parser that gathers additional information about tokens.
///
/// The \c TokenAnnotator tries to match parentheses and square brackets and
/// to store the parenthesis levels. It also tries to resolve matching "<" and
/// ">" into template parameter lists.
29class AnnotatingParser {
30public:
Nico Weberc2e6d2a2013-02-11 15:32:15 +000031 AnnotatingParser(SourceManager &SourceMgr, Lexer &Lex, AnnotatedLine &Line,
32 IdentifierInfo &Ident_in)
Manuel Klimekb3987012013-05-29 14:47:47 +000033 : SourceMgr(SourceMgr), Lex(Lex), Line(Line), CurrentToken(Line.First),
Daniel Jasper1407bee2013-04-11 14:29:13 +000034 KeywordVirtualFound(false), NameFound(false), Ident_in(Ident_in) {
Daniel Jasper923ebef2013-03-14 13:45:21 +000035 Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/ false));
Daniel Jasper32d28ee2013-01-29 21:01:14 +000036 }
37
Nico Weber95e8e462013-02-12 16:17:07 +000038private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +000039 bool parseAngle() {
40 if (CurrentToken == NULL)
41 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000042 ScopedContextCreator ContextCreator(*this, tok::less, 10);
Manuel Klimekb3987012013-05-29 14:47:47 +000043 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +000044 Contexts.back().IsExpression = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000045 while (CurrentToken != NULL) {
46 if (CurrentToken->is(tok::greater)) {
47 Left->MatchingParen = CurrentToken;
48 CurrentToken->MatchingParen = Left;
49 CurrentToken->Type = TT_TemplateCloser;
50 next();
51 return true;
52 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +000053 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace,
Daniel Jasper5d823e32013-05-15 13:46:48 +000054 tok::question, tok::colon))
55 return false;
Daniel Jasper0348be02013-06-01 18:56:00 +000056 // If a && or || is found and interpreted as a binary operator, this set
Daniel Jasper15f33f02013-06-03 16:16:41 +000057 // of angles is likely part of something like "a < b && c > d". If the
Daniel Jasper0348be02013-06-01 18:56:00 +000058 // angles are inside an expression, the ||/&& might also be a binary
59 // operator that was misinterpreted because we are parsing template
60 // parameters.
61 // FIXME: This is getting out of hand, write a decent parser.
Manuel Klimekb3987012013-05-29 14:47:47 +000062 if (CurrentToken->Previous->isOneOf(tok::pipepipe, tok::ampamp) &&
Daniel Jasper0348be02013-06-01 18:56:00 +000063 (CurrentToken->Previous->Type == TT_BinaryOperator ||
64 Contexts[Contexts.size() - 2].IsExpression) &&
Manuel Klimekb3987012013-05-29 14:47:47 +000065 Line.First->isNot(tok::kw_template))
Daniel Jasper32d28ee2013-01-29 21:01:14 +000066 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +000067 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +000068 if (!consumeToken())
69 return false;
70 }
71 return false;
72 }
73
74 bool parseParens(bool LookForDecls = false) {
75 if (CurrentToken == NULL)
76 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000077 ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
Daniel Jasper4e778092013-02-06 10:05:46 +000078
79 // FIXME: This is a bit of a hack. Do better.
80 Contexts.back().ColonIsForRangeExpr =
81 Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
82
Daniel Jasper32d28ee2013-01-29 21:01:14 +000083 bool StartsObjCMethodExpr = false;
Manuel Klimekb3987012013-05-29 14:47:47 +000084 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000085 if (CurrentToken->is(tok::caret)) {
86 // ^( starts a block.
87 Left->Type = TT_ObjCBlockLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +000088 } else if (FormatToken *MaybeSel = Left->Previous) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000089 // @selector( starts a selector.
Manuel Klimekb3987012013-05-29 14:47:47 +000090 if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Previous &&
91 MaybeSel->Previous->is(tok::at)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000092 StartsObjCMethodExpr = true;
93 }
94 }
95
Daniel Jasper4e778092013-02-06 10:05:46 +000096 if (StartsObjCMethodExpr) {
97 Contexts.back().ColonIsObjCMethodExpr = true;
98 Left->Type = TT_ObjCMethodExpr;
99 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000100
Daniel Jasper431f5912013-05-28 08:33:00 +0000101 bool MightBeFunctionType = CurrentToken->is(tok::star);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000102 while (CurrentToken != NULL) {
103 // LookForDecls is set when "if (" has been seen. Check for
104 // 'identifier' '*' 'identifier' followed by not '=' -- this
105 // '*' has to be a binary operator but determineStarAmpUsage() will
106 // categorize it as an unary operator, so set the right type here.
Manuel Klimekb3987012013-05-29 14:47:47 +0000107 if (LookForDecls && CurrentToken->Next) {
108 FormatToken *Prev = CurrentToken->Previous;
109 FormatToken *Next = CurrentToken->Next;
110 if (Prev->Previous->is(tok::identifier) &&
111 Prev->isOneOf(tok::star, tok::amp, tok::ampamp) &&
112 CurrentToken->is(tok::identifier) && Next->isNot(tok::equal)) {
113 Prev->Type = TT_BinaryOperator;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000114 LookForDecls = false;
115 }
116 }
117
118 if (CurrentToken->is(tok::r_paren)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000119 if (MightBeFunctionType && CurrentToken->Next &&
120 CurrentToken->Next->isOneOf(tok::l_paren, tok::l_square))
Daniel Jasper431f5912013-05-28 08:33:00 +0000121 Left->Type = TT_FunctionTypeLParen;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000122 Left->MatchingParen = CurrentToken;
123 CurrentToken->MatchingParen = Left;
124
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000125 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000126 CurrentToken->Type = TT_ObjCMethodExpr;
127 if (Contexts.back().FirstObjCSelectorName != NULL) {
128 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
129 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000130 }
131 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000132
133 next();
134 return true;
135 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000136 if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000137 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +0000138 if (CurrentToken->Previous->Type == TT_PointerOrReference &&
139 CurrentToken->Previous->Previous->isOneOf(tok::l_paren,
140 tok::coloncolon))
Daniel Jasper431f5912013-05-28 08:33:00 +0000141 MightBeFunctionType = true;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000142 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000143 if (!consumeToken())
144 return false;
145 }
146 return false;
147 }
148
149 bool parseSquare() {
150 if (!CurrentToken)
151 return false;
152
153 // A '[' could be an index subscript (after an indentifier or after
Nico Weber051860e2013-02-10 02:08:05 +0000154 // ')' or ']'), it could be the start of an Objective-C method
155 // expression, or it could the the start of an Objective-C array literal.
Manuel Klimekb3987012013-05-29 14:47:47 +0000156 FormatToken *Left = CurrentToken->Previous;
157 FormatToken *Parent = Left->getPreviousNoneComment();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000158 bool StartsObjCMethodExpr =
Daniel Jasper6f21a982013-03-13 07:49:51 +0000159 Contexts.back().CanBeExpression &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000160 (!Parent || Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
161 tok::kw_return, tok::kw_throw) ||
Daniel Jasperac3223e2013-04-10 09:49:49 +0000162 Parent->isUnaryOperator() || Parent->Type == TT_ObjCForIn ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000163 Parent->Type == TT_CastRParen ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000164 getBinOpPrecedence(Parent->Tok.getKind(), true, true) > prec::Unknown);
Daniel Jasper923ebef2013-03-14 13:45:21 +0000165 ScopedContextCreator ContextCreator(*this, tok::l_square, 10);
Daniel Jasper6f21a982013-03-13 07:49:51 +0000166 Contexts.back().IsExpression = true;
Nico Weber051860e2013-02-10 02:08:05 +0000167 bool StartsObjCArrayLiteral = Parent && Parent->is(tok::at);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000168
Daniel Jasper4e778092013-02-06 10:05:46 +0000169 if (StartsObjCMethodExpr) {
170 Contexts.back().ColonIsObjCMethodExpr = true;
171 Left->Type = TT_ObjCMethodExpr;
Nico Weber051860e2013-02-10 02:08:05 +0000172 } else if (StartsObjCArrayLiteral) {
173 Left->Type = TT_ObjCArrayLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000174 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000175
176 while (CurrentToken != NULL) {
177 if (CurrentToken->is(tok::r_square)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000178 if (CurrentToken->Next && CurrentToken->Next->is(tok::l_paren)) {
Nico Webere8a97982013-02-06 06:20:11 +0000179 // An ObjC method call is rarely followed by an open parenthesis.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000180 // FIXME: Do we incorrectly label ":" with this?
181 StartsObjCMethodExpr = false;
182 Left->Type = TT_Unknown;
183 }
Daniel Jasper01786732013-02-04 07:21:18 +0000184 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000185 CurrentToken->Type = TT_ObjCMethodExpr;
Nico Webere8a97982013-02-06 06:20:11 +0000186 // determineStarAmpUsage() thinks that '*' '[' is allocating an
187 // array of pointers, but if '[' starts a selector then '*' is a
188 // binary operator.
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000189 if (Parent != NULL && Parent->Type == TT_PointerOrReference)
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000190 Parent->Type = TT_BinaryOperator;
Nico Weber051860e2013-02-10 02:08:05 +0000191 } else if (StartsObjCArrayLiteral) {
192 CurrentToken->Type = TT_ObjCArrayLiteral;
Daniel Jasper01786732013-02-04 07:21:18 +0000193 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000194 Left->MatchingParen = CurrentToken;
195 CurrentToken->MatchingParen = Left;
Daniel Jasper4e778092013-02-06 10:05:46 +0000196 if (Contexts.back().FirstObjCSelectorName != NULL)
197 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
198 Contexts.back().LongestObjCSelectorName;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000199 next();
200 return true;
201 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000202 if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000203 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000204 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000205 if (!consumeToken())
206 return false;
207 }
208 return false;
209 }
210
211 bool parseBrace() {
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000212 if (CurrentToken != NULL) {
213 ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
Manuel Klimekb3987012013-05-29 14:47:47 +0000214 FormatToken *Left = CurrentToken->Previous;
Nico Weberf2ff8122013-05-26 05:39:26 +0000215
Manuel Klimekb3987012013-05-29 14:47:47 +0000216 FormatToken *Parent = Left->getPreviousNoneComment();
Nico Weberf2ff8122013-05-26 05:39:26 +0000217 bool StartsObjCDictLiteral = Parent && Parent->is(tok::at);
218 if (StartsObjCDictLiteral) {
219 Contexts.back().ColonIsObjCDictLiteral = true;
220 Left->Type = TT_ObjCDictLiteral;
221 }
222
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000223 while (CurrentToken != NULL) {
224 if (CurrentToken->is(tok::r_brace)) {
Nico Weberf2ff8122013-05-26 05:39:26 +0000225 if (StartsObjCDictLiteral)
226 CurrentToken->Type = TT_ObjCDictLiteral;
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000227 Left->MatchingParen = CurrentToken;
228 CurrentToken->MatchingParen = Left;
229 next();
230 return true;
231 }
232 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
233 return false;
234 updateParameterCount(Left, CurrentToken);
235 if (!consumeToken())
236 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000237 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000238 }
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000239 // No closing "}" found, this probably starts a definition.
240 Line.StartsDefinition = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000241 return true;
242 }
Daniel Jasperc4615b72013-02-20 12:56:39 +0000243
Manuel Klimekb3987012013-05-29 14:47:47 +0000244 void updateParameterCount(FormatToken *Left, FormatToken *Current) {
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000245 if (Current->is(tok::comma))
246 ++Left->ParameterCount;
247 else if (Left->ParameterCount == 0 && Current->isNot(tok::comment))
248 Left->ParameterCount = 1;
249 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000250
251 bool parseConditional() {
252 while (CurrentToken != NULL) {
253 if (CurrentToken->is(tok::colon)) {
254 CurrentToken->Type = TT_ConditionalExpr;
255 next();
256 return true;
257 }
258 if (!consumeToken())
259 return false;
260 }
261 return false;
262 }
263
264 bool parseTemplateDeclaration() {
265 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
266 CurrentToken->Type = TT_TemplateOpener;
267 next();
268 if (!parseAngle())
269 return false;
Daniel Jasper34511fb2013-02-19 17:14:38 +0000270 if (CurrentToken != NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000271 CurrentToken->Previous->ClosesTemplateDeclaration = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000272 return true;
273 }
274 return false;
275 }
276
277 bool consumeToken() {
Manuel Klimekb3987012013-05-29 14:47:47 +0000278 FormatToken *Tok = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000279 next();
Manuel Klimekb3987012013-05-29 14:47:47 +0000280 switch (Tok->Tok.getKind()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000281 case tok::plus:
282 case tok::minus:
Manuel Klimekb3987012013-05-29 14:47:47 +0000283 if (Tok->Previous == NULL && Line.MustBeDeclaration)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000284 Tok->Type = TT_ObjCMethodSpecifier;
285 break;
286 case tok::colon:
Manuel Klimekb3987012013-05-29 14:47:47 +0000287 if (Tok->Previous == NULL)
Daniel Jaspercf6d76a2013-03-18 12:50:26 +0000288 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000289 // Colons from ?: are handled in parseConditional().
Manuel Klimekb3987012013-05-29 14:47:47 +0000290 if (Tok->Previous->is(tok::r_paren) && Contexts.size() == 1) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000291 Tok->Type = TT_CtorInitializerColon;
Nico Weberf2ff8122013-05-26 05:39:26 +0000292 } else if (Contexts.back().ColonIsObjCDictLiteral) {
293 Tok->Type = TT_ObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000294 } else if (Contexts.back().ColonIsObjCMethodExpr ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000295 Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000296 Tok->Type = TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000297 Tok->Previous->Type = TT_ObjCSelectorName;
298 if (Tok->Previous->TokenLength >
Daniel Jasper11e13802013-05-08 14:12:04 +0000299 Contexts.back().LongestObjCSelectorName)
Manuel Klimekb3987012013-05-29 14:47:47 +0000300 Contexts.back().LongestObjCSelectorName = Tok->Previous->TokenLength;
Daniel Jasper4e778092013-02-06 10:05:46 +0000301 if (Contexts.back().FirstObjCSelectorName == NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000302 Contexts.back().FirstObjCSelectorName = Tok->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +0000303 } else if (Contexts.back().ColonIsForRangeExpr) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000304 Tok->Type = TT_RangeBasedForLoopColon;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000305 } else if (Contexts.size() == 1) {
306 Tok->Type = TT_InheritanceColon;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000307 } else if (Contexts.back().ContextKind == tok::l_paren) {
308 Tok->Type = TT_InlineASMColon;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000309 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000310 break;
311 case tok::kw_if:
312 case tok::kw_while:
313 if (CurrentToken != NULL && CurrentToken->is(tok::l_paren)) {
314 next();
315 if (!parseParens(/*LookForDecls=*/ true))
316 return false;
317 }
318 break;
319 case tok::kw_for:
Daniel Jasper4e778092013-02-06 10:05:46 +0000320 Contexts.back().ColonIsForRangeExpr = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000321 next();
322 if (!parseParens())
323 return false;
324 break;
325 case tok::l_paren:
326 if (!parseParens())
327 return false;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000328 if (Line.MustBeDeclaration && NameFound && !Contexts.back().IsExpression)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000329 Line.MightBeFunctionDecl = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000330 break;
331 case tok::l_square:
332 if (!parseSquare())
333 return false;
334 break;
335 case tok::l_brace:
336 if (!parseBrace())
337 return false;
338 break;
339 case tok::less:
340 if (parseAngle())
341 Tok->Type = TT_TemplateOpener;
342 else {
343 Tok->Type = TT_BinaryOperator;
344 CurrentToken = Tok;
345 next();
346 }
347 break;
348 case tok::r_paren:
349 case tok::r_square:
350 return false;
351 case tok::r_brace:
352 // Lines can start with '}'.
Manuel Klimekb3987012013-05-29 14:47:47 +0000353 if (Tok->Previous != NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000354 return false;
355 break;
356 case tok::greater:
357 Tok->Type = TT_BinaryOperator;
358 break;
359 case tok::kw_operator:
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000360 while (CurrentToken && CurrentToken->isNot(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000361 if (CurrentToken->isOneOf(tok::star, tok::amp))
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000362 CurrentToken->Type = TT_PointerOrReference;
363 consumeToken();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000364 }
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000365 if (CurrentToken) {
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000366 CurrentToken->Type = TT_OverloadedOperatorLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000367 if (CurrentToken->Previous->Type == TT_BinaryOperator)
368 CurrentToken->Previous->Type = TT_OverloadedOperator;
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000369 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000370 break;
371 case tok::question:
372 parseConditional();
373 break;
374 case tok::kw_template:
375 parseTemplateDeclaration();
376 break;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000377 case tok::identifier:
Manuel Klimekb3987012013-05-29 14:47:47 +0000378 if (Line.First->is(tok::kw_for) &&
379 Tok->Tok.getIdentifierInfo() == &Ident_in)
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000380 Tok->Type = TT_ObjCForIn;
381 break;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000382 case tok::comma:
383 if (Contexts.back().FirstStartOfName)
384 Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
385 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000386 default:
387 break;
388 }
389 return true;
390 }
391
392 void parseIncludeDirective() {
393 next();
394 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
395 next();
396 while (CurrentToken != NULL) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000397 if (CurrentToken->isNot(tok::comment) || CurrentToken->Next)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000398 CurrentToken->Type = TT_ImplicitStringLiteral;
399 next();
400 }
401 } else {
402 while (CurrentToken != NULL) {
Daniel Jasper3a204412013-02-23 07:46:38 +0000403 if (CurrentToken->is(tok::string_literal))
404 // Mark these string literals as "implicit" literals, too, so that
405 // they are not split or line-wrapped.
406 CurrentToken->Type = TT_ImplicitStringLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000407 next();
408 }
409 }
410 }
411
412 void parseWarningOrError() {
413 next();
414 // We still want to format the whitespace left of the first token of the
415 // warning or error.
416 next();
417 while (CurrentToken != NULL) {
418 CurrentToken->Type = TT_ImplicitStringLiteral;
419 next();
420 }
421 }
422
423 void parsePreprocessorDirective() {
424 next();
425 if (CurrentToken == NULL)
426 return;
427 // Hashes in the middle of a line can lead to any strange token
428 // sequence.
Manuel Klimekb3987012013-05-29 14:47:47 +0000429 if (CurrentToken->Tok.getIdentifierInfo() == NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000430 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000431 switch (CurrentToken->Tok.getIdentifierInfo()->getPPKeywordID()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000432 case tok::pp_include:
433 case tok::pp_import:
434 parseIncludeDirective();
435 break;
436 case tok::pp_error:
437 case tok::pp_warning:
438 parseWarningOrError();
439 break;
Daniel Jasperaae7bad2013-04-23 13:54:04 +0000440 case tok::pp_if:
441 case tok::pp_elif:
442 parseLine();
443 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000444 default:
445 break;
446 }
Daniel Jasper5b7e7b02013-02-05 09:34:14 +0000447 while (CurrentToken != NULL)
448 next();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000449 }
450
Nico Weber95e8e462013-02-12 16:17:07 +0000451public:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000452 LineType parseLine() {
453 int PeriodsAndArrows = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000454 FormatToken *LastPeriodOrArrow = NULL;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000455 bool CanBeBuilderTypeStmt = true;
456 if (CurrentToken->is(tok::hash)) {
457 parsePreprocessorDirective();
458 return LT_PreprocessorDirective;
459 }
460 while (CurrentToken != NULL) {
461 if (CurrentToken->is(tok::kw_virtual))
462 KeywordVirtualFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000463 if (CurrentToken->isOneOf(tok::period, tok::arrow)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000464 ++PeriodsAndArrows;
Daniel Jasper24849712013-03-01 16:48:32 +0000465 LastPeriodOrArrow = CurrentToken;
466 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000467 FormatToken *TheToken = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000468 if (!consumeToken())
469 return LT_Invalid;
Manuel Klimekb3987012013-05-29 14:47:47 +0000470 if (TheToken->getPrecedence() > prec::Assignment &&
Daniel Jasper82282dc2013-02-18 13:52:06 +0000471 TheToken->Type == TT_BinaryOperator)
Daniel Jasper4a544e52013-02-15 20:33:06 +0000472 CanBeBuilderTypeStmt = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000473 }
474 if (KeywordVirtualFound)
475 return LT_VirtualFunctionDecl;
476
477 // Assume a builder-type call if there are 2 or more "." and "->".
Daniel Jasper24849712013-03-01 16:48:32 +0000478 if (PeriodsAndArrows >= 2 && CanBeBuilderTypeStmt) {
479 LastPeriodOrArrow->LastInChainOfCalls = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000480 return LT_BuilderTypeCall;
Daniel Jasper24849712013-03-01 16:48:32 +0000481 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000482
Manuel Klimekb3987012013-05-29 14:47:47 +0000483 if (Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000484 if (Contexts.back().FirstObjCSelectorName != NULL)
485 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
486 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000487 return LT_ObjCMethodDecl;
488 }
489
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000490 return LT_Other;
491 }
492
Nico Weber95e8e462013-02-12 16:17:07 +0000493private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000494 void next() {
Daniel Jasper01786732013-02-04 07:21:18 +0000495 if (CurrentToken != NULL) {
496 determineTokenType(*CurrentToken);
Daniel Jasper4e778092013-02-06 10:05:46 +0000497 CurrentToken->BindingStrength = Contexts.back().BindingStrength;
Daniel Jasper01786732013-02-04 07:21:18 +0000498 }
499
Manuel Klimekb3987012013-05-29 14:47:47 +0000500 if (CurrentToken != NULL)
501 CurrentToken = CurrentToken->Next;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000502
503 // Reset token type in case we have already looked at it and then recovered
504 // from an error (e.g. failure to find the matching >).
505 if (CurrentToken != NULL)
506 CurrentToken->Type = TT_Unknown;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000507 }
508
Daniel Jasper4e778092013-02-06 10:05:46 +0000509 /// \brief A struct to hold information valid in a specific context, e.g.
510 /// a pair of parenthesis.
511 struct Context {
Daniel Jasper923ebef2013-03-14 13:45:21 +0000512 Context(tok::TokenKind ContextKind, unsigned BindingStrength,
513 bool IsExpression)
514 : ContextKind(ContextKind), BindingStrength(BindingStrength),
515 LongestObjCSelectorName(0), ColonIsForRangeExpr(false),
Nico Weberf2ff8122013-05-26 05:39:26 +0000516 ColonIsObjCDictLiteral(false), ColonIsObjCMethodExpr(false),
517 FirstObjCSelectorName(NULL), FirstStartOfName(NULL),
518 IsExpression(IsExpression), CanBeExpression(true) {}
Daniel Jasper01786732013-02-04 07:21:18 +0000519
Daniel Jasper923ebef2013-03-14 13:45:21 +0000520 tok::TokenKind ContextKind;
Daniel Jasper4e778092013-02-06 10:05:46 +0000521 unsigned BindingStrength;
522 unsigned LongestObjCSelectorName;
523 bool ColonIsForRangeExpr;
Nico Weberf2ff8122013-05-26 05:39:26 +0000524 bool ColonIsObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000525 bool ColonIsObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000526 FormatToken *FirstObjCSelectorName;
527 FormatToken *FirstStartOfName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000528 bool IsExpression;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000529 bool CanBeExpression;
Daniel Jasper4e778092013-02-06 10:05:46 +0000530 };
531
532 /// \brief Puts a new \c Context onto the stack \c Contexts for the lifetime
533 /// of each instance.
534 struct ScopedContextCreator {
535 AnnotatingParser &P;
536
Daniel Jasper923ebef2013-03-14 13:45:21 +0000537 ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
538 unsigned Increase)
539 : P(P) {
540 P.Contexts.push_back(
541 Context(ContextKind, P.Contexts.back().BindingStrength + Increase,
542 P.Contexts.back().IsExpression));
Daniel Jasper4e778092013-02-06 10:05:46 +0000543 }
544
545 ~ScopedContextCreator() { P.Contexts.pop_back(); }
546 };
Daniel Jasper01786732013-02-04 07:21:18 +0000547
Manuel Klimekb3987012013-05-29 14:47:47 +0000548 void determineTokenType(FormatToken &Current) {
549 if (Current.getPrecedence() == prec::Assignment &&
550 (!Current.Previous || Current.Previous->isNot(tok::kw_operator))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000551 Contexts.back().IsExpression = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000552 for (FormatToken *Previous = Current.Previous;
Nico Weber95e8e462013-02-12 16:17:07 +0000553 Previous && Previous->isNot(tok::comma);
Manuel Klimekb3987012013-05-29 14:47:47 +0000554 Previous = Previous->Previous) {
Daniel Jasper9c65b062013-02-27 11:43:50 +0000555 if (Previous->is(tok::r_square))
556 Previous = Previous->MatchingParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000557 if (Previous->Type == TT_BinaryOperator &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000558 Previous->isOneOf(tok::star, tok::amp)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000559 Previous->Type = TT_PointerOrReference;
560 }
Daniel Jasper01786732013-02-04 07:21:18 +0000561 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000562 } else if (Current.isOneOf(tok::kw_return, tok::kw_throw) ||
Nico Weber95e8e462013-02-12 16:17:07 +0000563 (Current.is(tok::l_paren) && !Line.MustBeDeclaration &&
Daniel Jasper378d93d2013-05-13 07:14:40 +0000564 !Line.InPPDirective &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000565 (!Current.Previous || Current.Previous->isNot(tok::kw_for)))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000566 Contexts.back().IsExpression = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000567 } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000568 for (FormatToken *Previous = Current.Previous;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000569 Previous && Previous->isOneOf(tok::star, tok::amp);
Manuel Klimekb3987012013-05-29 14:47:47 +0000570 Previous = Previous->Previous)
Nico Weber95e8e462013-02-12 16:17:07 +0000571 Previous->Type = TT_PointerOrReference;
Manuel Klimekb3987012013-05-29 14:47:47 +0000572 } else if (Current.Previous &&
573 Current.Previous->Type == TT_CtorInitializerColon) {
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000574 Contexts.back().IsExpression = true;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000575 } else if (Current.is(tok::kw_new)) {
576 Contexts.back().CanBeExpression = false;
Daniel Jasper16a69ef2013-05-03 14:41:24 +0000577 } else if (Current.is(tok::semi)) {
578 // This should be the condition or increment in a for-loop.
579 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000580 }
Daniel Jasper01786732013-02-04 07:21:18 +0000581
582 if (Current.Type == TT_Unknown) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000583 if (Current.Previous && Current.is(tok::identifier) &&
584 ((Current.Previous->is(tok::identifier) &&
585 Current.Previous->Tok.getIdentifierInfo()->getPPKeywordID() ==
Daniel Jasper11e13802013-05-08 14:12:04 +0000586 tok::pp_not_keyword) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000587 isSimpleTypeSpecifier(*Current.Previous) ||
588 Current.Previous->Type == TT_PointerOrReference ||
589 Current.Previous->Type == TT_TemplateCloser)) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000590 Contexts.back().FirstStartOfName = &Current;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000591 Current.Type = TT_StartOfName;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000592 NameFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000593 } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000594 Current.Type =
595 determineStarAmpUsage(Current, Contexts.back().IsExpression);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000596 } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000597 Current.Type = determinePlusMinusCaretUsage(Current);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000598 } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000599 Current.Type = determineIncrementUsage(Current);
600 } else if (Current.is(tok::exclaim)) {
601 Current.Type = TT_UnaryOperator;
Daniel Jasperac3223e2013-04-10 09:49:49 +0000602 } else if (Current.isBinaryOperator()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000603 Current.Type = TT_BinaryOperator;
604 } else if (Current.is(tok::comment)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000605 std::string Data(
606 Lexer::getSpelling(Current.Tok, SourceMgr, Lex.getLangOpts()));
Daniel Jasper01786732013-02-04 07:21:18 +0000607 if (StringRef(Data).startswith("//"))
608 Current.Type = TT_LineComment;
609 else
610 Current.Type = TT_BlockComment;
Nico Weber37d69312013-02-13 04:13:13 +0000611 } else if (Current.is(tok::r_paren)) {
Daniel Jasperb8b42952013-05-31 16:14:28 +0000612 FormatToken *LeftOfParens = NULL;
613 if (Current.MatchingParen)
614 LeftOfParens = Current.MatchingParen->getPreviousNoneComment();
615 bool IsCast = false;
616 bool ParensAreEmpty = Current.Previous == Current.MatchingParen;
617 bool ParensAreType = !Current.Previous ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000618 Current.Previous->Type == TT_PointerOrReference ||
Daniel Jasperb8b42952013-05-31 16:14:28 +0000619 Current.Previous->Type == TT_TemplateCloser ||
620 isSimpleTypeSpecifier(*Current.Previous);
Nico Weber37d69312013-02-13 04:13:13 +0000621 bool ParensCouldEndDecl =
Manuel Klimekb3987012013-05-29 14:47:47 +0000622 Current.Next &&
623 Current.Next->isOneOf(tok::equal, tok::semi, tok::l_brace);
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000624 bool IsSizeOfOrAlignOf =
Daniel Jasperb8b42952013-05-31 16:14:28 +0000625 LeftOfParens &&
626 LeftOfParens->isOneOf(tok::kw_sizeof, tok::kw_alignof);
627 if (ParensAreType && !ParensCouldEndDecl && !IsSizeOfOrAlignOf &&
Daniel Jasper37eff832013-02-23 08:07:18 +0000628 Contexts.back().IsExpression)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000629 IsCast = true;
630 if (Current.Next &&
631 (Current.Next->Tok.isLiteral() ||
632 Current.Next->isOneOf(tok::kw_sizeof, tok::kw_alignof)))
633 IsCast = true;
634 // If there is an identifier after the (), it is likely a cast, unless
635 // there is also an identifier before the ().
636 if (LeftOfParens && LeftOfParens->Tok.getIdentifierInfo() == NULL &&
637 LeftOfParens->Type != TT_ObjCMethodExpr && Current.Next &&
638 (Current.Next->is(tok::identifier)))
639 IsCast = true;
640 if (IsCast && !ParensAreEmpty)
Nico Weber37d69312013-02-13 04:13:13 +0000641 Current.Type = TT_CastRParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000642 } else if (Current.is(tok::at) && Current.Next) {
643 switch (Current.Next->Tok.getObjCKeywordID()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000644 case tok::objc_interface:
645 case tok::objc_implementation:
646 case tok::objc_protocol:
647 Current.Type = TT_ObjCDecl;
648 break;
649 case tok::objc_property:
650 Current.Type = TT_ObjCProperty;
651 break;
652 default:
653 break;
654 }
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000655 } else if (Current.is(tok::period)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000656 FormatToken *PreviousNoComment = Current.getPreviousNoneComment();
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000657 if (PreviousNoComment &&
658 PreviousNoComment->isOneOf(tok::comma, tok::l_brace))
659 Current.Type = TT_DesignatedInitializerPeriod;
Daniel Jasper01786732013-02-04 07:21:18 +0000660 }
661 }
662 }
663
Daniel Jasper01786732013-02-04 07:21:18 +0000664 /// \brief Return the type of the given token assuming it is * or &.
Manuel Klimekb3987012013-05-29 14:47:47 +0000665 TokenType determineStarAmpUsage(const FormatToken &Tok, bool IsExpression) {
666 const FormatToken *PrevToken = Tok.getPreviousNoneComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000667 if (PrevToken == NULL)
668 return TT_UnaryOperator;
669
Manuel Klimekb3987012013-05-29 14:47:47 +0000670 const FormatToken *NextToken = Tok.getNextNoneComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000671 if (NextToken == NULL)
672 return TT_Unknown;
673
Daniel Jasper431f5912013-05-28 08:33:00 +0000674 if (PrevToken->is(tok::coloncolon) ||
675 (PrevToken->is(tok::l_paren) && !IsExpression))
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +0000676 return TT_PointerOrReference;
677
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000678 if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
Daniel Jasperd3cf17b2013-03-14 10:50:25 +0000679 tok::comma, tok::semi, tok::kw_return, tok::colon,
Daniel Jasperdbef71e2013-05-07 14:17:18 +0000680 tok::equal, tok::kw_delete) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000681 PrevToken->Type == TT_BinaryOperator ||
Daniel Jasper01786732013-02-04 07:21:18 +0000682 PrevToken->Type == TT_UnaryOperator || PrevToken->Type == TT_CastRParen)
683 return TT_UnaryOperator;
684
Nico Webere8a97982013-02-06 06:20:11 +0000685 if (NextToken->is(tok::l_square))
686 return TT_PointerOrReference;
687
Manuel Klimekb3987012013-05-29 14:47:47 +0000688 if (PrevToken->Tok.isLiteral() ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000689 PrevToken->isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000690 NextToken->Tok.isLiteral() || NextToken->isUnaryOperator())
Daniel Jasper01786732013-02-04 07:21:18 +0000691 return TT_BinaryOperator;
692
Daniel Jasper01786732013-02-04 07:21:18 +0000693 // It is very unlikely that we are going to find a pointer or reference type
694 // definition on the RHS of an assignment.
695 if (IsExpression)
696 return TT_BinaryOperator;
697
698 return TT_PointerOrReference;
699 }
700
Manuel Klimekb3987012013-05-29 14:47:47 +0000701 TokenType determinePlusMinusCaretUsage(const FormatToken &Tok) {
702 const FormatToken *PrevToken = Tok.getPreviousNoneComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000703 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000704 return TT_UnaryOperator;
705
706 // Use heuristics to recognize unary operators.
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000707 if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
708 tok::question, tok::colon, tok::kw_return,
709 tok::kw_case, tok::at, tok::l_brace))
Daniel Jasper01786732013-02-04 07:21:18 +0000710 return TT_UnaryOperator;
711
Nico Weberee0feec2013-02-05 16:21:00 +0000712 // There can't be two consecutive binary operators.
Daniel Jasper01786732013-02-04 07:21:18 +0000713 if (PrevToken->Type == TT_BinaryOperator)
714 return TT_UnaryOperator;
715
716 // Fall back to marking the token as binary operator.
717 return TT_BinaryOperator;
718 }
719
720 /// \brief Determine whether ++/-- are pre- or post-increments/-decrements.
Manuel Klimekb3987012013-05-29 14:47:47 +0000721 TokenType determineIncrementUsage(const FormatToken &Tok) {
722 const FormatToken *PrevToken = Tok.getPreviousNoneComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000723 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000724 return TT_UnaryOperator;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000725 if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
Daniel Jasper01786732013-02-04 07:21:18 +0000726 return TT_TrailingUnaryOperator;
727
728 return TT_UnaryOperator;
729 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000730
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000731 // FIXME: This is copy&pasted from Sema. Put it in a common place and remove
732 // duplication.
733 /// \brief Determine whether the token kind starts a simple-type-specifier.
Manuel Klimekb3987012013-05-29 14:47:47 +0000734 bool isSimpleTypeSpecifier(const FormatToken &Tok) const {
735 switch (Tok.Tok.getKind()) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000736 case tok::kw_short:
737 case tok::kw_long:
738 case tok::kw___int64:
739 case tok::kw___int128:
740 case tok::kw_signed:
741 case tok::kw_unsigned:
742 case tok::kw_void:
743 case tok::kw_char:
744 case tok::kw_int:
745 case tok::kw_half:
746 case tok::kw_float:
747 case tok::kw_double:
748 case tok::kw_wchar_t:
749 case tok::kw_bool:
750 case tok::kw___underlying_type:
751 return true;
752 case tok::annot_typename:
753 case tok::kw_char16_t:
754 case tok::kw_char32_t:
755 case tok::kw_typeof:
756 case tok::kw_decltype:
757 return Lex.getLangOpts().CPlusPlus;
758 default:
759 break;
760 }
761 return false;
762 }
763
Daniel Jasper4e778092013-02-06 10:05:46 +0000764 SmallVector<Context, 8> Contexts;
765
766 SourceManager &SourceMgr;
767 Lexer &Lex;
768 AnnotatedLine &Line;
Manuel Klimekb3987012013-05-29 14:47:47 +0000769 FormatToken *CurrentToken;
Daniel Jasper4e778092013-02-06 10:05:46 +0000770 bool KeywordVirtualFound;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000771 bool NameFound;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000772 IdentifierInfo &Ident_in;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000773};
774
Daniel Jasper29f123b2013-02-08 15:28:42 +0000775/// \brief Parses binary expressions by inserting fake parenthesis based on
776/// operator precedence.
777class ExpressionParser {
778public:
Manuel Klimekb3987012013-05-29 14:47:47 +0000779 ExpressionParser(AnnotatedLine &Line) : Current(Line.First) {}
Daniel Jasper29f123b2013-02-08 15:28:42 +0000780
781 /// \brief Parse expressions with the given operatore precedence.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000782 void parse(int Precedence = 0) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000783 // Conditional expressions need to be parsed separately for proper nesting.
784 if (Precedence == prec::Conditional + 1) {
785 parseConditionalExpr();
786 return;
787 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000788 if (Precedence > prec::PointerToMember || Current == NULL)
789 return;
790
Daniel Jasper29f123b2013-02-08 15:28:42 +0000791 // Eagerly consume trailing comments.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000792 while (Current && Current->isTrailingComment()) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000793 next();
794 }
795
Manuel Klimekb3987012013-05-29 14:47:47 +0000796 FormatToken *Start = Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000797 bool OperatorFound = false;
798
Daniel Jasper237d4c12013-02-23 21:01:55 +0000799 while (Current) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000800 // Consume operators with higher precedence.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000801 parse(Precedence + 1);
Daniel Jasper29f123b2013-02-08 15:28:42 +0000802
Daniel Jasper237d4c12013-02-23 21:01:55 +0000803 int CurrentPrecedence = 0;
804 if (Current) {
805 if (Current->Type == TT_ConditionalExpr)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000806 CurrentPrecedence = 1 + (int)prec::Conditional;
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000807 else if (Current->is(tok::semi) || Current->Type == TT_InlineASMColon)
Daniel Jasper237d4c12013-02-23 21:01:55 +0000808 CurrentPrecedence = 1;
809 else if (Current->Type == TT_BinaryOperator || Current->is(tok::comma))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000810 CurrentPrecedence = 1 + (int)Current->getPrecedence();
Daniel Jasper237d4c12013-02-23 21:01:55 +0000811 }
812
Daniel Jasper29f123b2013-02-08 15:28:42 +0000813 // At the end of the line or when an operator with higher precedence is
814 // found, insert fake parenthesis and return.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000815 if (Current == NULL || Current->closesScope() ||
Daniel Jasper237d4c12013-02-23 21:01:55 +0000816 (CurrentPrecedence != 0 && CurrentPrecedence < Precedence)) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000817 if (OperatorFound)
818 addFakeParenthesis(Start, prec::Level(Precedence - 1));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000819 return;
820 }
821
822 // Consume scopes: (), [], <> and {}
Daniel Jasperac3223e2013-04-10 09:49:49 +0000823 if (Current->opensScope()) {
824 while (Current && !Current->closesScope()) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000825 next();
826 parse();
827 }
828 next();
829 } else {
830 // Operator found.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000831 if (CurrentPrecedence == Precedence)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000832 OperatorFound = true;
833
834 next();
835 }
836 }
837 }
838
839private:
Daniel Jasperc01897c2013-05-31 14:56:12 +0000840 void addFakeParenthesis(FormatToken *Start, prec::Level Precedence) {
841 Start->FakeLParens.push_back(Precedence);
842 if (Current)
843 ++Current->Previous->FakeRParens;
844 }
845
846 void parseConditionalExpr() {
847 FormatToken *Start = Current;
848 parse(prec::LogicalOr + 1);
849 if (!Current || !Current->is(tok::question))
850 return;
851 next();
852 parse(prec::LogicalOr + 1);
853 if (!Current || Current->Type != TT_ConditionalExpr)
854 return;
855 next();
856 parseConditionalExpr();
857 addFakeParenthesis(Start, prec::Conditional);
858 }
859
Daniel Jasper29f123b2013-02-08 15:28:42 +0000860 void next() {
861 if (Current != NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000862 Current = Current->Next;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000863 }
864
Manuel Klimekb3987012013-05-29 14:47:47 +0000865 FormatToken *Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000866};
867
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000868void TokenAnnotator::annotate(AnnotatedLine &Line) {
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000869 AnnotatingParser Parser(SourceMgr, Lex, Line, Ident_in);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000870 Line.Type = Parser.parseLine();
871 if (Line.Type == LT_Invalid)
872 return;
873
Daniel Jasper29f123b2013-02-08 15:28:42 +0000874 ExpressionParser ExprParser(Line);
875 ExprParser.parse();
876
Manuel Klimekb3987012013-05-29 14:47:47 +0000877 if (Line.First->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000878 Line.Type = LT_ObjCMethodDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000879 else if (Line.First->Type == TT_ObjCDecl)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000880 Line.Type = LT_ObjCDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000881 else if (Line.First->Type == TT_ObjCProperty)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000882 Line.Type = LT_ObjCProperty;
883
Manuel Klimekb3987012013-05-29 14:47:47 +0000884 Line.First->SpacesRequiredBefore = 1;
885 Line.First->CanBreakBefore = Line.First->MustBreakBefore;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000886}
887
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000888void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000889 Line.First->TotalLength = Line.First->TokenLength;
890 if (!Line.First->Next)
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000891 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000892 FormatToken *Current = Line.First->Next;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000893 while (Current != NULL) {
Daniel Jasper729a7432013-02-11 12:36:37 +0000894 if (Current->Type == TT_LineComment)
895 Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
896 else
897 Current->SpacesRequiredBefore =
898 spaceRequiredBefore(Line, *Current) ? 1 : 0;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000899
Manuel Klimekb3987012013-05-29 14:47:47 +0000900 if (Current->MustBreakBefore) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000901 } else if (Current->Type == TT_LineComment) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000902 Current->MustBreakBefore = Current->NewlinesBefore > 0;
903 } else if (Current->Previous->isTrailingComment() ||
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000904 (Current->is(tok::string_literal) &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000905 Current->Previous->is(tok::string_literal))) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000906 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000907 } else if (Current->is(tok::lessless) && Current->Next &&
908 Current->Previous->is(tok::string_literal) &&
909 Current->Next->is(tok::string_literal)) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000910 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000911 } else if (Current->Previous->ClosesTemplateDeclaration &&
Daniel Jasperbbc87762013-05-29 12:07:31 +0000912 Style.AlwaysBreakTemplateDeclarations) {
913 Current->MustBreakBefore = true;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000914 } else {
915 Current->MustBreakBefore = false;
916 }
917 Current->CanBreakBefore =
918 Current->MustBreakBefore || canBreakBefore(Line, *Current);
919 if (Current->MustBreakBefore)
Manuel Klimekb3987012013-05-29 14:47:47 +0000920 Current->TotalLength = Current->Previous->TotalLength + Style.ColumnLimit;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000921 else
922 Current->TotalLength =
Manuel Klimekb3987012013-05-29 14:47:47 +0000923 Current->Previous->TotalLength + Current->TokenLength +
Daniel Jasper729a7432013-02-11 12:36:37 +0000924 Current->SpacesRequiredBefore;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000925 // FIXME: Only calculate this if CanBreakBefore is true once static
926 // initializers etc. are sorted out.
927 // FIXME: Move magic numbers to a better place.
928 Current->SplitPenalty =
929 20 * Current->BindingStrength + splitPenalty(Line, *Current);
930
Manuel Klimekb3987012013-05-29 14:47:47 +0000931 Current = Current->Next;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000932 }
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000933
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000934 calculateUnbreakableTailLengths(Line);
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000935 DEBUG({
936 printDebugInfo(Line);
937 });
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000938}
939
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000940void TokenAnnotator::calculateUnbreakableTailLengths(AnnotatedLine &Line) {
941 unsigned UnbreakableTailLength = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000942 FormatToken *Current = Line.Last;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000943 while (Current != NULL) {
944 Current->UnbreakableTailLength = UnbreakableTailLength;
945 if (Current->CanBreakBefore ||
946 Current->isOneOf(tok::comment, tok::string_literal)) {
947 UnbreakableTailLength = 0;
948 } else {
949 UnbreakableTailLength +=
Manuel Klimekb3987012013-05-29 14:47:47 +0000950 Current->TokenLength + Current->SpacesRequiredBefore;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000951 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000952 Current = Current->Previous;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000953 }
954}
955
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000956unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +0000957 const FormatToken &Tok) {
958 const FormatToken &Left = *Tok.Previous;
959 const FormatToken &Right = Tok;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000960
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000961 if (Left.is(tok::semi))
962 return 0;
963 if (Left.is(tok::comma))
964 return 1;
965
Daniel Jasper3c08a812013-02-24 18:54:32 +0000966 if (Right.Type == TT_StartOfName) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000967 if (Line.First->is(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000968 return 3;
969 else if (Line.MightBeFunctionDecl && Right.BindingStrength == 1)
970 // FIXME: Clean up hack of using BindingStrength to find top-level names.
971 return Style.PenaltyReturnTypeOnItsOwnLine;
972 else
Daniel Jasper1407bee2013-04-11 14:29:13 +0000973 return 200;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000974 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000975 if (Left.is(tok::equal) && Right.is(tok::l_brace))
976 return 150;
977 if (Left.is(tok::coloncolon))
978 return 500;
Daniel Jasper6b119d62013-04-05 17:22:09 +0000979 if (Left.isOneOf(tok::kw_class, tok::kw_struct))
980 return 5000;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000981
Daniel Jasper6cabab42013-02-14 08:42:54 +0000982 if (Left.Type == TT_RangeBasedForLoopColon ||
983 Left.Type == TT_InheritanceColon)
Daniel Jasper84a1a632013-02-26 13:18:08 +0000984 return 2;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000985
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000986 if (Right.isOneOf(tok::arrow, tok::period) &&
987 Right.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper515f65d2013-02-18 13:24:21 +0000988 if (Line.Type == LT_BuilderTypeCall)
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000989 return prec::PointerToMember;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000990 if (Left.isOneOf(tok::r_paren, tok::r_square) && Left.MatchingParen &&
991 Left.MatchingParen->ParameterCount > 0)
Daniel Jasper518ee342013-02-26 13:59:14 +0000992 return 20; // Should be smaller than breaking at a nested comma.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000993 return 150;
994 }
995
Daniel Jasper5ad72bb2013-05-22 08:28:26 +0000996 // Breaking before a trailing 'const' is bad.
997 if (Left.is(tok::r_paren) && Right.is(tok::kw_const))
998 return 150;
999
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001000 // In for-loops, prefer breaking at ',' and ';'.
Manuel Klimekb3987012013-05-29 14:47:47 +00001001 if (Line.First->is(tok::kw_for) && Left.is(tok::equal))
Daniel Jasper7d812812013-02-21 15:00:29 +00001002 return 4;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001003
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001004 // In Objective-C method expressions, prefer breaking before "param:" over
1005 // breaking after it.
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001006 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001007 return 0;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001008 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001009 return 20;
1010
Daniel Jasper1407bee2013-04-11 14:29:13 +00001011 if (Left.is(tok::l_paren) && Line.MightBeFunctionDecl)
1012 return 100;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001013 if (Left.opensScope())
Daniel Jasper64f09282013-03-20 13:53:11 +00001014 return Left.ParameterCount > 1 ? prec::Comma : 20;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001015
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001016 if (Right.is(tok::lessless)) {
1017 if (Left.is(tok::string_literal)) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001018 StringRef Content =
1019 StringRef(Left.Tok.getLiteralData(), Left.TokenLength);
Daniel Jasperbfa1edd2013-03-14 14:00:17 +00001020 Content = Content.drop_back(1).drop_front(1).trim();
1021 if (Content.size() > 1 &&
1022 (Content.back() == ':' || Content.back() == '='))
Daniel Jasper6e6efa72013-05-22 09:13:26 +00001023 return 20;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001024 }
Daniel Jasper01786732013-02-04 07:21:18 +00001025 return prec::Shift;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001026 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001027 if (Left.Type == TT_ConditionalExpr)
Daniel Jasper518ee342013-02-26 13:59:14 +00001028 return prec::Conditional;
Manuel Klimekb3987012013-05-29 14:47:47 +00001029 prec::Level Level = Left.getPrecedence();
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001030
1031 if (Level != prec::Unknown)
1032 return Level;
Daniel Jasper24849712013-03-01 16:48:32 +00001033
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001034 return 3;
1035}
1036
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001037bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001038 const FormatToken &Left,
1039 const FormatToken &Right) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001040 if (Right.is(tok::hashhash))
1041 return Left.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001042 if (Left.isOneOf(tok::hashhash, tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001043 return Right.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001044 if (Right.isOneOf(tok::r_paren, tok::semi, tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001045 return false;
1046 if (Right.is(tok::less) &&
1047 (Left.is(tok::kw_template) ||
1048 (Line.Type == LT_ObjCDecl && Style.ObjCSpaceBeforeProtocolList)))
1049 return true;
1050 if (Left.is(tok::arrow) || Right.is(tok::arrow))
1051 return false;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001052 if (Left.isOneOf(tok::exclaim, tok::tilde))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001053 return false;
1054 if (Left.is(tok::at) &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001055 Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
1056 tok::numeric_constant, tok::l_paren, tok::l_brace,
1057 tok::kw_true, tok::kw_false))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001058 return false;
1059 if (Left.is(tok::coloncolon))
1060 return false;
1061 if (Right.is(tok::coloncolon))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001062 return !Left.isOneOf(tok::identifier, tok::greater, tok::l_paren);
1063 if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001064 return false;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001065 if (Right.Type == TT_PointerOrReference)
Manuel Klimekb3987012013-05-29 14:47:47 +00001066 return Left.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001067 ((Left.Type != TT_PointerOrReference) && Left.isNot(tok::l_paren) &&
1068 !Style.PointerBindsToType);
Daniel Jasper3ff4a2f2013-05-28 15:27:10 +00001069 if (Right.Type == TT_FunctionTypeLParen && Left.isNot(tok::l_paren) &&
Daniel Jasper395228f2013-05-08 14:58:20 +00001070 (Left.Type != TT_PointerOrReference || Style.PointerBindsToType))
1071 return true;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001072 if (Left.Type == TT_PointerOrReference)
Manuel Klimekb3987012013-05-29 14:47:47 +00001073 return Right.Tok.isLiteral() ||
Daniel Jasper9322aae2013-03-20 09:53:18 +00001074 ((Right.Type != TT_PointerOrReference) &&
Daniel Jasper81d2d382013-04-01 17:13:26 +00001075 Right.isNot(tok::l_paren) && Style.PointerBindsToType &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001076 Left.Previous &&
1077 !Left.Previous->isOneOf(tok::l_paren, tok::coloncolon));
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001078 if (Right.is(tok::star) && Left.is(tok::l_paren))
1079 return false;
Nico Weber051860e2013-02-10 02:08:05 +00001080 if (Left.is(tok::l_square))
1081 return Left.Type == TT_ObjCArrayLiteral && Right.isNot(tok::r_square);
1082 if (Right.is(tok::r_square))
1083 return Right.Type == TT_ObjCArrayLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001084 if (Right.is(tok::l_square) && Right.Type != TT_ObjCMethodExpr)
1085 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001086 if (Left.is(tok::colon))
1087 return Left.Type != TT_ObjCMethodExpr;
1088 if (Right.is(tok::colon))
1089 return Right.Type != TT_ObjCMethodExpr;
1090 if (Left.is(tok::l_paren))
1091 return false;
1092 if (Right.is(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001093 return Line.Type == LT_ObjCDecl ||
1094 Left.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
1095 tok::kw_return, tok::kw_catch, tok::kw_new,
Daniel Jasper454cb702013-05-03 14:50:50 +00001096 tok::kw_delete, tok::semi);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001097 }
Manuel Klimekb3987012013-05-29 14:47:47 +00001098 if (Left.is(tok::at) && Right.Tok.getObjCKeywordID() != tok::objc_not_keyword)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001099 return false;
1100 if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
Daniel Jasper2424eef2013-05-23 10:15:45 +00001101 return false; // No spaces in "{}".
1102 if (Left.is(tok::l_brace) || Right.is(tok::r_brace))
1103 return Style.SpacesInBracedLists;
Daniel Jasper1bee0732013-05-23 18:05:18 +00001104 if (Right.Type == TT_UnaryOperator)
1105 return !Left.isOneOf(tok::l_paren, tok::l_square, tok::at) &&
1106 (Left.isNot(tok::colon) || Left.Type != TT_ObjCMethodExpr);
Daniel Jasperce933562013-05-23 21:35:49 +00001107 if (Left.isOneOf(tok::identifier, tok::greater, tok::r_square) &&
1108 Right.is(tok::l_brace) && Right.getNextNoneComment())
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001109 return false;
Daniel Jasperf0220182013-05-06 06:35:44 +00001110 if (Right.is(tok::ellipsis))
1111 return false;
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001112 if (Left.is(tok::period) || Right.is(tok::period))
1113 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001114 return true;
1115}
1116
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001117bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001118 const FormatToken &Tok) {
1119 if (Tok.Tok.getIdentifierInfo() && Tok.Previous->Tok.getIdentifierInfo())
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001120 return true; // Never ever merge two identifiers.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001121 if (Line.Type == LT_ObjCMethodDecl) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001122 if (Tok.Previous->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001123 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001124 if (Tok.Previous->is(tok::r_paren) && Tok.is(tok::identifier))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001125 // Don't space between ')' and <id>
1126 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001127 }
1128 if (Line.Type == LT_ObjCProperty &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001129 (Tok.is(tok::equal) || Tok.Previous->is(tok::equal)))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001130 return false;
1131
Manuel Klimekb3987012013-05-29 14:47:47 +00001132 if (Tok.Previous->is(tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001133 return true;
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001134 if (Tok.is(tok::comma))
1135 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001136 if (Tok.Type == TT_CtorInitializerColon || Tok.Type == TT_ObjCBlockLParen)
1137 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001138 if (Tok.Previous->Tok.is(tok::kw_operator))
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001139 return false;
1140 if (Tok.Type == TT_OverloadedOperatorLParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001141 return false;
1142 if (Tok.is(tok::colon))
Manuel Klimekb3987012013-05-29 14:47:47 +00001143 return !Line.First->isOneOf(tok::kw_case, tok::kw_default) &&
Daniel Jasperac3223e2013-04-10 09:49:49 +00001144 Tok.getNextNoneComment() != NULL && Tok.Type != TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +00001145 if (Tok.Previous->Type == TT_UnaryOperator ||
1146 Tok.Previous->Type == TT_CastRParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001147 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001148 if (Tok.Previous->is(tok::greater) && Tok.is(tok::greater)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +00001149 return Tok.Type == TT_TemplateCloser &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001150 Tok.Previous->Type == TT_TemplateCloser &&
Daniel Jasper29f123b2013-02-08 15:28:42 +00001151 Style.Standard != FormatStyle::LS_Cpp11;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001152 }
Alexander Kornienko54a38bd2013-03-20 16:41:56 +00001153 if (Tok.isOneOf(tok::arrowstar, tok::periodstar) ||
Manuel Klimekb3987012013-05-29 14:47:47 +00001154 Tok.Previous->isOneOf(tok::arrowstar, tok::periodstar))
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001155 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001156 if (Tok.Type == TT_BinaryOperator || Tok.Previous->Type == TT_BinaryOperator)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001157 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001158 if (Tok.Previous->Type == TT_TemplateCloser && Tok.is(tok::l_paren))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001159 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001160 if (Tok.is(tok::less) && Line.First->is(tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001161 return true;
1162 if (Tok.Type == TT_TrailingUnaryOperator)
1163 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001164 return spaceRequiredBetween(Line, *Tok.Previous, Tok);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001165}
1166
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001167bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001168 const FormatToken &Right) {
1169 const FormatToken &Left = *Right.Previous;
Daniel Jaspera03ab102013-02-13 20:33:44 +00001170 if (Right.Type == TT_StartOfName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001171 return true;
Nico Weberf2ff8122013-05-26 05:39:26 +00001172 if (Right.is(tok::colon) &&
1173 (Right.Type == TT_ObjCDictLiteral || Right.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001174 return false;
Nico Weberf2ff8122013-05-26 05:39:26 +00001175 if (Left.is(tok::colon) &&
1176 (Left.Type == TT_ObjCDictLiteral || Left.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001177 return true;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001178 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001179 return true;
1180 if (Left.ClosesTemplateDeclaration)
1181 return true;
1182 if (Right.Type == TT_ConditionalExpr || Right.is(tok::question))
1183 return true;
Daniel Jasper6cabab42013-02-14 08:42:54 +00001184 if (Right.Type == TT_RangeBasedForLoopColon ||
Daniel Jasper27b91cc2013-04-05 17:21:59 +00001185 Right.Type == TT_OverloadedOperatorLParen)
Daniel Jasper6cabab42013-02-14 08:42:54 +00001186 return false;
Daniel Jasperc194c952013-05-06 06:45:09 +00001187 if (Left.Type == TT_RangeBasedForLoopColon)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001188 return true;
Daniel Jasper7d812812013-02-21 15:00:29 +00001189 if (Right.Type == TT_RangeBasedForLoopColon)
1190 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001191 if (Left.Type == TT_PointerOrReference || Left.Type == TT_TemplateCloser ||
1192 Left.Type == TT_UnaryOperator || Left.Type == TT_ConditionalExpr ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001193 Left.isOneOf(tok::question, tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001194 return false;
1195 if (Left.is(tok::equal) && Line.Type == LT_VirtualFunctionDecl)
1196 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001197 if (Left.is(tok::l_paren) && Right.is(tok::l_paren) && Left.Previous &&
1198 Left.Previous->is(tok::kw___attribute))
Daniel Jasper8ed41002013-02-28 14:44:25 +00001199 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001200
1201 if (Right.Type == TT_LineComment)
1202 // We rely on MustBreakBefore being set correctly here as we should not
1203 // change the "binding" behavior of a comment.
1204 return false;
1205
Daniel Jasper5ad72bb2013-05-22 08:28:26 +00001206 // We only break before r_brace if there was a corresponding break before
1207 // the l_brace, which is tracked by BreakBeforeClosingBrace.
1208 if (Right.isOneOf(tok::r_brace, tok::r_paren, tok::greater))
1209 return false;
1210
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001211 // Allow breaking after a trailing 'const', e.g. after a method declaration,
1212 // unless it is follow by ';', '{' or '='.
Manuel Klimekb3987012013-05-29 14:47:47 +00001213 if (Left.is(tok::kw_const) && Left.Previous != NULL &&
1214 Left.Previous->is(tok::r_paren))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001215 return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001216
Daniel Jasper8ef19a22013-03-14 09:50:46 +00001217 if (Right.is(tok::kw___attribute))
1218 return true;
1219
Daniel Jasper3a204412013-02-23 07:46:38 +00001220 if (Left.is(tok::identifier) && Right.is(tok::string_literal))
1221 return true;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001222 return (Left.isBinaryOperator() && Left.isNot(tok::lessless)) ||
Daniel Jasper6b119d62013-04-05 17:22:09 +00001223 Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace,
1224 tok::kw_class, tok::kw_struct) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001225 Right.isOneOf(tok::lessless, tok::arrow, tok::period, tok::colon) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001226 (Left.is(tok::r_paren) && Left.Type != TT_CastRParen &&
Daniel Jaspere033e872013-05-21 09:16:31 +00001227 Right.isOneOf(tok::identifier, tok::kw_const, tok::kw___attribute)) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001228 (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
1229 (Left.is(tok::l_square) && !Right.is(tok::r_square));
1230}
1231
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001232void TokenAnnotator::printDebugInfo(const AnnotatedLine &Line) {
1233 llvm::errs() << "AnnotatedTokens:\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001234 const FormatToken *Tok = Line.First;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001235 while (Tok) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001236 llvm::errs() << " M=" << Tok->MustBreakBefore
1237 << " C=" << Tok->CanBreakBefore << " T=" << Tok->Type << " S="
1238 << Tok->SpacesRequiredBefore << " P=" << Tok->SplitPenalty
1239 << " Name=" << Tok->Tok.getName() << " FakeLParens=";
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001240 for (unsigned i = 0, e = Tok->FakeLParens.size(); i != e; ++i)
1241 llvm::errs() << Tok->FakeLParens[i] << "/";
1242 llvm::errs() << " FakeRParens=" << Tok->FakeRParens << "\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001243 Tok = Tok->Next;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001244 }
1245 llvm::errs() << "----\n";
1246}
1247
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001248} // namespace format
1249} // namespace clang