blob: 97be71c277ee1ce46db235a57bb6394f2e63756d [file] [log] [blame]
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements a token annotator, i.e. creates
12/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
13///
14//===----------------------------------------------------------------------===//
15
16#include "TokenAnnotator.h"
17#include "clang/Basic/SourceManager.h"
Daniel Jasperbf71ba22013-04-08 20:33:42 +000018#include "llvm/Support/Debug.h"
Daniel Jasper32d28ee2013-01-29 21:01:14 +000019
20namespace clang {
21namespace format {
22
Craig Topper14e66492013-07-01 04:03:19 +000023namespace {
24
Daniel Jasper32d28ee2013-01-29 21:01:14 +000025/// \brief A parser that gathers additional information about tokens.
26///
/// The \c TokenAnnotator tries to match parentheses and square brackets and
/// to store parenthesis levels. It also tries to resolve matching "<" and ">"
29/// into template parameter lists.
30class AnnotatingParser {
31public:
Alexander Kornienko00895102013-06-05 14:09:10 +000032 AnnotatingParser(AnnotatedLine &Line, IdentifierInfo &Ident_in)
33 : Line(Line), CurrentToken(Line.First), KeywordVirtualFound(false),
Daniel Jasper2ca37412013-07-09 14:36:48 +000034 NameFound(false), AutoFound(false), Ident_in(Ident_in) {
Nico Weber27268772013-06-26 00:30:14 +000035 Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/false));
Daniel Jasper32d28ee2013-01-29 21:01:14 +000036 }
37
Nico Weber95e8e462013-02-12 16:17:07 +000038private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +000039 bool parseAngle() {
40 if (CurrentToken == NULL)
41 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000042 ScopedContextCreator ContextCreator(*this, tok::less, 10);
Manuel Klimekb3987012013-05-29 14:47:47 +000043 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +000044 Contexts.back().IsExpression = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000045 while (CurrentToken != NULL) {
46 if (CurrentToken->is(tok::greater)) {
47 Left->MatchingParen = CurrentToken;
48 CurrentToken->MatchingParen = Left;
49 CurrentToken->Type = TT_TemplateCloser;
50 next();
51 return true;
52 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +000053 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace,
Daniel Jasper5d823e32013-05-15 13:46:48 +000054 tok::question, tok::colon))
55 return false;
Daniel Jasper0348be02013-06-01 18:56:00 +000056 // If a && or || is found and interpreted as a binary operator, this set
Daniel Jasper15f33f02013-06-03 16:16:41 +000057 // of angles is likely part of something like "a < b && c > d". If the
Daniel Jasper0348be02013-06-01 18:56:00 +000058 // angles are inside an expression, the ||/&& might also be a binary
59 // operator that was misinterpreted because we are parsing template
60 // parameters.
61 // FIXME: This is getting out of hand, write a decent parser.
Manuel Klimekb3987012013-05-29 14:47:47 +000062 if (CurrentToken->Previous->isOneOf(tok::pipepipe, tok::ampamp) &&
Daniel Jasper0348be02013-06-01 18:56:00 +000063 (CurrentToken->Previous->Type == TT_BinaryOperator ||
64 Contexts[Contexts.size() - 2].IsExpression) &&
Manuel Klimekb3987012013-05-29 14:47:47 +000065 Line.First->isNot(tok::kw_template))
Daniel Jasper32d28ee2013-01-29 21:01:14 +000066 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +000067 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +000068 if (!consumeToken())
69 return false;
70 }
71 return false;
72 }
73
74 bool parseParens(bool LookForDecls = false) {
75 if (CurrentToken == NULL)
76 return false;
Daniel Jasper923ebef2013-03-14 13:45:21 +000077 ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
Daniel Jasper4e778092013-02-06 10:05:46 +000078
79 // FIXME: This is a bit of a hack. Do better.
80 Contexts.back().ColonIsForRangeExpr =
81 Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
82
Daniel Jasper32d28ee2013-01-29 21:01:14 +000083 bool StartsObjCMethodExpr = false;
Manuel Klimekb3987012013-05-29 14:47:47 +000084 FormatToken *Left = CurrentToken->Previous;
Daniel Jasper32d28ee2013-01-29 21:01:14 +000085 if (CurrentToken->is(tok::caret)) {
86 // ^( starts a block.
87 Left->Type = TT_ObjCBlockLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +000088 } else if (FormatToken *MaybeSel = Left->Previous) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000089 // @selector( starts a selector.
Manuel Klimekb3987012013-05-29 14:47:47 +000090 if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Previous &&
91 MaybeSel->Previous->is(tok::at)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +000092 StartsObjCMethodExpr = true;
93 }
94 }
95
Daniel Jasper4e778092013-02-06 10:05:46 +000096 if (StartsObjCMethodExpr) {
97 Contexts.back().ColonIsObjCMethodExpr = true;
98 Left->Type = TT_ObjCMethodExpr;
99 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000100
Daniel Jasper431f5912013-05-28 08:33:00 +0000101 bool MightBeFunctionType = CurrentToken->is(tok::star);
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000102 bool HasMultipleLines = false;
103 bool HasMultipleParametersOnALine = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000104 while (CurrentToken != NULL) {
105 // LookForDecls is set when "if (" has been seen. Check for
106 // 'identifier' '*' 'identifier' followed by not '=' -- this
107 // '*' has to be a binary operator but determineStarAmpUsage() will
108 // categorize it as an unary operator, so set the right type here.
Manuel Klimekb3987012013-05-29 14:47:47 +0000109 if (LookForDecls && CurrentToken->Next) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000110 FormatToken *Prev = CurrentToken->getPreviousNonComment();
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000111 if (Prev) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000112 FormatToken *PrevPrev = Prev->getPreviousNonComment();
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000113 FormatToken *Next = CurrentToken->Next;
114 if (PrevPrev && PrevPrev->is(tok::identifier) &&
115 Prev->isOneOf(tok::star, tok::amp, tok::ampamp) &&
116 CurrentToken->is(tok::identifier) && Next->isNot(tok::equal)) {
117 Prev->Type = TT_BinaryOperator;
118 LookForDecls = false;
119 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000120 }
121 }
122
123 if (CurrentToken->is(tok::r_paren)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000124 if (MightBeFunctionType && CurrentToken->Next &&
Daniel Jaspere7d3bff2013-07-16 11:37:21 +0000125 (CurrentToken->Next->is(tok::l_paren) ||
126 (CurrentToken->Next->is(tok::l_square) &&
127 !Contexts.back().IsExpression)))
Daniel Jasper431f5912013-05-28 08:33:00 +0000128 Left->Type = TT_FunctionTypeLParen;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000129 Left->MatchingParen = CurrentToken;
130 CurrentToken->MatchingParen = Left;
131
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000132 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000133 CurrentToken->Type = TT_ObjCMethodExpr;
134 if (Contexts.back().FirstObjCSelectorName != NULL) {
135 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
136 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000137 }
138 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000139
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000140 if (!HasMultipleLines)
141 Left->PackingKind = PPK_Inconclusive;
142 else if (HasMultipleParametersOnALine)
143 Left->PackingKind = PPK_BinPacked;
144 else
145 Left->PackingKind = PPK_OnePerLine;
146
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000147 next();
148 return true;
149 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000150 if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000151 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +0000152 if (CurrentToken->Previous->Type == TT_PointerOrReference &&
153 CurrentToken->Previous->Previous->isOneOf(tok::l_paren,
154 tok::coloncolon))
Daniel Jasper431f5912013-05-28 08:33:00 +0000155 MightBeFunctionType = true;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000156 updateParameterCount(Left, CurrentToken);
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000157 if (CurrentToken->is(tok::comma) && CurrentToken->Next &&
158 !CurrentToken->Next->HasUnescapedNewline &&
159 !CurrentToken->Next->isTrailingComment())
160 HasMultipleParametersOnALine = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000161 if (!consumeToken())
162 return false;
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000163 if (CurrentToken && CurrentToken->HasUnescapedNewline)
164 HasMultipleLines = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000165 }
166 return false;
167 }
168
169 bool parseSquare() {
170 if (!CurrentToken)
171 return false;
172
Alexander Kornienkod71b15b2013-06-17 13:19:53 +0000173 // A '[' could be an index subscript (after an identifier or after
Nico Weber051860e2013-02-10 02:08:05 +0000174 // ')' or ']'), it could be the start of an Objective-C method
175 // expression, or it could the the start of an Objective-C array literal.
Manuel Klimekb3987012013-05-29 14:47:47 +0000176 FormatToken *Left = CurrentToken->Previous;
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000177 FormatToken *Parent = Left->getPreviousNonComment();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000178 bool StartsObjCMethodExpr =
Daniel Jasper6f21a982013-03-13 07:49:51 +0000179 Contexts.back().CanBeExpression &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000180 (!Parent || Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
181 tok::kw_return, tok::kw_throw) ||
Daniel Jasperac3223e2013-04-10 09:49:49 +0000182 Parent->isUnaryOperator() || Parent->Type == TT_ObjCForIn ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000183 Parent->Type == TT_CastRParen ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000184 getBinOpPrecedence(Parent->Tok.getKind(), true, true) > prec::Unknown);
Daniel Jasper923ebef2013-03-14 13:45:21 +0000185 ScopedContextCreator ContextCreator(*this, tok::l_square, 10);
Daniel Jasper6f21a982013-03-13 07:49:51 +0000186 Contexts.back().IsExpression = true;
Nico Weber051860e2013-02-10 02:08:05 +0000187 bool StartsObjCArrayLiteral = Parent && Parent->is(tok::at);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000188
Daniel Jasper4e778092013-02-06 10:05:46 +0000189 if (StartsObjCMethodExpr) {
190 Contexts.back().ColonIsObjCMethodExpr = true;
191 Left->Type = TT_ObjCMethodExpr;
Nico Weber051860e2013-02-10 02:08:05 +0000192 } else if (StartsObjCArrayLiteral) {
193 Left->Type = TT_ObjCArrayLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000194 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000195
196 while (CurrentToken != NULL) {
197 if (CurrentToken->is(tok::r_square)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000198 if (CurrentToken->Next && CurrentToken->Next->is(tok::l_paren)) {
Nico Webere8a97982013-02-06 06:20:11 +0000199 // An ObjC method call is rarely followed by an open parenthesis.
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000200 // FIXME: Do we incorrectly label ":" with this?
201 StartsObjCMethodExpr = false;
202 Left->Type = TT_Unknown;
203 }
Daniel Jasper01786732013-02-04 07:21:18 +0000204 if (StartsObjCMethodExpr) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000205 CurrentToken->Type = TT_ObjCMethodExpr;
Nico Webere8a97982013-02-06 06:20:11 +0000206 // determineStarAmpUsage() thinks that '*' '[' is allocating an
207 // array of pointers, but if '[' starts a selector then '*' is a
208 // binary operator.
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +0000209 if (Parent != NULL && Parent->Type == TT_PointerOrReference)
Nico Weber4ed7f3e2013-02-06 16:54:35 +0000210 Parent->Type = TT_BinaryOperator;
Nico Weber051860e2013-02-10 02:08:05 +0000211 } else if (StartsObjCArrayLiteral) {
212 CurrentToken->Type = TT_ObjCArrayLiteral;
Daniel Jasper01786732013-02-04 07:21:18 +0000213 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000214 Left->MatchingParen = CurrentToken;
215 CurrentToken->MatchingParen = Left;
Daniel Jasper4e778092013-02-06 10:05:46 +0000216 if (Contexts.back().FirstObjCSelectorName != NULL)
217 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
218 Contexts.back().LongestObjCSelectorName;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000219 next();
220 return true;
221 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000222 if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000223 return false;
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000224 updateParameterCount(Left, CurrentToken);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000225 if (!consumeToken())
226 return false;
227 }
228 return false;
229 }
230
231 bool parseBrace() {
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000232 if (CurrentToken != NULL) {
233 ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
Manuel Klimekb3987012013-05-29 14:47:47 +0000234 FormatToken *Left = CurrentToken->Previous;
Nico Weberf2ff8122013-05-26 05:39:26 +0000235
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000236 FormatToken *Parent = Left->getPreviousNonComment();
Nico Weberf2ff8122013-05-26 05:39:26 +0000237 bool StartsObjCDictLiteral = Parent && Parent->is(tok::at);
238 if (StartsObjCDictLiteral) {
239 Contexts.back().ColonIsObjCDictLiteral = true;
240 Left->Type = TT_ObjCDictLiteral;
241 }
242
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000243 while (CurrentToken != NULL) {
244 if (CurrentToken->is(tok::r_brace)) {
Nico Weberf2ff8122013-05-26 05:39:26 +0000245 if (StartsObjCDictLiteral)
246 CurrentToken->Type = TT_ObjCDictLiteral;
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000247 Left->MatchingParen = CurrentToken;
248 CurrentToken->MatchingParen = Left;
249 next();
250 return true;
251 }
252 if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
253 return false;
254 updateParameterCount(Left, CurrentToken);
255 if (!consumeToken())
256 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000257 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000258 }
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000259 // No closing "}" found, this probably starts a definition.
260 Line.StartsDefinition = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000261 return true;
262 }
Daniel Jasperc4615b72013-02-20 12:56:39 +0000263
Manuel Klimekb3987012013-05-29 14:47:47 +0000264 void updateParameterCount(FormatToken *Left, FormatToken *Current) {
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000265 if (Current->is(tok::comma)) {
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000266 ++Left->ParameterCount;
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000267 } else if (Left->ParameterCount == 0 && Current->isNot(tok::comment)) {
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000268 Left->ParameterCount = 1;
Daniel Jasperc7bd68f2013-07-10 14:02:49 +0000269 }
Daniel Jasper9fc56f22013-02-14 15:01:34 +0000270 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000271
272 bool parseConditional() {
273 while (CurrentToken != NULL) {
274 if (CurrentToken->is(tok::colon)) {
275 CurrentToken->Type = TT_ConditionalExpr;
276 next();
277 return true;
278 }
279 if (!consumeToken())
280 return false;
281 }
282 return false;
283 }
284
285 bool parseTemplateDeclaration() {
286 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
287 CurrentToken->Type = TT_TemplateOpener;
288 next();
289 if (!parseAngle())
290 return false;
Daniel Jasper34511fb2013-02-19 17:14:38 +0000291 if (CurrentToken != NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000292 CurrentToken->Previous->ClosesTemplateDeclaration = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000293 return true;
294 }
295 return false;
296 }
297
298 bool consumeToken() {
Manuel Klimekb3987012013-05-29 14:47:47 +0000299 FormatToken *Tok = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000300 next();
Manuel Klimekb3987012013-05-29 14:47:47 +0000301 switch (Tok->Tok.getKind()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000302 case tok::plus:
303 case tok::minus:
Manuel Klimekb3987012013-05-29 14:47:47 +0000304 if (Tok->Previous == NULL && Line.MustBeDeclaration)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000305 Tok->Type = TT_ObjCMethodSpecifier;
306 break;
307 case tok::colon:
Manuel Klimekb3987012013-05-29 14:47:47 +0000308 if (Tok->Previous == NULL)
Daniel Jaspercf6d76a2013-03-18 12:50:26 +0000309 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000310 // Colons from ?: are handled in parseConditional().
Manuel Klimekb3987012013-05-29 14:47:47 +0000311 if (Tok->Previous->is(tok::r_paren) && Contexts.size() == 1) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000312 Tok->Type = TT_CtorInitializerColon;
Nico Weberf2ff8122013-05-26 05:39:26 +0000313 } else if (Contexts.back().ColonIsObjCDictLiteral) {
314 Tok->Type = TT_ObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000315 } else if (Contexts.back().ColonIsObjCMethodExpr ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000316 Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000317 Tok->Type = TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000318 Tok->Previous->Type = TT_ObjCSelectorName;
Alexander Kornienko00895102013-06-05 14:09:10 +0000319 if (Tok->Previous->CodePointCount >
320 Contexts.back().LongestObjCSelectorName) {
321 Contexts.back().LongestObjCSelectorName =
322 Tok->Previous->CodePointCount;
323 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000324 if (Contexts.back().FirstObjCSelectorName == NULL)
Manuel Klimekb3987012013-05-29 14:47:47 +0000325 Contexts.back().FirstObjCSelectorName = Tok->Previous;
Daniel Jasper4e778092013-02-06 10:05:46 +0000326 } else if (Contexts.back().ColonIsForRangeExpr) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000327 Tok->Type = TT_RangeBasedForLoopColon;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000328 } else if (Contexts.size() == 1) {
329 Tok->Type = TT_InheritanceColon;
Daniel Jasper923ebef2013-03-14 13:45:21 +0000330 } else if (Contexts.back().ContextKind == tok::l_paren) {
331 Tok->Type = TT_InlineASMColon;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000332 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000333 break;
334 case tok::kw_if:
335 case tok::kw_while:
336 if (CurrentToken != NULL && CurrentToken->is(tok::l_paren)) {
337 next();
Nico Weber27268772013-06-26 00:30:14 +0000338 if (!parseParens(/*LookForDecls=*/true))
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000339 return false;
340 }
341 break;
342 case tok::kw_for:
Daniel Jasper4e778092013-02-06 10:05:46 +0000343 Contexts.back().ColonIsForRangeExpr = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000344 next();
345 if (!parseParens())
346 return false;
347 break;
348 case tok::l_paren:
349 if (!parseParens())
350 return false;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000351 if (Line.MustBeDeclaration && NameFound && !Contexts.back().IsExpression)
Daniel Jasper3c08a812013-02-24 18:54:32 +0000352 Line.MightBeFunctionDecl = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000353 break;
354 case tok::l_square:
355 if (!parseSquare())
356 return false;
357 break;
358 case tok::l_brace:
359 if (!parseBrace())
360 return false;
361 break;
362 case tok::less:
363 if (parseAngle())
364 Tok->Type = TT_TemplateOpener;
365 else {
366 Tok->Type = TT_BinaryOperator;
367 CurrentToken = Tok;
368 next();
369 }
370 break;
371 case tok::r_paren:
372 case tok::r_square:
373 return false;
374 case tok::r_brace:
375 // Lines can start with '}'.
Manuel Klimekb3987012013-05-29 14:47:47 +0000376 if (Tok->Previous != NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000377 return false;
378 break;
379 case tok::greater:
380 Tok->Type = TT_BinaryOperator;
381 break;
382 case tok::kw_operator:
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000383 while (CurrentToken && CurrentToken->isNot(tok::l_paren)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000384 if (CurrentToken->isOneOf(tok::star, tok::amp))
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000385 CurrentToken->Type = TT_PointerOrReference;
386 consumeToken();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000387 }
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000388 if (CurrentToken) {
Daniel Jasper2b4c9242013-02-11 08:01:18 +0000389 CurrentToken->Type = TT_OverloadedOperatorLParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000390 if (CurrentToken->Previous->Type == TT_BinaryOperator)
391 CurrentToken->Previous->Type = TT_OverloadedOperator;
Daniel Jasper6ea933c2013-05-10 07:59:58 +0000392 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000393 break;
394 case tok::question:
395 parseConditional();
396 break;
397 case tok::kw_template:
398 parseTemplateDeclaration();
399 break;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000400 case tok::identifier:
Manuel Klimekb3987012013-05-29 14:47:47 +0000401 if (Line.First->is(tok::kw_for) &&
402 Tok->Tok.getIdentifierInfo() == &Ident_in)
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000403 Tok->Type = TT_ObjCForIn;
404 break;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000405 case tok::comma:
406 if (Contexts.back().FirstStartOfName)
407 Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
408 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000409 default:
410 break;
411 }
412 return true;
413 }
414
415 void parseIncludeDirective() {
416 next();
417 if (CurrentToken != NULL && CurrentToken->is(tok::less)) {
418 next();
419 while (CurrentToken != NULL) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000420 if (CurrentToken->isNot(tok::comment) || CurrentToken->Next)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000421 CurrentToken->Type = TT_ImplicitStringLiteral;
422 next();
423 }
424 } else {
425 while (CurrentToken != NULL) {
Daniel Jasper3a204412013-02-23 07:46:38 +0000426 if (CurrentToken->is(tok::string_literal))
427 // Mark these string literals as "implicit" literals, too, so that
428 // they are not split or line-wrapped.
429 CurrentToken->Type = TT_ImplicitStringLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000430 next();
431 }
432 }
433 }
434
435 void parseWarningOrError() {
436 next();
437 // We still want to format the whitespace left of the first token of the
438 // warning or error.
439 next();
440 while (CurrentToken != NULL) {
441 CurrentToken->Type = TT_ImplicitStringLiteral;
442 next();
443 }
444 }
445
446 void parsePreprocessorDirective() {
447 next();
448 if (CurrentToken == NULL)
449 return;
450 // Hashes in the middle of a line can lead to any strange token
451 // sequence.
Manuel Klimekb3987012013-05-29 14:47:47 +0000452 if (CurrentToken->Tok.getIdentifierInfo() == NULL)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000453 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000454 switch (CurrentToken->Tok.getIdentifierInfo()->getPPKeywordID()) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000455 case tok::pp_include:
456 case tok::pp_import:
457 parseIncludeDirective();
458 break;
459 case tok::pp_error:
460 case tok::pp_warning:
461 parseWarningOrError();
462 break;
Daniel Jasperaae7bad2013-04-23 13:54:04 +0000463 case tok::pp_if:
464 case tok::pp_elif:
465 parseLine();
466 break;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000467 default:
468 break;
469 }
Daniel Jasper5b7e7b02013-02-05 09:34:14 +0000470 while (CurrentToken != NULL)
471 next();
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000472 }
473
Nico Weber95e8e462013-02-12 16:17:07 +0000474public:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000475 LineType parseLine() {
476 int PeriodsAndArrows = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000477 FormatToken *LastPeriodOrArrow = NULL;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000478 bool CanBeBuilderTypeStmt = true;
479 if (CurrentToken->is(tok::hash)) {
480 parsePreprocessorDirective();
481 return LT_PreprocessorDirective;
482 }
483 while (CurrentToken != NULL) {
484 if (CurrentToken->is(tok::kw_virtual))
485 KeywordVirtualFound = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000486 if (CurrentToken->isOneOf(tok::period, tok::arrow)) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000487 ++PeriodsAndArrows;
Daniel Jasper24849712013-03-01 16:48:32 +0000488 LastPeriodOrArrow = CurrentToken;
489 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000490 FormatToken *TheToken = CurrentToken;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000491 if (!consumeToken())
492 return LT_Invalid;
Manuel Klimekb3987012013-05-29 14:47:47 +0000493 if (TheToken->getPrecedence() > prec::Assignment &&
Daniel Jasper82282dc2013-02-18 13:52:06 +0000494 TheToken->Type == TT_BinaryOperator)
Daniel Jasper4a544e52013-02-15 20:33:06 +0000495 CanBeBuilderTypeStmt = false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000496 }
497 if (KeywordVirtualFound)
498 return LT_VirtualFunctionDecl;
499
500 // Assume a builder-type call if there are 2 or more "." and "->".
Daniel Jasper24849712013-03-01 16:48:32 +0000501 if (PeriodsAndArrows >= 2 && CanBeBuilderTypeStmt) {
502 LastPeriodOrArrow->LastInChainOfCalls = true;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000503 return LT_BuilderTypeCall;
Daniel Jasper24849712013-03-01 16:48:32 +0000504 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000505
Manuel Klimekb3987012013-05-29 14:47:47 +0000506 if (Line.First->Type == TT_ObjCMethodSpecifier) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000507 if (Contexts.back().FirstObjCSelectorName != NULL)
508 Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
509 Contexts.back().LongestObjCSelectorName;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000510 return LT_ObjCMethodDecl;
511 }
512
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000513 return LT_Other;
514 }
515
Nico Weber95e8e462013-02-12 16:17:07 +0000516private:
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000517 void next() {
Daniel Jasper01786732013-02-04 07:21:18 +0000518 if (CurrentToken != NULL) {
519 determineTokenType(*CurrentToken);
Daniel Jasper4e778092013-02-06 10:05:46 +0000520 CurrentToken->BindingStrength = Contexts.back().BindingStrength;
Daniel Jasper01786732013-02-04 07:21:18 +0000521 }
522
Manuel Klimekb3987012013-05-29 14:47:47 +0000523 if (CurrentToken != NULL)
524 CurrentToken = CurrentToken->Next;
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000525
526 // Reset token type in case we have already looked at it and then recovered
527 // from an error (e.g. failure to find the matching >).
528 if (CurrentToken != NULL)
529 CurrentToken->Type = TT_Unknown;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000530 }
531
Daniel Jasper4e778092013-02-06 10:05:46 +0000532 /// \brief A struct to hold information valid in a specific context, e.g.
533 /// a pair of parenthesis.
534 struct Context {
Daniel Jasper923ebef2013-03-14 13:45:21 +0000535 Context(tok::TokenKind ContextKind, unsigned BindingStrength,
536 bool IsExpression)
537 : ContextKind(ContextKind), BindingStrength(BindingStrength),
538 LongestObjCSelectorName(0), ColonIsForRangeExpr(false),
Nico Weberf2ff8122013-05-26 05:39:26 +0000539 ColonIsObjCDictLiteral(false), ColonIsObjCMethodExpr(false),
540 FirstObjCSelectorName(NULL), FirstStartOfName(NULL),
541 IsExpression(IsExpression), CanBeExpression(true) {}
Daniel Jasper01786732013-02-04 07:21:18 +0000542
Daniel Jasper923ebef2013-03-14 13:45:21 +0000543 tok::TokenKind ContextKind;
Daniel Jasper4e778092013-02-06 10:05:46 +0000544 unsigned BindingStrength;
545 unsigned LongestObjCSelectorName;
546 bool ColonIsForRangeExpr;
Nico Weberf2ff8122013-05-26 05:39:26 +0000547 bool ColonIsObjCDictLiteral;
Daniel Jasper4e778092013-02-06 10:05:46 +0000548 bool ColonIsObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +0000549 FormatToken *FirstObjCSelectorName;
550 FormatToken *FirstStartOfName;
Daniel Jasper4e778092013-02-06 10:05:46 +0000551 bool IsExpression;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000552 bool CanBeExpression;
Daniel Jasper4e778092013-02-06 10:05:46 +0000553 };
554
555 /// \brief Puts a new \c Context onto the stack \c Contexts for the lifetime
556 /// of each instance.
557 struct ScopedContextCreator {
558 AnnotatingParser &P;
559
Daniel Jasper923ebef2013-03-14 13:45:21 +0000560 ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
561 unsigned Increase)
562 : P(P) {
Daniel Jasper2a409b62013-07-08 14:34:09 +0000563 P.Contexts.push_back(Context(ContextKind,
564 P.Contexts.back().BindingStrength + Increase,
565 P.Contexts.back().IsExpression));
Daniel Jasper4e778092013-02-06 10:05:46 +0000566 }
567
568 ~ScopedContextCreator() { P.Contexts.pop_back(); }
569 };
Daniel Jasper01786732013-02-04 07:21:18 +0000570
Manuel Klimekb3987012013-05-29 14:47:47 +0000571 void determineTokenType(FormatToken &Current) {
572 if (Current.getPrecedence() == prec::Assignment &&
573 (!Current.Previous || Current.Previous->isNot(tok::kw_operator))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000574 Contexts.back().IsExpression = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000575 for (FormatToken *Previous = Current.Previous;
Nico Weber95e8e462013-02-12 16:17:07 +0000576 Previous && Previous->isNot(tok::comma);
Manuel Klimekb3987012013-05-29 14:47:47 +0000577 Previous = Previous->Previous) {
Daniel Jasper9c65b062013-02-27 11:43:50 +0000578 if (Previous->is(tok::r_square))
579 Previous = Previous->MatchingParen;
Daniel Jasper01786732013-02-04 07:21:18 +0000580 if (Previous->Type == TT_BinaryOperator &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000581 Previous->isOneOf(tok::star, tok::amp)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000582 Previous->Type = TT_PointerOrReference;
583 }
Daniel Jasper01786732013-02-04 07:21:18 +0000584 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000585 } else if (Current.isOneOf(tok::kw_return, tok::kw_throw) ||
Nico Weber95e8e462013-02-12 16:17:07 +0000586 (Current.is(tok::l_paren) && !Line.MustBeDeclaration &&
Daniel Jasper378d93d2013-05-13 07:14:40 +0000587 !Line.InPPDirective &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000588 (!Current.Previous || Current.Previous->isNot(tok::kw_for)))) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000589 Contexts.back().IsExpression = true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000590 } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000591 for (FormatToken *Previous = Current.Previous;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000592 Previous && Previous->isOneOf(tok::star, tok::amp);
Manuel Klimekb3987012013-05-29 14:47:47 +0000593 Previous = Previous->Previous)
Nico Weber95e8e462013-02-12 16:17:07 +0000594 Previous->Type = TT_PointerOrReference;
Manuel Klimekb3987012013-05-29 14:47:47 +0000595 } else if (Current.Previous &&
596 Current.Previous->Type == TT_CtorInitializerColon) {
Daniel Jasperd0f349b2013-02-18 12:44:35 +0000597 Contexts.back().IsExpression = true;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000598 } else if (Current.is(tok::kw_new)) {
599 Contexts.back().CanBeExpression = false;
Daniel Jasper16a69ef2013-05-03 14:41:24 +0000600 } else if (Current.is(tok::semi)) {
601 // This should be the condition or increment in a for-loop.
602 Contexts.back().IsExpression = true;
Nico Weber95e8e462013-02-12 16:17:07 +0000603 }
Daniel Jasper01786732013-02-04 07:21:18 +0000604
605 if (Current.Type == TT_Unknown) {
Daniel Jasper6ac431c2013-07-02 09:47:29 +0000606 if (isStartOfName(Current)) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000607 Contexts.back().FirstStartOfName = &Current;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000608 Current.Type = TT_StartOfName;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000609 NameFound = true;
Daniel Jasper2ca37412013-07-09 14:36:48 +0000610 } else if (Current.is(tok::kw_auto)) {
611 AutoFound = true;
Daniel Jasper3262f4c2013-07-11 14:33:06 +0000612 } else if (Current.is(tok::arrow) && AutoFound &&
613 Line.MustBeDeclaration) {
Daniel Jasper2ca37412013-07-09 14:36:48 +0000614 Current.Type = TT_TrailingReturnArrow;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000615 } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
Daniel Jasper4e778092013-02-06 10:05:46 +0000616 Current.Type =
Daniel Jasperd6104f62013-07-05 13:30:40 +0000617 determineStarAmpUsage(Current, Contexts.back().CanBeExpression &&
618 Contexts.back().IsExpression);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000619 } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000620 Current.Type = determinePlusMinusCaretUsage(Current);
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000621 } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
Daniel Jasper01786732013-02-04 07:21:18 +0000622 Current.Type = determineIncrementUsage(Current);
623 } else if (Current.is(tok::exclaim)) {
624 Current.Type = TT_UnaryOperator;
Daniel Jasperac3223e2013-04-10 09:49:49 +0000625 } else if (Current.isBinaryOperator()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000626 Current.Type = TT_BinaryOperator;
627 } else if (Current.is(tok::comment)) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000628 if (Current.TokenText.startswith("//"))
Daniel Jasper01786732013-02-04 07:21:18 +0000629 Current.Type = TT_LineComment;
630 else
631 Current.Type = TT_BlockComment;
Nico Weber37d69312013-02-13 04:13:13 +0000632 } else if (Current.is(tok::r_paren)) {
Daniel Jasperb8b42952013-05-31 16:14:28 +0000633 FormatToken *LeftOfParens = NULL;
634 if (Current.MatchingParen)
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000635 LeftOfParens = Current.MatchingParen->getPreviousNonComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000636 bool IsCast = false;
637 bool ParensAreEmpty = Current.Previous == Current.MatchingParen;
638 bool ParensAreType = !Current.Previous ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000639 Current.Previous->Type == TT_PointerOrReference ||
Daniel Jasperb8b42952013-05-31 16:14:28 +0000640 Current.Previous->Type == TT_TemplateCloser ||
641 isSimpleTypeSpecifier(*Current.Previous);
Nico Weber37d69312013-02-13 04:13:13 +0000642 bool ParensCouldEndDecl =
Manuel Klimekb3987012013-05-29 14:47:47 +0000643 Current.Next &&
644 Current.Next->isOneOf(tok::equal, tok::semi, tok::l_brace);
Daniel Jasper6a365aa2013-03-13 17:13:53 +0000645 bool IsSizeOfOrAlignOf =
Daniel Jasperb8b42952013-05-31 16:14:28 +0000646 LeftOfParens &&
647 LeftOfParens->isOneOf(tok::kw_sizeof, tok::kw_alignof);
648 if (ParensAreType && !ParensCouldEndDecl && !IsSizeOfOrAlignOf &&
Daniel Jasper0c368782013-07-15 15:04:42 +0000649 (Contexts.back().IsExpression ||
650 (Current.Next && Current.Next->isBinaryOperator())))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000651 IsCast = true;
Daniel Jasper2a409b62013-07-08 14:34:09 +0000652 if (Current.Next && Current.Next->isNot(tok::string_literal) &&
Daniel Jasperb8b42952013-05-31 16:14:28 +0000653 (Current.Next->Tok.isLiteral() ||
654 Current.Next->isOneOf(tok::kw_sizeof, tok::kw_alignof)))
655 IsCast = true;
656 // If there is an identifier after the (), it is likely a cast, unless
657 // there is also an identifier before the ().
Daniel Jasperff1a2e52013-06-06 08:20:20 +0000658 if (LeftOfParens && (LeftOfParens->Tok.getIdentifierInfo() == NULL ||
659 LeftOfParens->is(tok::kw_return)) &&
Daniel Jasper526df0f2013-07-08 14:58:01 +0000660 LeftOfParens->Type != TT_OverloadedOperator &&
Nico Weber465e8612013-06-25 00:55:57 +0000661 LeftOfParens->Type != TT_TemplateCloser && Current.Next &&
662 Current.Next->is(tok::identifier))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000663 IsCast = true;
664 if (IsCast && !ParensAreEmpty)
Nico Weber37d69312013-02-13 04:13:13 +0000665 Current.Type = TT_CastRParen;
Manuel Klimekb3987012013-05-29 14:47:47 +0000666 } else if (Current.is(tok::at) && Current.Next) {
667 switch (Current.Next->Tok.getObjCKeywordID()) {
Daniel Jasper01786732013-02-04 07:21:18 +0000668 case tok::objc_interface:
669 case tok::objc_implementation:
670 case tok::objc_protocol:
671 Current.Type = TT_ObjCDecl;
672 break;
673 case tok::objc_property:
674 Current.Type = TT_ObjCProperty;
675 break;
676 default:
677 break;
678 }
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000679 } else if (Current.is(tok::period)) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000680 FormatToken *PreviousNoComment = Current.getPreviousNonComment();
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000681 if (PreviousNoComment &&
682 PreviousNoComment->isOneOf(tok::comma, tok::l_brace))
683 Current.Type = TT_DesignatedInitializerPeriod;
Daniel Jasper01786732013-02-04 07:21:18 +0000684 }
685 }
686 }
687
Daniel Jasper6ac431c2013-07-02 09:47:29 +0000688 /// \brief Take a guess at whether \p Tok starts a name of a function or
689 /// variable declaration.
690 ///
691 /// This is a heuristic based on whether \p Tok is an identifier following
692 /// something that is likely a type.
693 bool isStartOfName(const FormatToken &Tok) {
694 if (Tok.isNot(tok::identifier) || Tok.Previous == NULL)
695 return false;
696
697 // Skip "const" as it does not have an influence on whether this is a name.
698 FormatToken *PreviousNotConst = Tok.Previous;
699 while (PreviousNotConst != NULL && PreviousNotConst->is(tok::kw_const))
700 PreviousNotConst = PreviousNotConst->Previous;
701
702 if (PreviousNotConst == NULL)
703 return false;
704
Daniel Jasper2a409b62013-07-08 14:34:09 +0000705 bool IsPPKeyword = PreviousNotConst->is(tok::identifier) &&
706 PreviousNotConst->Previous &&
707 PreviousNotConst->Previous->is(tok::hash);
Daniel Jasper6ac431c2013-07-02 09:47:29 +0000708
709 return (!IsPPKeyword && PreviousNotConst->is(tok::identifier)) ||
710 PreviousNotConst->Type == TT_PointerOrReference ||
711 PreviousNotConst->Type == TT_TemplateCloser ||
712 isSimpleTypeSpecifier(*PreviousNotConst);
713 }
714
Daniel Jasper01786732013-02-04 07:21:18 +0000715 /// \brief Return the type of the given token assuming it is * or &.
Manuel Klimekb3987012013-05-29 14:47:47 +0000716 TokenType determineStarAmpUsage(const FormatToken &Tok, bool IsExpression) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000717 const FormatToken *PrevToken = Tok.getPreviousNonComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000718 if (PrevToken == NULL)
719 return TT_UnaryOperator;
720
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000721 const FormatToken *NextToken = Tok.getNextNonComment();
Daniel Jasper01786732013-02-04 07:21:18 +0000722 if (NextToken == NULL)
723 return TT_Unknown;
724
Daniel Jasper431f5912013-05-28 08:33:00 +0000725 if (PrevToken->is(tok::coloncolon) ||
726 (PrevToken->is(tok::l_paren) && !IsExpression))
Daniel Jasper8a5d7cd2013-03-01 17:13:29 +0000727 return TT_PointerOrReference;
728
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000729 if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
Daniel Jasperd3cf17b2013-03-14 10:50:25 +0000730 tok::comma, tok::semi, tok::kw_return, tok::colon,
Daniel Jasperdbef71e2013-05-07 14:17:18 +0000731 tok::equal, tok::kw_delete) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000732 PrevToken->Type == TT_BinaryOperator ||
Daniel Jasper01786732013-02-04 07:21:18 +0000733 PrevToken->Type == TT_UnaryOperator || PrevToken->Type == TT_CastRParen)
734 return TT_UnaryOperator;
735
Nico Webere8a97982013-02-06 06:20:11 +0000736 if (NextToken->is(tok::l_square))
737 return TT_PointerOrReference;
738
Manuel Klimekb3987012013-05-29 14:47:47 +0000739 if (PrevToken->Tok.isLiteral() ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000740 PrevToken->isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000741 NextToken->Tok.isLiteral() || NextToken->isUnaryOperator())
Daniel Jasper01786732013-02-04 07:21:18 +0000742 return TT_BinaryOperator;
743
Daniel Jasper01786732013-02-04 07:21:18 +0000744 // It is very unlikely that we are going to find a pointer or reference type
745 // definition on the RHS of an assignment.
746 if (IsExpression)
747 return TT_BinaryOperator;
748
749 return TT_PointerOrReference;
750 }
751
Manuel Klimekb3987012013-05-29 14:47:47 +0000752 TokenType determinePlusMinusCaretUsage(const FormatToken &Tok) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000753 const FormatToken *PrevToken = Tok.getPreviousNonComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000754 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000755 return TT_UnaryOperator;
756
757 // Use heuristics to recognize unary operators.
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000758 if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
759 tok::question, tok::colon, tok::kw_return,
760 tok::kw_case, tok::at, tok::l_brace))
Daniel Jasper01786732013-02-04 07:21:18 +0000761 return TT_UnaryOperator;
762
Nico Weberee0feec2013-02-05 16:21:00 +0000763 // There can't be two consecutive binary operators.
Daniel Jasper01786732013-02-04 07:21:18 +0000764 if (PrevToken->Type == TT_BinaryOperator)
765 return TT_UnaryOperator;
766
767 // Fall back to marking the token as binary operator.
768 return TT_BinaryOperator;
769 }
770
771 /// \brief Determine whether ++/-- are pre- or post-increments/-decrements.
Manuel Klimekb3987012013-05-29 14:47:47 +0000772 TokenType determineIncrementUsage(const FormatToken &Tok) {
Alexander Kornienko0bdc6432013-07-04 14:47:51 +0000773 const FormatToken *PrevToken = Tok.getPreviousNonComment();
Daniel Jasperb8b42952013-05-31 16:14:28 +0000774 if (PrevToken == NULL || PrevToken->Type == TT_CastRParen)
Daniel Jasper01786732013-02-04 07:21:18 +0000775 return TT_UnaryOperator;
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000776 if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
Daniel Jasper01786732013-02-04 07:21:18 +0000777 return TT_TrailingUnaryOperator;
778
779 return TT_UnaryOperator;
780 }
Daniel Jasper4e778092013-02-06 10:05:46 +0000781
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000782 // FIXME: This is copy&pasted from Sema. Put it in a common place and remove
783 // duplication.
784 /// \brief Determine whether the token kind starts a simple-type-specifier.
Manuel Klimekb3987012013-05-29 14:47:47 +0000785 bool isSimpleTypeSpecifier(const FormatToken &Tok) const {
786 switch (Tok.Tok.getKind()) {
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000787 case tok::kw_short:
788 case tok::kw_long:
789 case tok::kw___int64:
790 case tok::kw___int128:
791 case tok::kw_signed:
792 case tok::kw_unsigned:
793 case tok::kw_void:
794 case tok::kw_char:
795 case tok::kw_int:
796 case tok::kw_half:
797 case tok::kw_float:
798 case tok::kw_double:
799 case tok::kw_wchar_t:
800 case tok::kw_bool:
801 case tok::kw___underlying_type:
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000802 case tok::annot_typename:
803 case tok::kw_char16_t:
804 case tok::kw_char32_t:
805 case tok::kw_typeof:
806 case tok::kw_decltype:
Alexander Kornienko00895102013-06-05 14:09:10 +0000807 return true;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000808 default:
Alexander Kornienko00895102013-06-05 14:09:10 +0000809 return false;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000810 }
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000811 }
812
Daniel Jasper4e778092013-02-06 10:05:46 +0000813 SmallVector<Context, 8> Contexts;
814
Daniel Jasper4e778092013-02-06 10:05:46 +0000815 AnnotatedLine &Line;
Manuel Klimekb3987012013-05-29 14:47:47 +0000816 FormatToken *CurrentToken;
Daniel Jasper4e778092013-02-06 10:05:46 +0000817 bool KeywordVirtualFound;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000818 bool NameFound;
Daniel Jasper2ca37412013-07-09 14:36:48 +0000819 bool AutoFound;
Nico Weberc2e6d2a2013-02-11 15:32:15 +0000820 IdentifierInfo &Ident_in;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000821};
822
Daniel Jasper29f123b2013-02-08 15:28:42 +0000823/// \brief Parses binary expressions by inserting fake parenthesis based on
824/// operator precedence.
825class ExpressionParser {
826public:
Daniel Jasper9acb8b42013-06-06 09:11:58 +0000827 ExpressionParser(AnnotatedLine &Line) : Current(Line.First) {
828 // Skip leading "}", e.g. in "} else if (...) {".
829 if (Current->is(tok::r_brace))
830 next();
831 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000832
833 /// \brief Parse expressions with the given operatore precedence.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000834 void parse(int Precedence = 0) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000835 // Conditional expressions need to be parsed separately for proper nesting.
836 if (Precedence == prec::Conditional + 1) {
837 parseConditionalExpr();
838 return;
839 }
Daniel Jasper29f123b2013-02-08 15:28:42 +0000840 if (Precedence > prec::PointerToMember || Current == NULL)
841 return;
842
Manuel Klimekb3987012013-05-29 14:47:47 +0000843 FormatToken *Start = Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000844 bool OperatorFound = false;
845
Daniel Jasper237d4c12013-02-23 21:01:55 +0000846 while (Current) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000847 // Consume operators with higher precedence.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000848 parse(Precedence + 1);
Daniel Jasper29f123b2013-02-08 15:28:42 +0000849
Daniel Jasper237d4c12013-02-23 21:01:55 +0000850 int CurrentPrecedence = 0;
851 if (Current) {
852 if (Current->Type == TT_ConditionalExpr)
Daniel Jasperb8b42952013-05-31 16:14:28 +0000853 CurrentPrecedence = 1 + (int)prec::Conditional;
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000854 else if (Current->is(tok::semi) || Current->Type == TT_InlineASMColon)
Daniel Jasper237d4c12013-02-23 21:01:55 +0000855 CurrentPrecedence = 1;
856 else if (Current->Type == TT_BinaryOperator || Current->is(tok::comma))
Daniel Jasperb8b42952013-05-31 16:14:28 +0000857 CurrentPrecedence = 1 + (int)Current->getPrecedence();
Daniel Jasper237d4c12013-02-23 21:01:55 +0000858 }
859
Daniel Jasper29f123b2013-02-08 15:28:42 +0000860 // At the end of the line or when an operator with higher precedence is
861 // found, insert fake parenthesis and return.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000862 if (Current == NULL || Current->closesScope() ||
Daniel Jasper237d4c12013-02-23 21:01:55 +0000863 (CurrentPrecedence != 0 && CurrentPrecedence < Precedence)) {
Daniel Jasperc01897c2013-05-31 14:56:12 +0000864 if (OperatorFound)
865 addFakeParenthesis(Start, prec::Level(Precedence - 1));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000866 return;
867 }
868
869 // Consume scopes: (), [], <> and {}
Daniel Jasperac3223e2013-04-10 09:49:49 +0000870 if (Current->opensScope()) {
871 while (Current && !Current->closesScope()) {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000872 next();
873 parse();
874 }
875 next();
876 } else {
877 // Operator found.
Daniel Jasper237d4c12013-02-23 21:01:55 +0000878 if (CurrentPrecedence == Precedence)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000879 OperatorFound = true;
880
881 next();
882 }
883 }
884 }
885
886private:
Daniel Jasperc01897c2013-05-31 14:56:12 +0000887 void addFakeParenthesis(FormatToken *Start, prec::Level Precedence) {
888 Start->FakeLParens.push_back(Precedence);
889 if (Current)
890 ++Current->Previous->FakeRParens;
891 }
892
893 void parseConditionalExpr() {
894 FormatToken *Start = Current;
895 parse(prec::LogicalOr + 1);
896 if (!Current || !Current->is(tok::question))
897 return;
898 next();
899 parse(prec::LogicalOr + 1);
900 if (!Current || Current->Type != TT_ConditionalExpr)
901 return;
902 next();
903 parseConditionalExpr();
904 addFakeParenthesis(Start, prec::Conditional);
905 }
906
Daniel Jasper29f123b2013-02-08 15:28:42 +0000907 void next() {
Alexander Kornienkod71b15b2013-06-17 13:19:53 +0000908 if (Current)
909 Current = Current->Next;
910 while (Current && Current->isTrailingComment())
Manuel Klimekb3987012013-05-29 14:47:47 +0000911 Current = Current->Next;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000912 }
913
Manuel Klimekb3987012013-05-29 14:47:47 +0000914 FormatToken *Current;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000915};
916
Craig Topper14e66492013-07-01 04:03:19 +0000917} // end anonymous namespace
918
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000919void TokenAnnotator::annotate(AnnotatedLine &Line) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000920 AnnotatingParser Parser(Line, Ident_in);
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000921 Line.Type = Parser.parseLine();
922 if (Line.Type == LT_Invalid)
923 return;
924
Daniel Jasper29f123b2013-02-08 15:28:42 +0000925 ExpressionParser ExprParser(Line);
926 ExprParser.parse();
927
Manuel Klimekb3987012013-05-29 14:47:47 +0000928 if (Line.First->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000929 Line.Type = LT_ObjCMethodDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000930 else if (Line.First->Type == TT_ObjCDecl)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000931 Line.Type = LT_ObjCDecl;
Manuel Klimekb3987012013-05-29 14:47:47 +0000932 else if (Line.First->Type == TT_ObjCProperty)
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000933 Line.Type = LT_ObjCProperty;
934
Manuel Klimekb3987012013-05-29 14:47:47 +0000935 Line.First->SpacesRequiredBefore = 1;
936 Line.First->CanBreakBefore = Line.First->MustBreakBefore;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000937}
938
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000939void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000940 Line.First->TotalLength = Line.First->CodePointCount;
Manuel Klimekb3987012013-05-29 14:47:47 +0000941 if (!Line.First->Next)
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000942 return;
Manuel Klimekb3987012013-05-29 14:47:47 +0000943 FormatToken *Current = Line.First->Next;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000944 while (Current != NULL) {
Daniel Jasper729a7432013-02-11 12:36:37 +0000945 if (Current->Type == TT_LineComment)
946 Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
947 else
948 Current->SpacesRequiredBefore =
949 spaceRequiredBefore(Line, *Current) ? 1 : 0;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000950
Daniel Jasper561211d2013-07-16 20:28:33 +0000951 if (Current->is(tok::comment)) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000952 Current->MustBreakBefore = Current->NewlinesBefore > 0;
953 } else if (Current->Previous->isTrailingComment() ||
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000954 (Current->is(tok::string_literal) &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000955 Current->Previous->is(tok::string_literal))) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000956 Current->MustBreakBefore = true;
Daniel Jasper561211d2013-07-16 20:28:33 +0000957 } else if (Current->Previous->IsUnterminatedLiteral) {
958 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000959 } else if (Current->is(tok::lessless) && Current->Next &&
960 Current->Previous->is(tok::string_literal) &&
961 Current->Next->is(tok::string_literal)) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000962 Current->MustBreakBefore = true;
Manuel Klimekb3987012013-05-29 14:47:47 +0000963 } else if (Current->Previous->ClosesTemplateDeclaration &&
Daniel Jasperbbc87762013-05-29 12:07:31 +0000964 Style.AlwaysBreakTemplateDeclarations) {
965 Current->MustBreakBefore = true;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000966 }
967 Current->CanBreakBefore =
968 Current->MustBreakBefore || canBreakBefore(Line, *Current);
Daniel Jasper215c57f2013-07-17 15:38:19 +0000969 if (Current->MustBreakBefore ||
970 (Current->is(tok::string_literal) &&
971 Current->TokenText.find("\\\n") != StringRef::npos))
Manuel Klimekb3987012013-05-29 14:47:47 +0000972 Current->TotalLength = Current->Previous->TotalLength + Style.ColumnLimit;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000973 else
Daniel Jasper2a409b62013-07-08 14:34:09 +0000974 Current->TotalLength = Current->Previous->TotalLength +
975 Current->CodePointCount +
976 Current->SpacesRequiredBefore;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000977 // FIXME: Only calculate this if CanBreakBefore is true once static
978 // initializers etc. are sorted out.
979 // FIXME: Move magic numbers to a better place.
980 Current->SplitPenalty =
981 20 * Current->BindingStrength + splitPenalty(Line, *Current);
982
Manuel Klimekb3987012013-05-29 14:47:47 +0000983 Current = Current->Next;
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000984 }
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000985
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000986 calculateUnbreakableTailLengths(Line);
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000987 DEBUG({
988 printDebugInfo(Line);
989 });
Daniel Jasper32d28ee2013-01-29 21:01:14 +0000990}
991
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000992void TokenAnnotator::calculateUnbreakableTailLengths(AnnotatedLine &Line) {
993 unsigned UnbreakableTailLength = 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000994 FormatToken *Current = Line.Last;
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000995 while (Current != NULL) {
996 Current->UnbreakableTailLength = UnbreakableTailLength;
997 if (Current->CanBreakBefore ||
998 Current->isOneOf(tok::comment, tok::string_literal)) {
999 UnbreakableTailLength = 0;
1000 } else {
1001 UnbreakableTailLength +=
Alexander Kornienko00895102013-06-05 14:09:10 +00001002 Current->CodePointCount + Current->SpacesRequiredBefore;
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001003 }
Manuel Klimekb3987012013-05-29 14:47:47 +00001004 Current = Current->Previous;
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001005 }
1006}
1007
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001008unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001009 const FormatToken &Tok) {
1010 const FormatToken &Left = *Tok.Previous;
1011 const FormatToken &Right = Tok;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001012
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001013 if (Left.is(tok::semi))
1014 return 0;
1015 if (Left.is(tok::comma))
1016 return 1;
Daniel Jasper011c35d2013-07-12 11:19:37 +00001017 if (Right.is(tok::l_square))
1018 return 150;
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001019
Daniel Jasper6561f6a2013-07-09 07:43:55 +00001020 if (Right.Type == TT_StartOfName || Right.is(tok::kw_operator)) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001021 if (Line.First->is(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
Daniel Jasper3c08a812013-02-24 18:54:32 +00001022 return 3;
Daniel Jasperc18cff32013-07-11 12:34:23 +00001023 if (Left.Type == TT_StartOfName)
1024 return 20;
Daniel Jasper3c08a812013-02-24 18:54:32 +00001025 else if (Line.MightBeFunctionDecl && Right.BindingStrength == 1)
1026 // FIXME: Clean up hack of using BindingStrength to find top-level names.
1027 return Style.PenaltyReturnTypeOnItsOwnLine;
1028 else
Daniel Jasper1407bee2013-04-11 14:29:13 +00001029 return 200;
Daniel Jasper3c08a812013-02-24 18:54:32 +00001030 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001031 if (Left.is(tok::equal) && Right.is(tok::l_brace))
1032 return 150;
Daniel Jasper198c8bf2013-07-05 07:58:34 +00001033 if (Left.Type == TT_CastRParen)
1034 return 100;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001035 if (Left.is(tok::coloncolon))
1036 return 500;
Daniel Jasper6b119d62013-04-05 17:22:09 +00001037 if (Left.isOneOf(tok::kw_class, tok::kw_struct))
1038 return 5000;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001039
Daniel Jasper6cabab42013-02-14 08:42:54 +00001040 if (Left.Type == TT_RangeBasedForLoopColon ||
1041 Left.Type == TT_InheritanceColon)
Daniel Jasper84a1a632013-02-26 13:18:08 +00001042 return 2;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001043
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001044 if (Right.isOneOf(tok::arrow, tok::period) &&
1045 Right.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper515f65d2013-02-18 13:24:21 +00001046 if (Line.Type == LT_BuilderTypeCall)
Daniel Jasper6a365aa2013-03-13 17:13:53 +00001047 return prec::PointerToMember;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001048 if (Left.isOneOf(tok::r_paren, tok::r_square) && Left.MatchingParen &&
1049 Left.MatchingParen->ParameterCount > 0)
Daniel Jasper518ee342013-02-26 13:59:14 +00001050 return 20; // Should be smaller than breaking at a nested comma.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001051 return 150;
1052 }
1053
Daniel Jasper20a0f8c2013-07-11 21:02:56 +00001054 // Breaking before a trailing 'const' or not-function-like annotation is bad.
1055 if (Left.is(tok::r_paren) &&
1056 (Right.is(tok::kw_const) || (Right.is(tok::identifier) && Right.Next &&
1057 Right.Next->isNot(tok::l_paren))))
Daniel Jasper5ad72bb2013-05-22 08:28:26 +00001058 return 150;
1059
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001060 // In for-loops, prefer breaking at ',' and ';'.
Manuel Klimekb3987012013-05-29 14:47:47 +00001061 if (Line.First->is(tok::kw_for) && Left.is(tok::equal))
Daniel Jasper7d812812013-02-21 15:00:29 +00001062 return 4;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001063
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001064 // In Objective-C method expressions, prefer breaking before "param:" over
1065 // breaking after it.
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001066 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001067 return 0;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001068 if (Left.is(tok::colon) && Left.Type == TT_ObjCMethodExpr)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001069 return 20;
1070
Daniel Jasper1407bee2013-04-11 14:29:13 +00001071 if (Left.is(tok::l_paren) && Line.MightBeFunctionDecl)
1072 return 100;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001073 if (Left.opensScope())
Daniel Jasper64f09282013-03-20 13:53:11 +00001074 return Left.ParameterCount > 1 ? prec::Comma : 20;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001075
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001076 if (Right.is(tok::lessless)) {
1077 if (Left.is(tok::string_literal)) {
Alexander Kornienko00895102013-06-05 14:09:10 +00001078 StringRef Content = Left.TokenText;
Daniel Jasperbfa1edd2013-03-14 14:00:17 +00001079 Content = Content.drop_back(1).drop_front(1).trim();
1080 if (Content.size() > 1 &&
1081 (Content.back() == ':' || Content.back() == '='))
Daniel Jasper9637dda2013-07-15 14:33:14 +00001082 return 25;
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001083 }
Daniel Jasper0c368782013-07-15 15:04:42 +00001084 return 1; // Breaking at a << is really cheap.
Daniel Jasper4e8a7b42013-02-06 21:04:05 +00001085 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001086 if (Left.Type == TT_ConditionalExpr)
Daniel Jasper518ee342013-02-26 13:59:14 +00001087 return prec::Conditional;
Manuel Klimekb3987012013-05-29 14:47:47 +00001088 prec::Level Level = Left.getPrecedence();
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001089
1090 if (Level != prec::Unknown)
1091 return Level;
Daniel Jasper24849712013-03-01 16:48:32 +00001092
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001093 return 3;
1094}
1095
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001096bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001097 const FormatToken &Left,
1098 const FormatToken &Right) {
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001099 if (Right.is(tok::hashhash))
1100 return Left.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001101 if (Left.isOneOf(tok::hashhash, tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001102 return Right.is(tok::hash);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001103 if (Right.isOneOf(tok::r_paren, tok::semi, tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001104 return false;
1105 if (Right.is(tok::less) &&
1106 (Left.is(tok::kw_template) ||
1107 (Line.Type == LT_ObjCDecl && Style.ObjCSpaceBeforeProtocolList)))
1108 return true;
1109 if (Left.is(tok::arrow) || Right.is(tok::arrow))
1110 return false;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001111 if (Left.isOneOf(tok::exclaim, tok::tilde))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001112 return false;
1113 if (Left.is(tok::at) &&
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001114 Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
1115 tok::numeric_constant, tok::l_paren, tok::l_brace,
1116 tok::kw_true, tok::kw_false))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001117 return false;
1118 if (Left.is(tok::coloncolon))
1119 return false;
1120 if (Right.is(tok::coloncolon))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001121 return !Left.isOneOf(tok::identifier, tok::greater, tok::l_paren);
1122 if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001123 return false;
Daniel Jasperc47d7f12013-07-01 09:47:25 +00001124 if (Right.is(tok::ellipsis))
1125 return false;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001126 if (Right.Type == TT_PointerOrReference)
Manuel Klimekb3987012013-05-29 14:47:47 +00001127 return Left.Tok.isLiteral() ||
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001128 ((Left.Type != TT_PointerOrReference) && Left.isNot(tok::l_paren) &&
1129 !Style.PointerBindsToType);
Daniel Jasper3ff4a2f2013-05-28 15:27:10 +00001130 if (Right.Type == TT_FunctionTypeLParen && Left.isNot(tok::l_paren) &&
Daniel Jasper395228f2013-05-08 14:58:20 +00001131 (Left.Type != TT_PointerOrReference || Style.PointerBindsToType))
1132 return true;
Alexander Kornienko3fd9ccd2013-03-12 16:28:18 +00001133 if (Left.Type == TT_PointerOrReference)
Daniel Jasper3a1847e2013-07-01 09:34:09 +00001134 return Right.Tok.isLiteral() || Right.Type == TT_BlockComment ||
Daniel Jasper9322aae2013-03-20 09:53:18 +00001135 ((Right.Type != TT_PointerOrReference) &&
Daniel Jasper81d2d382013-04-01 17:13:26 +00001136 Right.isNot(tok::l_paren) && Style.PointerBindsToType &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001137 Left.Previous &&
1138 !Left.Previous->isOneOf(tok::l_paren, tok::coloncolon));
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001139 if (Right.is(tok::star) && Left.is(tok::l_paren))
1140 return false;
Nico Weber051860e2013-02-10 02:08:05 +00001141 if (Left.is(tok::l_square))
1142 return Left.Type == TT_ObjCArrayLiteral && Right.isNot(tok::r_square);
1143 if (Right.is(tok::r_square))
1144 return Right.Type == TT_ObjCArrayLiteral;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001145 if (Right.is(tok::l_square) && Right.Type != TT_ObjCMethodExpr)
1146 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001147 if (Left.is(tok::colon))
1148 return Left.Type != TT_ObjCMethodExpr;
1149 if (Right.is(tok::colon))
1150 return Right.Type != TT_ObjCMethodExpr;
1151 if (Left.is(tok::l_paren))
1152 return false;
1153 if (Right.is(tok::l_paren)) {
Daniel Jaspere0fa4c52013-07-17 20:25:02 +00001154 if (Left.is(tok::r_paren) && Left.MatchingParen &&
1155 Left.MatchingParen->Previous &&
1156 Left.MatchingParen->Previous->is(tok::kw___attribute))
1157 return true;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001158 return Line.Type == LT_ObjCDecl ||
1159 Left.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
1160 tok::kw_return, tok::kw_catch, tok::kw_new,
Daniel Jasper454cb702013-05-03 14:50:50 +00001161 tok::kw_delete, tok::semi);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001162 }
Manuel Klimekb3987012013-05-29 14:47:47 +00001163 if (Left.is(tok::at) && Right.Tok.getObjCKeywordID() != tok::objc_not_keyword)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001164 return false;
1165 if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
Daniel Jasper2424eef2013-05-23 10:15:45 +00001166 return false; // No spaces in "{}".
1167 if (Left.is(tok::l_brace) || Right.is(tok::r_brace))
Daniel Jasperb5dc3f42013-07-16 18:22:10 +00001168 return !Style.Cpp11BracedListStyle;
Daniel Jasper1bee0732013-05-23 18:05:18 +00001169 if (Right.Type == TT_UnaryOperator)
1170 return !Left.isOneOf(tok::l_paren, tok::l_square, tok::at) &&
1171 (Left.isNot(tok::colon) || Left.Type != TT_ObjCMethodExpr);
Daniel Jasperce933562013-05-23 21:35:49 +00001172 if (Left.isOneOf(tok::identifier, tok::greater, tok::r_square) &&
Alexander Kornienko0bdc6432013-07-04 14:47:51 +00001173 Right.is(tok::l_brace) && Right.getNextNonComment())
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001174 return false;
Daniel Jasper5ad390d2013-05-28 11:30:49 +00001175 if (Left.is(tok::period) || Right.is(tok::period))
1176 return false;
Nico Weber861576b2013-06-26 00:15:19 +00001177 if (Left.Type == TT_BlockComment && Left.TokenText.endswith("=*/"))
1178 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001179 return true;
1180}
1181
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001182bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001183 const FormatToken &Tok) {
1184 if (Tok.Tok.getIdentifierInfo() && Tok.Previous->Tok.getIdentifierInfo())
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001185 return true; // Never ever merge two identifiers.
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001186 if (Line.Type == LT_ObjCMethodDecl) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001187 if (Tok.Previous->Type == TT_ObjCMethodSpecifier)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001188 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001189 if (Tok.Previous->is(tok::r_paren) && Tok.is(tok::identifier))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001190 // Don't space between ')' and <id>
1191 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001192 }
1193 if (Line.Type == LT_ObjCProperty &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001194 (Tok.is(tok::equal) || Tok.Previous->is(tok::equal)))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001195 return false;
1196
Daniel Jasper2ca37412013-07-09 14:36:48 +00001197 if (Tok.Type == TT_TrailingReturnArrow ||
1198 Tok.Previous->Type == TT_TrailingReturnArrow)
1199 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001200 if (Tok.Previous->is(tok::comma))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001201 return true;
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001202 if (Tok.is(tok::comma))
1203 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001204 if (Tok.Type == TT_CtorInitializerColon || Tok.Type == TT_ObjCBlockLParen)
1205 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001206 if (Tok.Previous->Tok.is(tok::kw_operator))
Daniel Jasper2b4c9242013-02-11 08:01:18 +00001207 return false;
1208 if (Tok.Type == TT_OverloadedOperatorLParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001209 return false;
1210 if (Tok.is(tok::colon))
Manuel Klimekb3987012013-05-29 14:47:47 +00001211 return !Line.First->isOneOf(tok::kw_case, tok::kw_default) &&
Alexander Kornienko0bdc6432013-07-04 14:47:51 +00001212 Tok.getNextNonComment() != NULL && Tok.Type != TT_ObjCMethodExpr;
Manuel Klimekb3987012013-05-29 14:47:47 +00001213 if (Tok.Previous->Type == TT_UnaryOperator ||
1214 Tok.Previous->Type == TT_CastRParen)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001215 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001216 if (Tok.Previous->is(tok::greater) && Tok.is(tok::greater)) {
Daniel Jasper29f123b2013-02-08 15:28:42 +00001217 return Tok.Type == TT_TemplateCloser &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001218 Tok.Previous->Type == TT_TemplateCloser &&
Daniel Jasper29f123b2013-02-08 15:28:42 +00001219 Style.Standard != FormatStyle::LS_Cpp11;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001220 }
Alexander Kornienko54a38bd2013-03-20 16:41:56 +00001221 if (Tok.isOneOf(tok::arrowstar, tok::periodstar) ||
Manuel Klimekb3987012013-05-29 14:47:47 +00001222 Tok.Previous->isOneOf(tok::arrowstar, tok::periodstar))
Daniel Jasper9c3c7b32013-02-28 13:40:17 +00001223 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001224 if (Tok.Type == TT_BinaryOperator || Tok.Previous->Type == TT_BinaryOperator)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001225 return true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001226 if (Tok.Previous->Type == TT_TemplateCloser && Tok.is(tok::l_paren))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001227 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001228 if (Tok.is(tok::less) && Line.First->is(tok::hash))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001229 return true;
1230 if (Tok.Type == TT_TrailingUnaryOperator)
1231 return false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001232 return spaceRequiredBetween(Line, *Tok.Previous, Tok);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001233}
1234
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001235bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
Manuel Klimekb3987012013-05-29 14:47:47 +00001236 const FormatToken &Right) {
1237 const FormatToken &Left = *Right.Previous;
Daniel Jasper6561f6a2013-07-09 07:43:55 +00001238 if (Right.Type == TT_StartOfName || Right.is(tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001239 return true;
Nico Weberf2ff8122013-05-26 05:39:26 +00001240 if (Right.is(tok::colon) &&
1241 (Right.Type == TT_ObjCDictLiteral || Right.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001242 return false;
Nico Weberf2ff8122013-05-26 05:39:26 +00001243 if (Left.is(tok::colon) &&
1244 (Left.Type == TT_ObjCDictLiteral || Left.Type == TT_ObjCMethodExpr))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001245 return true;
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001246 if (Right.Type == TT_ObjCSelectorName)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001247 return true;
1248 if (Left.ClosesTemplateDeclaration)
1249 return true;
1250 if (Right.Type == TT_ConditionalExpr || Right.is(tok::question))
1251 return true;
Daniel Jasper6cabab42013-02-14 08:42:54 +00001252 if (Right.Type == TT_RangeBasedForLoopColon ||
Daniel Jasper27b91cc2013-04-05 17:21:59 +00001253 Right.Type == TT_OverloadedOperatorLParen)
Daniel Jasper6cabab42013-02-14 08:42:54 +00001254 return false;
Daniel Jasperc194c952013-05-06 06:45:09 +00001255 if (Left.Type == TT_RangeBasedForLoopColon)
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001256 return true;
Daniel Jasper7d812812013-02-21 15:00:29 +00001257 if (Right.Type == TT_RangeBasedForLoopColon)
1258 return false;
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001259 if (Left.Type == TT_PointerOrReference || Left.Type == TT_TemplateCloser ||
1260 Left.Type == TT_UnaryOperator || Left.Type == TT_ConditionalExpr ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001261 Left.isOneOf(tok::question, tok::kw_operator))
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001262 return false;
1263 if (Left.is(tok::equal) && Line.Type == LT_VirtualFunctionDecl)
1264 return false;
Daniel Jasper198c8bf2013-07-05 07:58:34 +00001265 if (Left.Previous) {
1266 if (Left.is(tok::l_paren) && Right.is(tok::l_paren) &&
1267 Left.Previous->is(tok::kw___attribute))
1268 return false;
Daniel Jasper2ca37412013-07-09 14:36:48 +00001269 if (Left.is(tok::l_paren) && (Left.Previous->Type == TT_BinaryOperator ||
1270 Left.Previous->is(tok::r_paren)))
Daniel Jasper198c8bf2013-07-05 07:58:34 +00001271 return false;
1272 }
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001273
Daniel Jasper65d2c382013-06-06 16:08:57 +00001274 if (Right.isTrailingComment())
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001275 // We rely on MustBreakBefore being set correctly here as we should not
1276 // change the "binding" behavior of a comment.
1277 return false;
1278
Daniel Jasper5ad72bb2013-05-22 08:28:26 +00001279 // We only break before r_brace if there was a corresponding break before
1280 // the l_brace, which is tracked by BreakBeforeClosingBrace.
1281 if (Right.isOneOf(tok::r_brace, tok::r_paren, tok::greater))
1282 return false;
1283
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001284 // Allow breaking after a trailing 'const', e.g. after a method declaration,
1285 // unless it is follow by ';', '{' or '='.
Manuel Klimekb3987012013-05-29 14:47:47 +00001286 if (Left.is(tok::kw_const) && Left.Previous != NULL &&
1287 Left.Previous->is(tok::r_paren))
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001288 return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001289
Daniel Jasper8ef19a22013-03-14 09:50:46 +00001290 if (Right.is(tok::kw___attribute))
1291 return true;
1292
Daniel Jasper3a204412013-02-23 07:46:38 +00001293 if (Left.is(tok::identifier) && Right.is(tok::string_literal))
1294 return true;
Daniel Jasperac3223e2013-04-10 09:49:49 +00001295 return (Left.isBinaryOperator() && Left.isNot(tok::lessless)) ||
Daniel Jasper6b119d62013-04-05 17:22:09 +00001296 Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace,
1297 tok::kw_class, tok::kw_struct) ||
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001298 Right.isOneOf(tok::lessless, tok::arrow, tok::period, tok::colon) ||
Daniel Jasper198c8bf2013-07-05 07:58:34 +00001299 (Left.is(tok::r_paren) &&
Daniel Jaspere033e872013-05-21 09:16:31 +00001300 Right.isOneOf(tok::identifier, tok::kw_const, tok::kw___attribute)) ||
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001301 (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
Daniel Jasper011c35d2013-07-12 11:19:37 +00001302 Right.is(tok::l_square);
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001303}
1304
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001305void TokenAnnotator::printDebugInfo(const AnnotatedLine &Line) {
1306 llvm::errs() << "AnnotatedTokens:\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001307 const FormatToken *Tok = Line.First;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001308 while (Tok) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001309 llvm::errs() << " M=" << Tok->MustBreakBefore
Daniel Jasperc7bd68f2013-07-10 14:02:49 +00001310 << " C=" << Tok->CanBreakBefore << " T=" << Tok->Type
1311 << " S=" << Tok->SpacesRequiredBefore
1312 << " P=" << Tok->SplitPenalty << " Name=" << Tok->Tok.getName()
1313 << " PPK=" << Tok->PackingKind << " FakeLParens=";
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001314 for (unsigned i = 0, e = Tok->FakeLParens.size(); i != e; ++i)
1315 llvm::errs() << Tok->FakeLParens[i] << "/";
1316 llvm::errs() << " FakeRParens=" << Tok->FakeRParens << "\n";
Manuel Klimekb3987012013-05-29 14:47:47 +00001317 Tok = Tok->Next;
Daniel Jasperbf71ba22013-04-08 20:33:42 +00001318 }
1319 llvm::errs() << "----\n";
1320}
1321
Daniel Jasper32d28ee2013-01-29 21:01:14 +00001322} // namespace format
1323} // namespace clang