Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 1 | //===--- ContinuationIndenter.cpp - Format C++ code -----------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | /// |
| 10 | /// \file |
| 11 | /// \brief This file implements the continuation indenter. |
| 12 | /// |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #define DEBUG_TYPE "format-formatter" |
| 16 | |
| 17 | #include "BreakableToken.h" |
| 18 | #include "ContinuationIndenter.h" |
| 19 | #include "WhitespaceManager.h" |
| 20 | #include "clang/Basic/OperatorPrecedence.h" |
| 21 | #include "clang/Basic/SourceManager.h" |
| 22 | #include "clang/Format/Format.h" |
| 23 | #include "llvm/Support/Debug.h" |
| 24 | #include <string> |
| 25 | |
| 26 | namespace clang { |
| 27 | namespace format { |
| 28 | |
| 29 | // Returns the length of everything up to the first possible line break after |
| 30 | // the ), ], } or > matching \c Tok. |
| 31 | static unsigned getLengthToMatchingParen(const FormatToken &Tok) { |
| 32 | if (Tok.MatchingParen == NULL) |
| 33 | return 0; |
| 34 | FormatToken *End = Tok.MatchingParen; |
| 35 | while (End->Next && !End->Next->CanBreakBefore) { |
| 36 | End = End->Next; |
| 37 | } |
| 38 | return End->TotalLength - Tok.TotalLength + 1; |
| 39 | } |
| 40 | |
Daniel Jasper | b27c4b7 | 2013-08-27 11:09:05 +0000 | [diff] [blame] | 41 | // Returns \c true if \c Tok starts a binary expression. |
| 42 | static bool startsBinaryExpression(const FormatToken &Tok) { |
| 43 | for (unsigned i = 0, e = Tok.FakeLParens.size(); i != e; ++i) { |
| 44 | if (Tok.FakeLParens[i] > prec::Unknown) |
| 45 | return true; |
| 46 | } |
| 47 | return false; |
| 48 | } |
| 49 | |
Daniel Jasper | 4c6e005 | 2013-08-27 14:24:43 +0000 | [diff] [blame] | 50 | // Returns \c true if \c Tok is the "." or "->" of a call and starts the next |
| 51 | // segment of a builder type call. |
| 52 | static bool startsSegmentOfBuilderTypeCall(const FormatToken &Tok) { |
| 53 | return Tok.isMemberAccess() && Tok.Previous && Tok.Previous->closesScope(); |
| 54 | } |
| 55 | |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 56 | ContinuationIndenter::ContinuationIndenter(const FormatStyle &Style, |
| 57 | SourceManager &SourceMgr, |
| 58 | const AnnotatedLine &Line, |
| 59 | unsigned FirstIndent, |
| 60 | WhitespaceManager &Whitespaces, |
| 61 | encoding::Encoding Encoding, |
| 62 | bool BinPackInconclusiveFunctions) |
| 63 | : Style(Style), SourceMgr(SourceMgr), Line(Line), FirstIndent(FirstIndent), |
| 64 | Whitespaces(Whitespaces), Encoding(Encoding), |
| 65 | BinPackInconclusiveFunctions(BinPackInconclusiveFunctions) {} |
| 66 | |
| 67 | LineState ContinuationIndenter::getInitialState() { |
| 68 | // Initialize state dependent on indent. |
| 69 | LineState State; |
| 70 | State.Column = FirstIndent; |
| 71 | State.NextToken = Line.First; |
| 72 | State.Stack.push_back(ParenState(FirstIndent, FirstIndent, |
| 73 | /*AvoidBinPacking=*/false, |
| 74 | /*NoLineBreak=*/false)); |
| 75 | State.LineContainsContinuedForLoopSection = false; |
| 76 | State.ParenLevel = 0; |
| 77 | State.StartOfStringLiteral = 0; |
| 78 | State.StartOfLineLevel = State.ParenLevel; |
| 79 | State.LowestLevelOnLine = State.ParenLevel; |
| 80 | State.IgnoreStackForComparison = false; |
| 81 | |
| 82 | // The first token has already been indented and thus consumed. |
| 83 | moveStateToNextToken(State, /*DryRun=*/false, |
| 84 | /*Newline=*/false); |
| 85 | return State; |
| 86 | } |
| 87 | |
| 88 | bool ContinuationIndenter::canBreak(const LineState &State) { |
| 89 | const FormatToken &Current = *State.NextToken; |
| 90 | const FormatToken &Previous = *Current.Previous; |
| 91 | assert(&Previous == Current.Previous); |
| 92 | if (!Current.CanBreakBefore && |
| 93 | !(Current.is(tok::r_brace) && State.Stack.back().BreakBeforeClosingBrace)) |
| 94 | return false; |
| 95 | // The opening "{" of a braced list has to be on the same line as the first |
| 96 | // element if it is nested in another braced init list or function call. |
| 97 | if (!Current.MustBreakBefore && Previous.is(tok::l_brace) && |
| 98 | Previous.Previous && |
| 99 | Previous.Previous->isOneOf(tok::l_brace, tok::l_paren, tok::comma)) |
| 100 | return false; |
| 101 | // This prevents breaks like: |
| 102 | // ... |
| 103 | // SomeParameter, OtherParameter).DoSomething( |
| 104 | // ... |
| 105 | // As they hide "DoSomething" and are generally bad for readability. |
| 106 | if (Previous.opensScope() && State.LowestLevelOnLine < State.StartOfLineLevel) |
| 107 | return false; |
Daniel Jasper | 4c6e005 | 2013-08-27 14:24:43 +0000 | [diff] [blame] | 108 | if (Current.isMemberAccess() && State.Stack.back().ContainsUnwrappedBuilder) |
| 109 | return false; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 110 | return !State.Stack.back().NoLineBreak; |
| 111 | } |
| 112 | |
// Returns \c true if a line break is required before State.NextToken.
//
// The checks below are evaluated in order and the first one that matches
// decides the result; note that the constructor-initializer check can also
// decide early that no break is required.
bool ContinuationIndenter::mustBreak(const LineState &State) {
  const FormatToken &Current = *State.NextToken;
  const FormatToken &Previous = *Current.Previous;
  // Breaks demanded by the token itself and colons of inline assembly.
  if (Current.MustBreakBefore || Current.Type == TT_InlineASMColon)
    return true;
  // Outside of C++11 braced list style, a "}" whose level requested a break
  // before the closing brace goes onto its own line.
  if (!Style.Cpp11BracedListStyle && Current.is(tok::r_brace) &&
      State.Stack.back().BreakBeforeClosingBrace)
    return true;
  // After a ";" if the line contains a continued for-loop section.
  if (Previous.is(tok::semi) && State.LineContainsContinuedForLoopSection)
    return true;
  if (Style.BreakConstructorInitializersBeforeComma) {
    // With this style, the break goes before the initializer comma, never
    // after it.
    if (Previous.Type == TT_CtorInitializerComma)
      return false;
    if (Current.Type == TT_CtorInitializerComma)
      return true;
  }
  // If the current level requires a break before each parameter, break after
  // "," and ";", before "?" and before the parts of a conditional expression
  // (except for a ":" directly following a "?"), unless the current token is
  // a trailing comment or a closing ")" / "}".
  if ((Previous.isOneOf(tok::comma, tok::semi) || Current.is(tok::question) ||
       (Current.Type == TT_ConditionalExpr &&
        !(Current.is(tok::colon) && Previous.is(tok::question)))) &&
      State.Stack.back().BreakBeforeParameter && !Current.isTrailingComment() &&
      !Current.isOneOf(tok::r_paren, tok::r_brace))
    return true;
  if (Style.AlwaysBreakBeforeMultilineStrings &&
      State.Column > State.Stack.back().Indent && // Breaking saves columns.
      Previous.isNot(tok::lessless) && Previous.Type != TT_InlineASMColon &&
      NextIsMultilineString(State))
    return true;

  if (!Style.BreakBeforeBinaryOperators) {
    // If we need to break somewhere inside the LHS of a binary expression, we
    // should also break after the operator. Otherwise, the formatting would
    // hide the operator precedence, e.g. in:
    //   if (aaaaaaaaaaaaaa ==
    //           bbbbbbbbbbbbbb && c) {..
    // For comparisons, we only apply this rule, if the LHS is a binary
    // expression itself as otherwise, the line breaks seem superfluous.
    // We need special cases for ">>" which we have split into two ">" while
    // lexing in order to make template parsing easier.
    //
    // FIXME: We'll need something similar for styles that break before binary
    // operators.
    bool IsComparison = (Previous.getPrecedence() == prec::Relational ||
                         Previous.getPrecedence() == prec::Equality) &&
                        Previous.Previous &&
                        Previous.Previous->Type != TT_BinaryOperator; // For >>.
    bool LHSIsBinaryExpr =
        Previous.Previous && Previous.Previous->FakeRParens > 0;
    if (Previous.Type == TT_BinaryOperator &&
        (!IsComparison || LHSIsBinaryExpr) &&
        Current.Type != TT_BinaryOperator && // For >>.
        !Current.isTrailingComment() &&
        !Previous.isOneOf(tok::lessless, tok::question) &&
        Previous.getPrecedence() != prec::Assignment &&
        State.Stack.back().BreakBeforeParameter)
      return true;
  }

  // Same as above, but for the first "<<" operator.
  if (Current.is(tok::lessless) && State.Stack.back().BreakBeforeParameter &&
      State.Stack.back().FirstLessLess == 0)
    return true;

  // FIXME: Comparing LongestObjCSelectorName to 0 is a hacky way of finding
  // out whether it is the first parameter. Clean this up.
  if (Current.Type == TT_ObjCSelectorName &&
      Current.LongestObjCSelectorName == 0 &&
      State.Stack.back().BreakBeforeParameter)
    return true;
  // Always break before the ":" of a constructor initializer list and, on the
  // outermost paren level, after a token that closes a template declaration.
  if ((Current.Type == TT_CtorInitializerColon ||
       (Previous.ClosesTemplateDeclaration && State.ParenLevel == 0)))
    return true;

  // In a potential function declaration, break before the name (or the
  // "operator" keyword) on the outermost level if this level requires breaks
  // before parameters.
  if ((Current.Type == TT_StartOfName || Current.is(tok::kw_operator)) &&
      Line.MightBeFunctionDecl && State.Stack.back().BreakBeforeParameter &&
      State.ParenLevel == 0)
    return true;
  // Once a call continuation column has been recorded on this level, every
  // further builder-type call segment starts on its own line.
  if (startsSegmentOfBuilderTypeCall(Current) &&
      State.Stack.back().CallContinuation != 0)
    return true;
  return false;
}
| 194 | |
// Appends State.NextToken to \p State and advances the state past it.
//
// \param State       The line state to update in place.
// \param Newline     If \c true, the token is placed on a new line; otherwise
//                    it continues the current line.
// \param DryRun      If \c true, no whitespace replacements are recorded in
//                    the WhitespaceManager; only \p State is updated.
// \param ExtraSpaces Added to the token's SpacesRequiredBefore when the token
//                    stays on the current line.
// \returns The penalty accumulated for this decision plus the penalty
//          reported by moveStateToNextToken(). Implicit string literals (and
//          an empty stack) are passed through with a penalty of 0.
unsigned ContinuationIndenter::addTokenToState(LineState &State, bool Newline,
                                               bool DryRun,
                                               unsigned ExtraSpaces) {
  const FormatToken &Current = *State.NextToken;
  const FormatToken &Previous = *State.NextToken->Previous;

  // Extra penalty that needs to be added because of the way certain line
  // breaks are chosen.
  unsigned Penalty = 0;

  if (State.Stack.size() == 0 || Current.Type == TT_ImplicitStringLiteral) {
    // Keep the token where it is: advance the column by the width of the
    // original whitespace plus the token and skip all other bookkeeping.
    // FIXME: Is this correct?
    int WhitespaceLength = SourceMgr.getSpellingColumnNumber(
                               State.NextToken->WhitespaceRange.getEnd()) -
                           SourceMgr.getSpellingColumnNumber(
                               State.NextToken->WhitespaceRange.getBegin());
    State.Column += WhitespaceLength + State.NextToken->CodePointCount;
    State.NextToken = State.NextToken->Next;
    return 0;
  }

  // If we are continuing an expression, we want to indent an extra 4 spaces.
  unsigned ContinuationIndent =
      std::max(State.Stack.back().LastSpace, State.Stack.back().Indent) + 4;
  if (Newline) {
    // The first line break on any ParenLevel causes an extra penalty in order
    // to prefer similar line breaks.
    if (!State.Stack.back().ContainsLineBreak)
      Penalty += 15;
    State.Stack.back().ContainsLineBreak = true;

    Penalty += State.NextToken->SplitPenalty;

    // Breaking before the first "<<" is generally not desirable if the LHS is
    // short.
    if (Current.is(tok::lessless) && State.Stack.back().FirstLessLess == 0 &&
        State.Column <= Style.ColumnLimit / 2)
      Penalty += Style.PenaltyBreakFirstLessLess;

    // Determine the column at which the token starts on the new line. The
    // first matching case wins.
    if (Current.is(tok::r_brace)) {
      if (Current.BlockKind == BK_BracedInit)
        State.Column = State.Stack[State.Stack.size() - 2].LastSpace;
      else
        State.Column = FirstIndent;
    } else if (Current.is(tok::string_literal) &&
               State.StartOfStringLiteral != 0) {
      // Align with the string literal that started the sequence.
      State.Column = State.StartOfStringLiteral;
      State.Stack.back().BreakBeforeParameter = true;
    } else if (Current.is(tok::lessless) &&
               State.Stack.back().FirstLessLess != 0) {
      // Align with the first "<<" on this level.
      State.Column = State.Stack.back().FirstLessLess;
    } else if (Current.isMemberAccess()) {
      // The first wrapped member access fixes the column that all later ones
      // on this level reuse.
      if (State.Stack.back().CallContinuation == 0) {
        State.Column = ContinuationIndent;
        State.Stack.back().CallContinuation = State.Column;
      } else {
        State.Column = State.Stack.back().CallContinuation;
      }
    } else if (Current.Type == TT_ConditionalExpr) {
      State.Column = State.Stack.back().QuestionColumn;
    } else if (Previous.is(tok::comma) && State.Stack.back().VariablePos != 0) {
      State.Column = State.Stack.back().VariablePos;
    } else if (Previous.ClosesTemplateDeclaration ||
               ((Current.Type == TT_StartOfName ||
                 Current.is(tok::kw_operator)) &&
                State.ParenLevel == 0 &&
                (!Style.IndentFunctionDeclarationAfterType ||
                 Line.StartsDefinition))) {
      State.Column = State.Stack.back().Indent;
    } else if (Current.Type == TT_ObjCSelectorName) {
      // Right-align the selector name against the recorded colon position if
      // it fits; otherwise start at the indent and record a new colon
      // position.
      if (State.Stack.back().ColonPos > Current.CodePointCount) {
        State.Column = State.Stack.back().ColonPos - Current.CodePointCount;
      } else {
        State.Column = State.Stack.back().Indent;
        State.Stack.back().ColonPos = State.Column + Current.CodePointCount;
      }
    } else if (Current.is(tok::l_square) && Current.Type != TT_ObjCMethodExpr) {
      if (State.Stack.back().StartOfArraySubscripts != 0)
        State.Column = State.Stack.back().StartOfArraySubscripts;
      else
        State.Column = ContinuationIndent;
    } else if (Current.Type == TT_StartOfName ||
               Previous.isOneOf(tok::coloncolon, tok::equal) ||
               Previous.Type == TT_ObjCMethodExpr) {
      State.Column = ContinuationIndent;
    } else if (Current.Type == TT_CtorInitializerColon) {
      State.Column = FirstIndent + Style.ConstructorInitializerIndentWidth;
    } else if (Current.Type == TT_CtorInitializerComma) {
      State.Column = State.Stack.back().Indent;
    } else {
      State.Column = State.Stack.back().Indent;
      // Ensure that we fall back to indenting 4 spaces instead of just
      // flushing continuations left.
      if (State.Column == FirstIndent)
        State.Column += 4;
    }

    // Update whether subsequent parameters on this level must be broken.
    if (Current.is(tok::question))
      State.Stack.back().BreakBeforeParameter = true;
    if ((Previous.isOneOf(tok::comma, tok::semi) &&
         !State.Stack.back().AvoidBinPacking) ||
        Previous.Type == TT_BinaryOperator)
      State.Stack.back().BreakBeforeParameter = false;
    if (Previous.Type == TT_TemplateCloser && State.ParenLevel == 0)
      State.Stack.back().BreakBeforeParameter = false;

    if (!DryRun) {
      // Emit the line break. Comments may keep empty lines in front of them,
      // limited by MaxEmptyLinesToKeep.
      unsigned NewLines = 1;
      if (Current.is(tok::comment))
        NewLines = std::max(NewLines, std::min(Current.NewlinesBefore,
                                               Style.MaxEmptyLinesToKeep + 1));
      Whitespaces.replaceWhitespace(Current, NewLines, State.Column,
                                    State.Column, Line.InPPDirective);
    }

    if (!Current.isTrailingComment())
      State.Stack.back().LastSpace = State.Column;
    if (Current.isMemberAccess())
      State.Stack.back().LastSpace += Current.CodePointCount;
    // A new line starts here, so restart the per-line level tracking.
    State.StartOfLineLevel = State.ParenLevel;
    State.LowestLevelOnLine = State.ParenLevel;

    // Any break on this level means that the parent level has been broken
    // and we need to avoid bin packing there.
    for (unsigned i = 0, e = State.Stack.size() - 1; i != e; ++i) {
      State.Stack[i].BreakBeforeParameter = true;
    }
    const FormatToken *TokenBefore = Current.getPreviousNonComment();
    if (TokenBefore && !TokenBefore->isOneOf(tok::comma, tok::semi) &&
        TokenBefore->Type != TT_TemplateCloser &&
        TokenBefore->Type != TT_BinaryOperator && !TokenBefore->opensScope())
      State.Stack.back().BreakBeforeParameter = true;

    // If we break after {, we should also break before the corresponding }.
    if (Previous.is(tok::l_brace))
      State.Stack.back().BreakBeforeClosingBrace = true;

    if (State.Stack.back().AvoidBinPacking) {
      // If we are breaking after '(', '{', '<', this is not bin packing
      // unless AllowAllParametersOfDeclarationOnNextLine is false.
      if (!(Previous.isOneOf(tok::l_paren, tok::l_brace) ||
            Previous.Type == TT_BinaryOperator) ||
          (!Style.AllowAllParametersOfDeclarationOnNextLine &&
           Line.MustBeDeclaration))
        State.Stack.back().BreakBeforeParameter = true;
    }

  } else {
    // The token stays on the current line.
    if (Current.is(tok::equal) &&
        (Line.First->is(tok::kw_for) || State.ParenLevel == 0) &&
        State.Stack.back().VariablePos == 0) {
      // Record where the variable left of the first "=" starts.
      State.Stack.back().VariablePos = State.Column;
      // Move over * and & if they are bound to the variable name.
      const FormatToken *Tok = &Previous;
      while (Tok && State.Stack.back().VariablePos >= Tok->CodePointCount) {
        State.Stack.back().VariablePos -= Tok->CodePointCount;
        if (Tok->SpacesRequiredBefore != 0)
          break;
        Tok = Tok->Previous;
      }
      if (Previous.PartOfMultiVariableDeclStmt)
        State.Stack.back().LastSpace = State.Stack.back().VariablePos;
    }

    unsigned Spaces = State.NextToken->SpacesRequiredBefore + ExtraSpaces;

    if (!DryRun)
      Whitespaces.replaceWhitespace(Current, 0, Spaces, State.Column + Spaces);

    // The first ObjC selector name on this level determines the colon
    // position: the larger of "indent + longest selector name" and the end of
    // this selector name.
    if (Current.Type == TT_ObjCSelectorName &&
        State.Stack.back().ColonPos == 0) {
      if (State.Stack.back().Indent + Current.LongestObjCSelectorName >
          State.Column + Spaces + Current.CodePointCount)
        State.Stack.back().ColonPos =
            State.Stack.back().Indent + Current.LongestObjCSelectorName;
      else
        State.Stack.back().ColonPos =
            State.Column + Spaces + Current.CodePointCount;
    }

    // The first token after an opening bracket sets the indent of that level.
    if (Previous.opensScope() && Previous.Type != TT_ObjCMethodExpr &&
        Current.Type != TT_LineComment)
      State.Stack.back().Indent = State.Column + Spaces;
    // When bin packing is to be avoided, putting a parameter after a "," on
    // the same line forbids any further line breaks on this level.
    if (Previous.is(tok::comma) && !Current.isTrailingComment() &&
        State.Stack.back().AvoidBinPacking)
      State.Stack.back().NoLineBreak = true;
    if (startsSegmentOfBuilderTypeCall(Current))
      State.Stack.back().ContainsUnwrappedBuilder = true;

    State.Column += Spaces;
    if (Current.is(tok::l_paren) && Previous.isOneOf(tok::kw_if, tok::kw_for))
      // Treat the condition inside an if as if it was a second function
      // parameter, i.e. let nested calls have an indent of 4.
      State.Stack.back().LastSpace = State.Column + 1; // 1 is length of "(".
    else if (Previous.is(tok::comma))
      State.Stack.back().LastSpace = State.Column;
    else if ((Previous.Type == TT_BinaryOperator ||
              Previous.Type == TT_ConditionalExpr ||
              Previous.Type == TT_UnaryOperator ||
              Previous.Type == TT_CtorInitializerColon) &&
             (Previous.getPrecedence() != prec::Assignment ||
              startsBinaryExpression(Current)))
      // Always indent relative to the RHS of the expression unless this is a
      // simple assignment without binary expression on the RHS. Also indent
      // relative to unary operators and the colons of constructor initializers.
      State.Stack.back().LastSpace = State.Column;
    else if (Previous.Type == TT_InheritanceColon)
      State.Stack.back().Indent = State.Column;
    else if (Previous.opensScope()) {
      // If a function has multiple parameters (including a single parameter
      // that is a binary expression) or a trailing call, indent all
      // parameters from the opening parenthesis. This avoids confusing
      // indents like:
      //   OuterFunction(InnerFunctionCall(
      //       ParameterToInnerFunction),
      //                 SecondParameterToOuterFunction);
      bool HasMultipleParameters = !Current.FakeLParens.empty();
      bool HasTrailingCall = false;
      if (Previous.MatchingParen) {
        const FormatToken *Next = Previous.MatchingParen->getNextNonComment();
        HasTrailingCall = Next && Next->isMemberAccess();
      }
      if (HasMultipleParameters ||
          (HasTrailingCall &&
           State.Stack[State.Stack.size() - 2].CallContinuation == 0))
        State.Stack.back().LastSpace = State.Column;
    }
  }

  return moveStateToNextToken(State, DryRun, Newline) + Penalty;
}
| 426 | |
| 427 | unsigned ContinuationIndenter::moveStateToNextToken(LineState &State, |
| 428 | bool DryRun, bool Newline) { |
| 429 | const FormatToken &Current = *State.NextToken; |
| 430 | assert(State.Stack.size()); |
| 431 | |
| 432 | if (Current.Type == TT_InheritanceColon) |
| 433 | State.Stack.back().AvoidBinPacking = true; |
| 434 | if (Current.is(tok::lessless) && State.Stack.back().FirstLessLess == 0) |
| 435 | State.Stack.back().FirstLessLess = State.Column; |
| 436 | if (Current.is(tok::l_square) && |
| 437 | State.Stack.back().StartOfArraySubscripts == 0) |
| 438 | State.Stack.back().StartOfArraySubscripts = State.Column; |
| 439 | if (Current.is(tok::question)) |
| 440 | State.Stack.back().QuestionColumn = State.Column; |
| 441 | if (!Current.opensScope() && !Current.closesScope()) |
| 442 | State.LowestLevelOnLine = |
| 443 | std::min(State.LowestLevelOnLine, State.ParenLevel); |
Daniel Jasper | 4c6e005 | 2013-08-27 14:24:43 +0000 | [diff] [blame] | 444 | if (Current.isMemberAccess()) |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 445 | State.Stack.back().StartOfFunctionCall = |
| 446 | Current.LastInChainOfCalls ? 0 : State.Column + Current.CodePointCount; |
| 447 | if (Current.Type == TT_CtorInitializerColon) { |
| 448 | // Indent 2 from the column, so: |
| 449 | // SomeClass::SomeClass() |
| 450 | // : First(...), ... |
| 451 | // Next(...) |
| 452 | // ^ line up here. |
| 453 | State.Stack.back().Indent = |
| 454 | State.Column + (Style.BreakConstructorInitializersBeforeComma ? 0 : 2); |
| 455 | if (Style.ConstructorInitializerAllOnOneLineOrOnePerLine) |
| 456 | State.Stack.back().AvoidBinPacking = true; |
| 457 | State.Stack.back().BreakBeforeParameter = false; |
| 458 | } |
| 459 | |
| 460 | // If return returns a binary expression, align after it. |
| 461 | if (Current.is(tok::kw_return) && !Current.FakeLParens.empty()) |
| 462 | State.Stack.back().LastSpace = State.Column + 7; |
| 463 | |
| 464 | // In ObjC method declaration we align on the ":" of parameters, but we need |
| 465 | // to ensure that we indent parameters on subsequent lines by at least 4. |
| 466 | if (Current.Type == TT_ObjCMethodSpecifier) |
| 467 | State.Stack.back().Indent += 4; |
| 468 | |
| 469 | // Insert scopes created by fake parenthesis. |
| 470 | const FormatToken *Previous = Current.getPreviousNonComment(); |
| 471 | // Don't add extra indentation for the first fake parenthesis after |
| 472 | // 'return', assignements or opening <({[. The indentation for these cases |
| 473 | // is special cased. |
| 474 | bool SkipFirstExtraIndent = |
| 475 | Current.is(tok::kw_return) || |
| 476 | (Previous && (Previous->opensScope() || |
| 477 | Previous->getPrecedence() == prec::Assignment)); |
| 478 | for (SmallVectorImpl<prec::Level>::const_reverse_iterator |
| 479 | I = Current.FakeLParens.rbegin(), |
| 480 | E = Current.FakeLParens.rend(); |
| 481 | I != E; ++I) { |
| 482 | ParenState NewParenState = State.Stack.back(); |
| 483 | NewParenState.ContainsLineBreak = false; |
| 484 | NewParenState.Indent = |
| 485 | std::max(std::max(State.Column, NewParenState.Indent), |
| 486 | State.Stack.back().LastSpace); |
| 487 | |
| 488 | // Always indent conditional expressions. Never indent expression where |
| 489 | // the 'operator' is ',', ';' or an assignment (i.e. *I <= |
| 490 | // prec::Assignment) as those have different indentation rules. Indent |
| 491 | // other expression, unless the indentation needs to be skipped. |
| 492 | if (*I == prec::Conditional || |
| 493 | (!SkipFirstExtraIndent && *I > prec::Assignment && |
| 494 | !Style.BreakBeforeBinaryOperators)) |
| 495 | NewParenState.Indent += 4; |
| 496 | if (Previous && !Previous->opensScope()) |
| 497 | NewParenState.BreakBeforeParameter = false; |
| 498 | State.Stack.push_back(NewParenState); |
| 499 | SkipFirstExtraIndent = false; |
| 500 | } |
| 501 | |
| 502 | // If we encounter an opening (, [, { or <, we add a level to our stacks to |
| 503 | // prepare for the following tokens. |
| 504 | if (Current.opensScope()) { |
| 505 | unsigned NewIndent; |
| 506 | unsigned LastSpace = State.Stack.back().LastSpace; |
| 507 | bool AvoidBinPacking; |
| 508 | if (Current.is(tok::l_brace)) { |
| 509 | NewIndent = |
| 510 | LastSpace + (Style.Cpp11BracedListStyle ? 4 : Style.IndentWidth); |
| 511 | const FormatToken *NextNoComment = Current.getNextNonComment(); |
| 512 | AvoidBinPacking = NextNoComment && |
| 513 | NextNoComment->Type == TT_DesignatedInitializerPeriod; |
| 514 | } else { |
| 515 | NewIndent = |
| 516 | 4 + std::max(LastSpace, State.Stack.back().StartOfFunctionCall); |
| 517 | AvoidBinPacking = !Style.BinPackParameters || |
| 518 | (Style.ExperimentalAutoDetectBinPacking && |
| 519 | (Current.PackingKind == PPK_OnePerLine || |
| 520 | (!BinPackInconclusiveFunctions && |
| 521 | Current.PackingKind == PPK_Inconclusive))); |
| 522 | } |
| 523 | |
| 524 | State.Stack.push_back(ParenState(NewIndent, LastSpace, AvoidBinPacking, |
| 525 | State.Stack.back().NoLineBreak)); |
| 526 | ++State.ParenLevel; |
| 527 | } |
| 528 | |
| 529 | // If this '[' opens an ObjC call, determine whether all parameters fit into |
| 530 | // one line and put one per line if they don't. |
| 531 | if (Current.is(tok::l_square) && Current.Type == TT_ObjCMethodExpr && |
| 532 | Current.MatchingParen != NULL) { |
| 533 | if (getLengthToMatchingParen(Current) + State.Column > getColumnLimit()) |
| 534 | State.Stack.back().BreakBeforeParameter = true; |
| 535 | } |
| 536 | |
| 537 | // If we encounter a closing ), ], } or >, we can remove a level from our |
| 538 | // stacks. |
Daniel Jasper | 96df37a | 2013-08-28 09:17:37 +0000 | [diff] [blame] | 539 | if (State.Stack.size() > 1 && |
| 540 | (Current.isOneOf(tok::r_paren, tok::r_square) || |
| 541 | (Current.is(tok::r_brace) && State.NextToken != Line.First) || |
| 542 | State.NextToken->Type == TT_TemplateCloser)) { |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 543 | State.Stack.pop_back(); |
| 544 | --State.ParenLevel; |
| 545 | } |
| 546 | if (Current.is(tok::r_square)) { |
| 547 | // If this ends the array subscript expr, reset the corresponding value. |
| 548 | const FormatToken *NextNonComment = Current.getNextNonComment(); |
| 549 | if (NextNonComment && NextNonComment->isNot(tok::l_square)) |
| 550 | State.Stack.back().StartOfArraySubscripts = 0; |
| 551 | } |
| 552 | |
| 553 | // Remove scopes created by fake parenthesis. |
| 554 | for (unsigned i = 0, e = Current.FakeRParens; i != e; ++i) { |
| 555 | unsigned VariablePos = State.Stack.back().VariablePos; |
| 556 | State.Stack.pop_back(); |
| 557 | State.Stack.back().VariablePos = VariablePos; |
| 558 | } |
| 559 | |
| 560 | if (Current.is(tok::string_literal) && State.StartOfStringLiteral == 0) { |
| 561 | State.StartOfStringLiteral = State.Column; |
| 562 | } else if (!Current.isOneOf(tok::comment, tok::identifier, tok::hash, |
| 563 | tok::string_literal)) { |
| 564 | State.StartOfStringLiteral = 0; |
| 565 | } |
| 566 | |
| 567 | State.Column += Current.CodePointCount; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 568 | State.NextToken = State.NextToken->Next; |
Daniel Jasper | b27c4b7 | 2013-08-27 11:09:05 +0000 | [diff] [blame] | 569 | unsigned Penalty = breakProtrudingToken(Current, State, DryRun); |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 570 | |
Daniel Jasper | 8de9ed0 | 2013-08-22 15:00:41 +0000 | [diff] [blame] | 571 | // If the previous has a special role, let it consume tokens as appropriate. |
| 572 | // It is necessary to start at the previous token for the only implemented |
| 573 | // role (comma separated list). That way, the decision whether or not to break |
| 574 | // after the "{" is already done and both options are tried and evaluated. |
| 575 | // FIXME: This is ugly, find a better way. |
| 576 | if (Previous && Previous->Role) |
| 577 | Penalty += Previous->Role->format(State, this, DryRun); |
| 578 | |
| 579 | return Penalty; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 580 | } |
| 581 | |
Alexander Kornienko | d7b837e | 2013-08-29 17:32:57 +0000 | [diff] [blame^] | 582 | unsigned |
| 583 | ContinuationIndenter::addMultilineStringLiteral(const FormatToken &Current, |
| 584 | LineState &State) { |
| 585 | StringRef Text = Current.TokenText; |
| 586 | // We can only affect layout of the first and the last line, so the penalty |
| 587 | // for all other lines is constant, and we ignore it. |
| 588 | size_t FirstLineBreak = Text.find('\n'); |
| 589 | size_t LastLineBreak = Text.find_last_of('\n'); |
| 590 | assert(FirstLineBreak != StringRef::npos); |
| 591 | unsigned StartColumn = State.Column - Current.CodePointCount; |
| 592 | State.Column = |
| 593 | encoding::getCodePointCount(Text.substr(LastLineBreak + 1), Encoding); |
| 594 | |
| 595 | // Break before further function parameters on all levels. |
| 596 | for (unsigned i = 0, e = State.Stack.size(); i != e; ++i) |
| 597 | State.Stack[i].BreakBeforeParameter = true; |
| 598 | |
| 599 | unsigned ColumnsUsed = |
| 600 | StartColumn + |
| 601 | encoding::getCodePointCount(Text.substr(0, FirstLineBreak), Encoding); |
| 602 | if (ColumnsUsed > getColumnLimit()) |
| 603 | return Style.PenaltyExcessCharacter * (ColumnsUsed - getColumnLimit()); |
| 604 | return 0; |
| 605 | } |
| 606 | |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 607 | unsigned ContinuationIndenter::breakProtrudingToken(const FormatToken &Current, |
| 608 | LineState &State, |
| 609 | bool DryRun) { |
Daniel Jasper | f93551c | 2013-08-23 10:05:49 +0000 | [diff] [blame] | 610 | if (!Current.isOneOf(tok::string_literal, tok::comment)) |
| 611 | return 0; |
| 612 | |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 613 | llvm::OwningPtr<BreakableToken> Token; |
| 614 | unsigned StartColumn = State.Column - Current.CodePointCount; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 615 | |
| 616 | if (Current.is(tok::string_literal) && |
| 617 | Current.Type != TT_ImplicitStringLiteral) { |
Alexander Kornienko | d7b837e | 2013-08-29 17:32:57 +0000 | [diff] [blame^] | 618 | // Don't break string literals with (in case of non-raw strings, escaped) |
| 619 | // newlines. As clang-format must not change the string's content, it is |
| 620 | // unlikely that we'll end up with a better format. |
| 621 | if (Current.IsMultiline) |
| 622 | return addMultilineStringLiteral(Current, State); |
| 623 | |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 624 | // Only break up default narrow strings. |
| 625 | if (!Current.TokenText.startswith("\"")) |
| 626 | return 0; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 627 | // Exempts unterminated string literals from line breaking. The user will |
| 628 | // likely want to terminate the string before any line breaking is done. |
| 629 | if (Current.IsUnterminatedLiteral) |
| 630 | return 0; |
| 631 | |
| 632 | Token.reset(new BreakableStringLiteral(Current, StartColumn, |
| 633 | Line.InPPDirective, Encoding)); |
| 634 | } else if (Current.Type == TT_BlockComment && Current.isTrailingComment()) { |
Alexander Kornienko | d7b837e | 2013-08-29 17:32:57 +0000 | [diff] [blame^] | 635 | unsigned OriginalStartColumn = |
| 636 | SourceMgr.getSpellingColumnNumber(Current.getStartOfNonWhitespace()) - |
| 637 | 1; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 638 | Token.reset(new BreakableBlockComment( |
| 639 | Style, Current, StartColumn, OriginalStartColumn, !Current.Previous, |
| 640 | Line.InPPDirective, Encoding)); |
| 641 | } else if (Current.Type == TT_LineComment && |
| 642 | (Current.Previous == NULL || |
| 643 | Current.Previous->Type != TT_ImplicitStringLiteral)) { |
| 644 | // Don't break line comments with escaped newlines. These look like |
| 645 | // separate line comments, but in fact contain a single line comment with |
| 646 | // multiple lines including leading whitespace and the '//' markers. |
| 647 | // |
| 648 | // FIXME: If we want to handle them correctly, we'll need to adjust |
| 649 | // leading whitespace in consecutive lines when changing indentation of |
| 650 | // the first line similar to what we do with block comments. |
Alexander Kornienko | d7b837e | 2013-08-29 17:32:57 +0000 | [diff] [blame^] | 651 | if (Current.IsMultiline) { |
| 652 | StringRef::size_type EscapedNewlinePos = Current.TokenText.find("\\\n"); |
| 653 | assert(EscapedNewlinePos != StringRef::npos); |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 654 | State.Column = |
| 655 | StartColumn + |
| 656 | encoding::getCodePointCount( |
| 657 | Current.TokenText.substr(0, EscapedNewlinePos), Encoding) + |
| 658 | 1; |
| 659 | return 0; |
| 660 | } |
| 661 | |
| 662 | Token.reset(new BreakableLineComment(Current, StartColumn, |
| 663 | Line.InPPDirective, Encoding)); |
| 664 | } else { |
| 665 | return 0; |
| 666 | } |
| 667 | if (Current.UnbreakableTailLength >= getColumnLimit()) |
| 668 | return 0; |
| 669 | |
| 670 | unsigned RemainingSpace = getColumnLimit() - Current.UnbreakableTailLength; |
| 671 | bool BreakInserted = false; |
| 672 | unsigned Penalty = 0; |
| 673 | unsigned RemainingTokenColumns = 0; |
| 674 | for (unsigned LineIndex = 0, EndIndex = Token->getLineCount(); |
| 675 | LineIndex != EndIndex; ++LineIndex) { |
| 676 | if (!DryRun) |
| 677 | Token->replaceWhitespaceBefore(LineIndex, Whitespaces); |
| 678 | unsigned TailOffset = 0; |
| 679 | RemainingTokenColumns = |
| 680 | Token->getLineLengthAfterSplit(LineIndex, TailOffset, StringRef::npos); |
| 681 | while (RemainingTokenColumns > RemainingSpace) { |
| 682 | BreakableToken::Split Split = |
| 683 | Token->getSplit(LineIndex, TailOffset, getColumnLimit()); |
| 684 | if (Split.first == StringRef::npos) { |
| 685 | // The last line's penalty is handled in addNextStateToQueue(). |
| 686 | if (LineIndex < EndIndex - 1) |
| 687 | Penalty += Style.PenaltyExcessCharacter * |
| 688 | (RemainingTokenColumns - RemainingSpace); |
| 689 | break; |
| 690 | } |
| 691 | assert(Split.first != 0); |
| 692 | unsigned NewRemainingTokenColumns = Token->getLineLengthAfterSplit( |
| 693 | LineIndex, TailOffset + Split.first + Split.second, StringRef::npos); |
| 694 | assert(NewRemainingTokenColumns < RemainingTokenColumns); |
| 695 | if (!DryRun) |
| 696 | Token->insertBreak(LineIndex, TailOffset, Split, Whitespaces); |
Daniel Jasper | 2739af3 | 2013-08-28 10:03:58 +0000 | [diff] [blame] | 697 | Penalty += Current.SplitPenalty; |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 698 | unsigned ColumnsUsed = |
| 699 | Token->getLineLengthAfterSplit(LineIndex, TailOffset, Split.first); |
| 700 | if (ColumnsUsed > getColumnLimit()) { |
| 701 | Penalty += |
| 702 | Style.PenaltyExcessCharacter * (ColumnsUsed - getColumnLimit()); |
| 703 | } |
| 704 | TailOffset += Split.first + Split.second; |
| 705 | RemainingTokenColumns = NewRemainingTokenColumns; |
| 706 | BreakInserted = true; |
| 707 | } |
| 708 | } |
| 709 | |
| 710 | State.Column = RemainingTokenColumns; |
| 711 | |
| 712 | if (BreakInserted) { |
| 713 | // If we break the token inside a parameter list, we need to break before |
| 714 | // the next parameter on all levels, so that the next parameter is clearly |
| 715 | // visible. Line comments already introduce a break. |
| 716 | if (Current.Type != TT_LineComment) { |
| 717 | for (unsigned i = 0, e = State.Stack.size(); i != e; ++i) |
| 718 | State.Stack[i].BreakBeforeParameter = true; |
| 719 | } |
| 720 | |
Daniel Jasper | 2739af3 | 2013-08-28 10:03:58 +0000 | [diff] [blame] | 721 | Penalty += Current.is(tok::string_literal) ? Style.PenaltyBreakString |
| 722 | : Style.PenaltyBreakComment; |
| 723 | |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 724 | State.Stack.back().LastSpace = StartColumn; |
| 725 | } |
| 726 | return Penalty; |
| 727 | } |
| 728 | |
| 729 | unsigned ContinuationIndenter::getColumnLimit() const { |
| 730 | // In preprocessor directives reserve two chars for trailing " \" |
| 731 | return Style.ColumnLimit - (Line.InPPDirective ? 2 : 0); |
| 732 | } |
| 733 | |
Daniel Jasper | f438cb7 | 2013-08-23 11:57:34 +0000 | [diff] [blame] | 734 | bool ContinuationIndenter::NextIsMultilineString(const LineState &State) { |
| 735 | const FormatToken &Current = *State.NextToken; |
| 736 | if (!Current.is(tok::string_literal)) |
| 737 | return false; |
Alexander Kornienko | d7b837e | 2013-08-29 17:32:57 +0000 | [diff] [blame^] | 738 | // We never consider raw string literals "multiline" for the purpose of |
| 739 | // AlwaysBreakBeforeMultilineStrings implementation. |
| 740 | if (Current.TokenText.startswith("R\"")) |
| 741 | return false; |
| 742 | if (Current.IsMultiline) |
| 743 | return true; |
Daniel Jasper | f438cb7 | 2013-08-23 11:57:34 +0000 | [diff] [blame] | 744 | if (Current.getNextNonComment() && |
| 745 | Current.getNextNonComment()->is(tok::string_literal)) |
| 746 | return true; // Implicit concatenation. |
| 747 | if (State.Column + Current.CodePointCount + Current.UnbreakableTailLength > |
| 748 | Style.ColumnLimit) |
| 749 | return true; // String will be split. |
Alexander Kornienko | d7b837e | 2013-08-29 17:32:57 +0000 | [diff] [blame^] | 750 | return false; |
Daniel Jasper | f438cb7 | 2013-08-23 11:57:34 +0000 | [diff] [blame] | 751 | } |
| 752 | |
Daniel Jasper | de0328a | 2013-08-16 11:20:30 +0000 | [diff] [blame] | 753 | } // namespace format |
| 754 | } // namespace clang |