blob: 84f07ab28e8d67ee413ac6499299bc85b6f25dca [file] [log] [blame]
//===--- Format.cpp - Format C++ code -------------------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief This file implements functions declared in Format.h. This will be
/// split into separate files as we go.
///
//===----------------------------------------------------------------------===//
15
Manuel Klimek24998102013-01-16 14:55:28 +000016#define DEBUG_TYPE "format-formatter"
17
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000018#include "BreakableToken.h"
Daniel Jasper7a6d09b2013-01-29 21:01:14 +000019#include "TokenAnnotator.h"
Chandler Carruth3a022472012-12-04 09:13:33 +000020#include "UnwrappedLineParser.h"
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000021#include "WhitespaceManager.h"
Daniel Jasperec04c0d2013-05-16 10:40:07 +000022#include "clang/Basic/Diagnostic.h"
Daniel Jasperab7654e2012-12-21 10:20:02 +000023#include "clang/Basic/OperatorPrecedence.h"
Chandler Carruth44eb4f62013-01-02 10:28:36 +000024#include "clang/Basic/SourceManager.h"
Manuel Klimek24998102013-01-16 14:55:28 +000025#include "clang/Format/Format.h"
Daniel Jasperf7935112012-12-03 18:12:45 +000026#include "clang/Lex/Lexer.h"
Alexander Kornienkoffd6d042013-03-27 11:52:18 +000027#include "llvm/ADT/STLExtras.h"
Manuel Klimek2ef908e2013-02-13 10:46:36 +000028#include "llvm/Support/Allocator.h"
Manuel Klimek24998102013-01-16 14:55:28 +000029#include "llvm/Support/Debug.h"
Alexander Kornienkod6538332013-05-07 15:32:14 +000030#include "llvm/Support/YAMLTraits.h"
Manuel Klimek2ef908e2013-02-13 10:46:36 +000031#include <queue>
Daniel Jasper8b529712012-12-04 13:02:32 +000032#include <string>
33
Alexander Kornienkod6538332013-05-07 15:32:14 +000034namespace llvm {
35namespace yaml {
36template <>
37struct ScalarEnumerationTraits<clang::format::FormatStyle::LanguageStandard> {
Manuel Klimeka8eb9142013-05-13 12:51:40 +000038 static void enumeration(IO &IO,
39 clang::format::FormatStyle::LanguageStandard &Value) {
40 IO.enumCase(Value, "C++03", clang::format::FormatStyle::LS_Cpp03);
41 IO.enumCase(Value, "C++11", clang::format::FormatStyle::LS_Cpp11);
42 IO.enumCase(Value, "Auto", clang::format::FormatStyle::LS_Auto);
43 }
44};
45
Daniel Jasper12f9d8e2013-05-14 09:30:02 +000046template <>
Manuel Klimeka8eb9142013-05-13 12:51:40 +000047struct ScalarEnumerationTraits<clang::format::FormatStyle::BraceBreakingStyle> {
48 static void
49 enumeration(IO &IO, clang::format::FormatStyle::BraceBreakingStyle &Value) {
50 IO.enumCase(Value, "Attach", clang::format::FormatStyle::BS_Attach);
51 IO.enumCase(Value, "Linux", clang::format::FormatStyle::BS_Linux);
52 IO.enumCase(Value, "Stroustrup", clang::format::FormatStyle::BS_Stroustrup);
Alexander Kornienkod6538332013-05-07 15:32:14 +000053 }
54};
55
56template <> struct MappingTraits<clang::format::FormatStyle> {
57 static void mapping(llvm::yaml::IO &IO, clang::format::FormatStyle &Style) {
Alexander Kornienko49149672013-05-10 11:56:10 +000058 if (IO.outputting()) {
59 StringRef StylesArray[] = { "LLVM", "Google", "Chromium", "Mozilla" };
60 ArrayRef<StringRef> Styles(StylesArray);
61 for (size_t i = 0, e = Styles.size(); i < e; ++i) {
62 StringRef StyleName(Styles[i]);
Alexander Kornienko006b5c82013-05-19 00:53:30 +000063 clang::format::FormatStyle PredefinedStyle;
64 if (clang::format::getPredefinedStyle(StyleName, &PredefinedStyle) &&
65 Style == PredefinedStyle) {
Alexander Kornienko49149672013-05-10 11:56:10 +000066 IO.mapOptional("# BasedOnStyle", StyleName);
67 break;
68 }
69 }
70 } else {
Alexander Kornienkod6538332013-05-07 15:32:14 +000071 StringRef BasedOnStyle;
72 IO.mapOptional("BasedOnStyle", BasedOnStyle);
Alexander Kornienkod6538332013-05-07 15:32:14 +000073 if (!BasedOnStyle.empty())
Alexander Kornienko006b5c82013-05-19 00:53:30 +000074 if (!clang::format::getPredefinedStyle(BasedOnStyle, &Style)) {
75 IO.setError(Twine("Unknown value for BasedOnStyle: ", BasedOnStyle));
76 return;
77 }
Alexander Kornienkod6538332013-05-07 15:32:14 +000078 }
79
80 IO.mapOptional("AccessModifierOffset", Style.AccessModifierOffset);
81 IO.mapOptional("AlignEscapedNewlinesLeft", Style.AlignEscapedNewlinesLeft);
82 IO.mapOptional("AllowAllParametersOfDeclarationOnNextLine",
83 Style.AllowAllParametersOfDeclarationOnNextLine);
84 IO.mapOptional("AllowShortIfStatementsOnASingleLine",
85 Style.AllowShortIfStatementsOnASingleLine);
Daniel Jasper3a685df2013-05-16 12:12:21 +000086 IO.mapOptional("AllowShortLoopsOnASingleLine",
87 Style.AllowShortLoopsOnASingleLine);
Daniel Jasper61e6bbf2013-05-29 12:07:31 +000088 IO.mapOptional("AlwaysBreakTemplateDeclarations",
89 Style.AlwaysBreakTemplateDeclarations);
Alexander Kornienko58611712013-07-04 12:02:44 +000090 IO.mapOptional("AlwaysBreakBeforeMultilineStrings",
91 Style.AlwaysBreakBeforeMultilineStrings);
Alexander Kornienkod6538332013-05-07 15:32:14 +000092 IO.mapOptional("BinPackParameters", Style.BinPackParameters);
93 IO.mapOptional("ColumnLimit", Style.ColumnLimit);
94 IO.mapOptional("ConstructorInitializerAllOnOneLineOrOnePerLine",
95 Style.ConstructorInitializerAllOnOneLineOrOnePerLine);
96 IO.mapOptional("DerivePointerBinding", Style.DerivePointerBinding);
97 IO.mapOptional("IndentCaseLabels", Style.IndentCaseLabels);
98 IO.mapOptional("MaxEmptyLinesToKeep", Style.MaxEmptyLinesToKeep);
99 IO.mapOptional("ObjCSpaceBeforeProtocolList",
100 Style.ObjCSpaceBeforeProtocolList);
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000101 IO.mapOptional("PenaltyBreakComment", Style.PenaltyBreakComment);
102 IO.mapOptional("PenaltyBreakString", Style.PenaltyBreakString);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000103 IO.mapOptional("PenaltyExcessCharacter", Style.PenaltyExcessCharacter);
104 IO.mapOptional("PenaltyReturnTypeOnItsOwnLine",
105 Style.PenaltyReturnTypeOnItsOwnLine);
106 IO.mapOptional("PointerBindsToType", Style.PointerBindsToType);
107 IO.mapOptional("SpacesBeforeTrailingComments",
108 Style.SpacesBeforeTrailingComments);
Daniel Jasper5bd0b9e2013-05-23 18:05:18 +0000109 IO.mapOptional("SpacesInBracedLists", Style.SpacesInBracedLists);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000110 IO.mapOptional("Standard", Style.Standard);
Manuel Klimek13b97d82013-05-13 08:42:42 +0000111 IO.mapOptional("IndentWidth", Style.IndentWidth);
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000112 IO.mapOptional("UseTab", Style.UseTab);
Manuel Klimeka8eb9142013-05-13 12:51:40 +0000113 IO.mapOptional("BreakBeforeBraces", Style.BreakBeforeBraces);
Manuel Klimek836c2862013-06-21 17:25:42 +0000114 IO.mapOptional("IndentFunctionDeclarationAfterType",
115 Style.IndentFunctionDeclarationAfterType);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000116 }
117};
118}
119}
120
Daniel Jasperf7935112012-12-03 18:12:45 +0000121namespace clang {
122namespace format {
123
Daniel Jasperf7935112012-12-03 18:12:45 +0000124FormatStyle getLLVMStyle() {
125 FormatStyle LLVMStyle;
Daniel Jasperf7935112012-12-03 18:12:45 +0000126 LLVMStyle.AccessModifierOffset = -2;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000127 LLVMStyle.AlignEscapedNewlinesLeft = false;
Daniel Jasperf7db4332013-01-29 16:03:49 +0000128 LLVMStyle.AllowAllParametersOfDeclarationOnNextLine = true;
Daniel Jasper1b750ed2013-01-14 16:24:39 +0000129 LLVMStyle.AllowShortIfStatementsOnASingleLine = false;
Daniel Jasper3a685df2013-05-16 12:12:21 +0000130 LLVMStyle.AllowShortLoopsOnASingleLine = false;
Daniel Jasper61e6bbf2013-05-29 12:07:31 +0000131 LLVMStyle.AlwaysBreakTemplateDeclarations = false;
Alexander Kornienko58611712013-07-04 12:02:44 +0000132 LLVMStyle.AlwaysBreakBeforeMultilineStrings = false;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000133 LLVMStyle.BinPackParameters = true;
134 LLVMStyle.ColumnLimit = 80;
135 LLVMStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = false;
136 LLVMStyle.DerivePointerBinding = false;
137 LLVMStyle.IndentCaseLabels = false;
138 LLVMStyle.MaxEmptyLinesToKeep = 1;
Nico Webera6087752013-01-10 20:12:55 +0000139 LLVMStyle.ObjCSpaceBeforeProtocolList = true;
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000140 LLVMStyle.PenaltyBreakComment = 45;
141 LLVMStyle.PenaltyBreakString = 1000;
Daniel Jasper3a9370c2013-02-04 07:21:18 +0000142 LLVMStyle.PenaltyExcessCharacter = 1000000;
Daniel Jasper6728fc12013-04-11 14:29:13 +0000143 LLVMStyle.PenaltyReturnTypeOnItsOwnLine = 75;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000144 LLVMStyle.PointerBindsToType = false;
145 LLVMStyle.SpacesBeforeTrailingComments = 1;
Daniel Jaspere5777d22013-05-23 10:15:45 +0000146 LLVMStyle.SpacesInBracedLists = true;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000147 LLVMStyle.Standard = FormatStyle::LS_Cpp03;
Manuel Klimek13b97d82013-05-13 08:42:42 +0000148 LLVMStyle.IndentWidth = 2;
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000149 LLVMStyle.UseTab = false;
Manuel Klimeka8eb9142013-05-13 12:51:40 +0000150 LLVMStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
Manuel Klimek836c2862013-06-21 17:25:42 +0000151 LLVMStyle.IndentFunctionDeclarationAfterType = false;
Daniel Jasperf7935112012-12-03 18:12:45 +0000152 return LLVMStyle;
153}
154
155FormatStyle getGoogleStyle() {
156 FormatStyle GoogleStyle;
Daniel Jasperf7935112012-12-03 18:12:45 +0000157 GoogleStyle.AccessModifierOffset = -1;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000158 GoogleStyle.AlignEscapedNewlinesLeft = true;
Daniel Jasperf7db4332013-01-29 16:03:49 +0000159 GoogleStyle.AllowAllParametersOfDeclarationOnNextLine = true;
Daniel Jasper085a2ed2013-04-24 13:46:00 +0000160 GoogleStyle.AllowShortIfStatementsOnASingleLine = true;
Daniel Jasper5bd0b9e2013-05-23 18:05:18 +0000161 GoogleStyle.AllowShortLoopsOnASingleLine = true;
Daniel Jasper61e6bbf2013-05-29 12:07:31 +0000162 GoogleStyle.AlwaysBreakTemplateDeclarations = true;
Alexander Kornienko58611712013-07-04 12:02:44 +0000163 GoogleStyle.AlwaysBreakBeforeMultilineStrings = true;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000164 GoogleStyle.BinPackParameters = true;
165 GoogleStyle.ColumnLimit = 80;
166 GoogleStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
167 GoogleStyle.DerivePointerBinding = true;
168 GoogleStyle.IndentCaseLabels = true;
169 GoogleStyle.MaxEmptyLinesToKeep = 1;
Nico Webera6087752013-01-10 20:12:55 +0000170 GoogleStyle.ObjCSpaceBeforeProtocolList = false;
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000171 GoogleStyle.PenaltyBreakComment = 45;
172 GoogleStyle.PenaltyBreakString = 1000;
Daniel Jasper3a9370c2013-02-04 07:21:18 +0000173 GoogleStyle.PenaltyExcessCharacter = 1000000;
Daniel Jasper6728fc12013-04-11 14:29:13 +0000174 GoogleStyle.PenaltyReturnTypeOnItsOwnLine = 200;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000175 GoogleStyle.PointerBindsToType = true;
176 GoogleStyle.SpacesBeforeTrailingComments = 2;
Daniel Jaspere5777d22013-05-23 10:15:45 +0000177 GoogleStyle.SpacesInBracedLists = false;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000178 GoogleStyle.Standard = FormatStyle::LS_Auto;
Manuel Klimek13b97d82013-05-13 08:42:42 +0000179 GoogleStyle.IndentWidth = 2;
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000180 GoogleStyle.UseTab = false;
Manuel Klimeka8eb9142013-05-13 12:51:40 +0000181 GoogleStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
Manuel Klimek836c2862013-06-21 17:25:42 +0000182 GoogleStyle.IndentFunctionDeclarationAfterType = true;
Daniel Jasperf7935112012-12-03 18:12:45 +0000183 return GoogleStyle;
184}
185
Daniel Jasper1b750ed2013-01-14 16:24:39 +0000186FormatStyle getChromiumStyle() {
187 FormatStyle ChromiumStyle = getGoogleStyle();
Daniel Jasperf7db4332013-01-29 16:03:49 +0000188 ChromiumStyle.AllowAllParametersOfDeclarationOnNextLine = false;
Daniel Jasper085a2ed2013-04-24 13:46:00 +0000189 ChromiumStyle.AllowShortIfStatementsOnASingleLine = false;
Daniel Jasper3a685df2013-05-16 12:12:21 +0000190 ChromiumStyle.AllowShortLoopsOnASingleLine = false;
Daniel Jasper2cf17bf2013-02-27 09:47:53 +0000191 ChromiumStyle.BinPackParameters = false;
Daniel Jasper7fce3ab2013-02-06 14:22:40 +0000192 ChromiumStyle.Standard = FormatStyle::LS_Cpp03;
193 ChromiumStyle.DerivePointerBinding = false;
Daniel Jasper1b750ed2013-01-14 16:24:39 +0000194 return ChromiumStyle;
195}
196
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000197FormatStyle getMozillaStyle() {
198 FormatStyle MozillaStyle = getLLVMStyle();
199 MozillaStyle.AllowAllParametersOfDeclarationOnNextLine = false;
200 MozillaStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
201 MozillaStyle.DerivePointerBinding = true;
202 MozillaStyle.IndentCaseLabels = true;
203 MozillaStyle.ObjCSpaceBeforeProtocolList = false;
204 MozillaStyle.PenaltyReturnTypeOnItsOwnLine = 200;
205 MozillaStyle.PointerBindsToType = true;
206 return MozillaStyle;
207}
208
Alexander Kornienko006b5c82013-05-19 00:53:30 +0000209bool getPredefinedStyle(StringRef Name, FormatStyle *Style) {
Alexander Kornienkod6538332013-05-07 15:32:14 +0000210 if (Name.equals_lower("llvm"))
Alexander Kornienko006b5c82013-05-19 00:53:30 +0000211 *Style = getLLVMStyle();
212 else if (Name.equals_lower("chromium"))
213 *Style = getChromiumStyle();
214 else if (Name.equals_lower("mozilla"))
215 *Style = getMozillaStyle();
216 else if (Name.equals_lower("google"))
217 *Style = getGoogleStyle();
218 else
219 return false;
Alexander Kornienkod6538332013-05-07 15:32:14 +0000220
Alexander Kornienko006b5c82013-05-19 00:53:30 +0000221 return true;
Alexander Kornienkod6538332013-05-07 15:32:14 +0000222}
223
224llvm::error_code parseConfiguration(StringRef Text, FormatStyle *Style) {
Alexander Kornienko06e00332013-05-20 15:18:01 +0000225 if (Text.trim().empty())
226 return llvm::make_error_code(llvm::errc::invalid_argument);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000227 llvm::yaml::Input Input(Text);
228 Input >> *Style;
229 return Input.error();
230}
231
232std::string configurationAsText(const FormatStyle &Style) {
233 std::string Text;
234 llvm::raw_string_ostream Stream(Text);
235 llvm::yaml::Output Output(Stream);
236 // We use the same mapping method for input and output, so we need a non-const
237 // reference here.
238 FormatStyle NonConstStyle = Style;
239 Output << NonConstStyle;
Alexander Kornienko9a38ec22013-05-13 12:56:35 +0000240 return Stream.str();
Alexander Kornienkod6538332013-05-07 15:32:14 +0000241}
242
Daniel Jasperacc33662013-02-08 08:22:00 +0000243// Returns the length of everything up to the first possible line break after
244// the ), ], } or > matching \c Tok.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000245static unsigned getLengthToMatchingParen(const FormatToken &Tok) {
Daniel Jasperacc33662013-02-08 08:22:00 +0000246 if (Tok.MatchingParen == NULL)
247 return 0;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000248 FormatToken *End = Tok.MatchingParen;
249 while (End->Next && !End->Next->CanBreakBefore) {
250 End = End->Next;
Daniel Jasperacc33662013-02-08 08:22:00 +0000251 }
252 return End->TotalLength - Tok.TotalLength + 1;
253}
254
Craig Topperaf35e852013-06-30 22:29:28 +0000255namespace {
256
Daniel Jasperf7935112012-12-03 18:12:45 +0000257class UnwrappedLineFormatter {
258public:
Manuel Klimekb2c6dbe2013-01-10 19:17:33 +0000259 UnwrappedLineFormatter(const FormatStyle &Style, SourceManager &SourceMgr,
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +0000260 const AnnotatedLine &Line, unsigned FirstIndent,
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000261 const FormatToken *RootToken,
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000262 WhitespaceManager &Whitespaces,
263 encoding::Encoding Encoding)
Daniel Jasper2af6bbe2012-12-18 21:05:13 +0000264 : Style(Style), SourceMgr(SourceMgr), Line(Line),
Daniel Jasperaa701fa2013-01-18 08:44:07 +0000265 FirstIndent(FirstIndent), RootToken(RootToken),
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000266 Whitespaces(Whitespaces), Count(0), Encoding(Encoding) {}
Daniel Jasperf7935112012-12-03 18:12:45 +0000267
Manuel Klimek1abf7892013-01-04 23:34:14 +0000268 /// \brief Formats an \c UnwrappedLine.
Manuel Klimek4fe43002013-05-22 12:51:29 +0000269 void format(const AnnotatedLine *NextLine) {
Daniel Jaspere9de2602012-12-06 09:56:08 +0000270 // Initialize state dependent on indent.
Daniel Jasper337816e2013-01-11 10:22:12 +0000271 LineState State;
Manuel Klimek0b689fd2013-01-10 18:45:26 +0000272 State.Column = FirstIndent;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000273 State.NextToken = RootToken;
Daniel Jasper97b89482013-03-13 07:49:51 +0000274 State.Stack.push_back(
Nico Weber9096fc02013-06-26 00:30:14 +0000275 ParenState(FirstIndent, FirstIndent, /*AvoidBinPacking=*/false,
276 /*NoLineBreak=*/false));
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000277 State.LineContainsContinuedForLoopSection = false;
Daniel Jasper400adc62013-02-08 15:28:42 +0000278 State.ParenLevel = 0;
Manuel Klimek02f640a2013-02-20 15:25:48 +0000279 State.StartOfStringLiteral = 0;
Daniel Jasper40c36c52013-02-18 11:05:07 +0000280 State.StartOfLineLevel = State.ParenLevel;
Daniel Jasper0e90c3d2013-07-05 09:14:35 +0000281 State.LowestLevelOnLine = State.ParenLevel;
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000282 State.IgnoreStackForComparison = false;
Daniel Jaspere9de2602012-12-06 09:56:08 +0000283
284 // The first token has already been indented and thus consumed.
Nico Weber9096fc02013-06-26 00:30:14 +0000285 moveStateToNextToken(State, /*DryRun=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +0000286
Daniel Jasper4b866272013-02-01 11:00:45 +0000287 // If everything fits on a single line, just put it there.
Daniel Jasperc22f5b42013-02-28 11:05:57 +0000288 unsigned ColumnLimit = Style.ColumnLimit;
289 if (NextLine && NextLine->InPPDirective &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000290 !NextLine->First->HasUnescapedNewline)
Daniel Jasperc22f5b42013-02-28 11:05:57 +0000291 ColumnLimit = getColumnLimit();
292 if (Line.Last->TotalLength <= ColumnLimit - FirstIndent) {
Daniel Jasper4b866272013-02-01 11:00:45 +0000293 while (State.NextToken != NULL) {
Daniel Jasper2af6bbe2012-12-18 21:05:13 +0000294 addTokenToState(false, false, State);
Daniel Jasper2af6bbe2012-12-18 21:05:13 +0000295 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000296 }
Daniel Jasper4b866272013-02-01 11:00:45 +0000297
Daniel Jasperacc33662013-02-08 08:22:00 +0000298 // If the ObjC method declaration does not fit on a line, we should format
299 // it with one arg per line.
300 if (Line.Type == LT_ObjCMethodDecl)
301 State.Stack.back().BreakBeforeParameter = true;
302
Daniel Jasper4b866272013-02-01 11:00:45 +0000303 // Find best solution in solution space.
Manuel Klimek4fe43002013-05-22 12:51:29 +0000304 analyzeSolutionSpace(State);
Daniel Jasperf7935112012-12-03 18:12:45 +0000305 }
306
307private:
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000308 void DebugTokenState(const FormatToken &FormatTok) {
309 const Token &Tok = FormatTok.Tok;
Alexander Kornienko49149672013-05-10 11:56:10 +0000310 llvm::dbgs() << StringRef(SourceMgr.getCharacterData(Tok.getLocation()),
Daniel Jasperbbc84152013-01-29 11:27:30 +0000311 Tok.getLength());
Alexander Kornienko49149672013-05-10 11:56:10 +0000312 llvm::dbgs();
Manuel Klimek24998102013-01-16 14:55:28 +0000313 }
314
/// \brief Formatting properties tracked for one parenthesis level.
struct ParenState {
  /// \brief Creates a state for a new level; every field not passed in starts
  /// out as 0 / \c false.
  ParenState(unsigned Indent, unsigned LastSpace, bool AvoidBinPacking,
             bool NoLineBreak)
      : Indent(Indent),
        LastSpace(LastSpace),
        FirstLessLess(0),
        BreakBeforeClosingBrace(false),
        QuestionColumn(0),
        AvoidBinPacking(AvoidBinPacking),
        BreakBeforeParameter(false),
        NoLineBreak(NoLineBreak),
        ColonPos(0),
        StartOfFunctionCall(0),
        NestedNameSpecifierContinuation(0),
        CallContinuation(0),
        VariablePos(0),
        ForFakeParenthesis(false) {}

  /// \brief The position to which a specific parenthesis level needs to be
  /// indented.
  unsigned Indent;

  /// \brief The position of the last space on each level.
  ///
  /// Used e.g. to break like:
  /// functionCall(Parameter, otherCall(
  ///                             OtherParameter));
  unsigned LastSpace;

  /// \brief The position of the first "<<" operator encountered on each
  /// level.
  ///
  /// Used to align "<<" operators. 0 if no such operator has been encountered
  /// on a level.
  unsigned FirstLessLess;

  /// \brief Whether a newline needs to be inserted before the block's closing
  /// brace.
  ///
  /// We only want to insert a newline before the closing brace if there also
  /// was a newline after the beginning left brace.
  bool BreakBeforeClosingBrace;

  /// \brief The column of a \c ? in a conditional expression.
  unsigned QuestionColumn;

  /// \brief Avoid bin packing, i.e. multiple parameters/elements on multiple
  /// lines, in this context.
  bool AvoidBinPacking;

  /// \brief Break after the next comma (or all the commas in this context if
  /// \c AvoidBinPacking is \c true).
  bool BreakBeforeParameter;

  /// \brief Line breaking in this context would break a formatting rule.
  bool NoLineBreak;

  /// \brief The position of the colon in an ObjC method declaration/call.
  unsigned ColonPos;

  /// \brief The start of the most recent function in a builder-type call.
  unsigned StartOfFunctionCall;

  /// \brief If a nested name specifier was broken over multiple lines, this
  /// contains the start column of the second line. Otherwise 0.
  unsigned NestedNameSpecifierContinuation;

  /// \brief If a call expression was broken over multiple lines, this
  /// contains the start column of the second line. Otherwise 0.
  unsigned CallContinuation;

  /// \brief The column of the first variable name in a variable declaration.
  ///
  /// Used to align further variables if necessary.
  unsigned VariablePos;

  /// \brief \c true if this \c ParenState was created for a fake parenthesis.
  ///
  /// Does not need to be considered for memoization / the comparison function
  /// as otherwise identical states will have the same fake/non-fake
  /// \c ParenStates.
  bool ForFakeParenthesis;

  /// \brief Three-way comparison of two columns: negative if \p L sorts
  /// first, positive if \p R sorts first, 0 if equal.
  static int orderOf(unsigned L, unsigned R) {
    if (L == R)
      return 0;
    return L < R ? -1 : 1;
  }

  /// \brief Three-way comparison of two flags; a set flag sorts before an
  /// unset one.
  static int orderOf(bool L, bool R) {
    if (L == R)
      return 0;
    return L ? -1 : 1;
  }

  /// \brief Strict weak ordering over the fields below, compared in sequence;
  /// the first field that differs decides.
  ///
  /// \c ForFakeParenthesis is deliberately left out (see its documentation).
  /// NOTE(review): \c NestedNameSpecifierContinuation is not compared either;
  /// confirm whether that omission is intentional.
  bool operator<(const ParenState &Other) const {
    int Order = orderOf(Indent, Other.Indent);
    if (Order == 0)
      Order = orderOf(LastSpace, Other.LastSpace);
    if (Order == 0)
      Order = orderOf(FirstLessLess, Other.FirstLessLess);
    if (Order == 0)
      Order = orderOf(BreakBeforeClosingBrace, Other.BreakBeforeClosingBrace);
    if (Order == 0)
      Order = orderOf(QuestionColumn, Other.QuestionColumn);
    if (Order == 0)
      Order = orderOf(AvoidBinPacking, Other.AvoidBinPacking);
    if (Order == 0)
      Order = orderOf(BreakBeforeParameter, Other.BreakBeforeParameter);
    if (Order == 0)
      Order = orderOf(NoLineBreak, Other.NoLineBreak);
    if (Order == 0)
      Order = orderOf(ColonPos, Other.ColonPos);
    if (Order == 0)
      Order = orderOf(StartOfFunctionCall, Other.StartOfFunctionCall);
    if (Order == 0)
      Order = orderOf(CallContinuation, Other.CallContinuation);
    if (Order == 0)
      Order = orderOf(VariablePos, Other.VariablePos);
    return Order < 0;
  }
};
417
418 /// \brief The current state when indenting a unwrapped line.
419 ///
420 /// As the indenting tries different combinations this is copied by value.
421 struct LineState {
422 /// \brief The number of used columns in the current line.
423 unsigned Column;
424
425 /// \brief The token that needs to be next formatted.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000426 const FormatToken *NextToken;
Daniel Jasper337816e2013-01-11 10:22:12 +0000427
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000428 /// \brief \c true if this line contains a continued for-loop section.
429 bool LineContainsContinuedForLoopSection;
430
Daniel Jasper400adc62013-02-08 15:28:42 +0000431 /// \brief The level of nesting inside (), [], <> and {}.
432 unsigned ParenLevel;
433
Daniel Jasper40c36c52013-02-18 11:05:07 +0000434 /// \brief The \c ParenLevel at the start of this line.
435 unsigned StartOfLineLevel;
436
Daniel Jasper0e90c3d2013-07-05 09:14:35 +0000437 /// \brief The lowest \c ParenLevel on the current line.
438 unsigned LowestLevelOnLine;
Daniel Jasper32a796b2013-05-27 11:50:16 +0000439
Manuel Klimek02f640a2013-02-20 15:25:48 +0000440 /// \brief The start column of the string literal, if we're in a string
441 /// literal sequence, 0 otherwise.
442 unsigned StartOfStringLiteral;
443
Daniel Jasper337816e2013-01-11 10:22:12 +0000444 /// \brief A stack keeping track of properties applying to parenthesis
445 /// levels.
446 std::vector<ParenState> Stack;
447
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000448 /// \brief Ignore the stack of \c ParenStates for state comparison.
449 ///
450 /// In long and deeply nested unwrapped lines, the current algorithm can
451 /// be insufficient for finding the best formatting with a reasonable amount
452 /// of time and memory. Setting this flag will effectively lead to the
453 /// algorithm not analyzing some combinations. However, these combinations
454 /// rarely contain the optimal solution: In short, accepting a higher
455 /// penalty early would need to lead to different values in the \c
456 /// ParenState stack (in an otherwise identical state) and these different
457 /// values would need to lead to a significant amount of avoided penalty
458 /// later.
459 ///
460 /// FIXME: Come up with a better algorithm instead.
461 bool IgnoreStackForComparison;
462
Daniel Jasper337816e2013-01-11 10:22:12 +0000463 /// \brief Comparison operator to be able to used \c LineState in \c map.
464 bool operator<(const LineState &Other) const {
Daniel Jasper58f427e2013-02-19 09:28:55 +0000465 if (NextToken != Other.NextToken)
466 return NextToken < Other.NextToken;
467 if (Column != Other.Column)
468 return Column < Other.Column;
Daniel Jasper58f427e2013-02-19 09:28:55 +0000469 if (LineContainsContinuedForLoopSection !=
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000470 Other.LineContainsContinuedForLoopSection)
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000471 return LineContainsContinuedForLoopSection;
Daniel Jasper58f427e2013-02-19 09:28:55 +0000472 if (ParenLevel != Other.ParenLevel)
473 return ParenLevel < Other.ParenLevel;
474 if (StartOfLineLevel != Other.StartOfLineLevel)
475 return StartOfLineLevel < Other.StartOfLineLevel;
Daniel Jasper0e90c3d2013-07-05 09:14:35 +0000476 if (LowestLevelOnLine != Other.LowestLevelOnLine)
477 return LowestLevelOnLine < Other.LowestLevelOnLine;
Manuel Klimek02f640a2013-02-20 15:25:48 +0000478 if (StartOfStringLiteral != Other.StartOfStringLiteral)
479 return StartOfStringLiteral < Other.StartOfStringLiteral;
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000480 if (IgnoreStackForComparison || Other.IgnoreStackForComparison)
481 return false;
Daniel Jasper58f427e2013-02-19 09:28:55 +0000482 return Stack < Other.Stack;
Daniel Jasperf7935112012-12-03 18:12:45 +0000483 }
484 };
485
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000486 /// \brief Appends the next token to \p State and updates information
487 /// necessary for indentation.
488 ///
Nico Weberf579ab32013-06-26 02:42:46 +0000489 /// Puts the token on the current line if \p Newline is \c false and adds a
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000490 /// line break and necessary indentation otherwise.
491 ///
492 /// If \p DryRun is \c false, also creates and stores the required
493 /// \c Replacement.
Manuel Klimek1998ea22013-02-20 10:15:13 +0000494 unsigned addTokenToState(bool Newline, bool DryRun, LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000495 const FormatToken &Current = *State.NextToken;
496 const FormatToken &Previous = *State.NextToken->Previous;
Daniel Jasperf7935112012-12-03 18:12:45 +0000497
Daniel Jasper291f9362013-03-20 15:58:10 +0000498 if (State.Stack.size() == 0 || Current.Type == TT_ImplicitStringLiteral) {
Manuel Klimek5c24cca2013-05-23 10:56:37 +0000499 // FIXME: Is this correct?
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000500 int WhitespaceLength = SourceMgr.getSpellingColumnNumber(
501 State.NextToken->WhitespaceRange.getEnd()) -
502 SourceMgr.getSpellingColumnNumber(
503 State.NextToken->WhitespaceRange.getBegin());
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000504 State.Column += WhitespaceLength + State.NextToken->CodePointCount;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000505 State.NextToken = State.NextToken->Next;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000506 return 0;
Daniel Jasper4b866272013-02-01 11:00:45 +0000507 }
508
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000509 // If we are continuing an expression, we want to indent an extra 4 spaces.
510 unsigned ContinuationIndent =
Daniel Jasperc238c872013-04-02 14:33:13 +0000511 std::max(State.Stack.back().LastSpace, State.Stack.back().Indent) + 4;
Daniel Jasperf7935112012-12-03 18:12:45 +0000512 if (Newline) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000513 if (Current.is(tok::r_brace)) {
Manuel Klimek13b97d82013-05-13 08:42:42 +0000514 State.Column = Line.Level * Style.IndentWidth;
Daniel Jasper399d24b2013-01-09 07:06:56 +0000515 } else if (Current.is(tok::string_literal) &&
Manuel Klimek02f640a2013-02-20 15:25:48 +0000516 State.StartOfStringLiteral != 0) {
517 State.Column = State.StartOfStringLiteral;
Daniel Jasper2ec3ffb82013-02-18 11:59:17 +0000518 State.Stack.back().BreakBeforeParameter = true;
Daniel Jasper399d24b2013-01-09 07:06:56 +0000519 } else if (Current.is(tok::lessless) &&
Daniel Jasper400adc62013-02-08 15:28:42 +0000520 State.Stack.back().FirstLessLess != 0) {
521 State.Column = State.Stack.back().FirstLessLess;
Daniel Jasperbca4bbe2013-05-28 11:30:49 +0000522 } else if (Current.isOneOf(tok::period, tok::arrow) &&
523 Current.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000524 if (State.Stack.back().CallContinuation == 0) {
525 State.Column = ContinuationIndent;
Daniel Jasperc238c872013-04-02 14:33:13 +0000526 State.Stack.back().CallContinuation = State.Column;
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000527 } else {
528 State.Column = State.Stack.back().CallContinuation;
529 }
Daniel Jasperca6623b2013-01-28 12:45:14 +0000530 } else if (Current.Type == TT_ConditionalExpr) {
531 State.Column = State.Stack.back().QuestionColumn;
Daniel Jaspera628c982013-04-03 13:36:17 +0000532 } else if (Previous.is(tok::comma) &&
533 State.Stack.back().VariablePos != 0) {
534 State.Column = State.Stack.back().VariablePos;
Daniel Jasper26d1b1d2013-02-24 18:54:32 +0000535 } else if (Previous.ClosesTemplateDeclaration ||
Daniel Jasper8e357692013-05-06 08:27:33 +0000536 (Current.Type == TT_StartOfName && State.ParenLevel == 0 &&
Manuel Klimek836c2862013-06-21 17:25:42 +0000537 (!Style.IndentFunctionDeclarationAfterType ||
538 Line.StartsDefinition))) {
Daniel Jasperc238c872013-04-02 14:33:13 +0000539 State.Column = State.Stack.back().Indent;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000540 } else if (Current.Type == TT_ObjCSelectorName) {
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000541 if (State.Stack.back().ColonPos > Current.CodePointCount) {
542 State.Column = State.Stack.back().ColonPos - Current.CodePointCount;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000543 } else {
544 State.Column = State.Stack.back().Indent;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000545 State.Stack.back().ColonPos = State.Column + Current.CodePointCount;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000546 }
Daniel Jasper0f0234e2013-05-08 10:00:18 +0000547 } else if (Current.Type == TT_StartOfName ||
548 Previous.isOneOf(tok::coloncolon, tok::equal) ||
Daniel Jasperc238c872013-04-02 14:33:13 +0000549 Previous.Type == TT_ObjCMethodExpr) {
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000550 State.Column = ContinuationIndent;
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000551 } else {
Daniel Jasper400adc62013-02-08 15:28:42 +0000552 State.Column = State.Stack.back().Indent;
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000553 // Ensure that we fall back to indenting 4 spaces instead of just
554 // flushing continuations left.
Daniel Jasperc238c872013-04-02 14:33:13 +0000555 if (State.Column == FirstIndent)
556 State.Column += 4;
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000557 }
558
Daniel Jasper54a86022013-02-15 11:07:25 +0000559 if (Current.is(tok::question))
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000560 State.Stack.back().BreakBeforeParameter = true;
Daniel Jasperd69fc772013-05-08 14:12:04 +0000561 if ((Previous.isOneOf(tok::comma, tok::semi) &&
562 !State.Stack.back().AvoidBinPacking) ||
563 Previous.Type == TT_BinaryOperator)
Daniel Jasperacc33662013-02-08 08:22:00 +0000564 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasperc6fbc212013-05-15 09:35:08 +0000565 if (Previous.Type == TT_TemplateCloser && State.ParenLevel == 0)
566 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000567
Manuel Klimekb69e3c62013-01-02 18:33:23 +0000568 if (!DryRun) {
Daniel Jasperfb5e2412013-02-26 13:10:34 +0000569 unsigned NewLines = 1;
Alexander Kornienkof370ad92013-06-12 19:04:12 +0000570 if (Current.is(tok::comment))
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000571 NewLines = std::max(
572 NewLines,
573 std::min(Current.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1));
Manuel Klimek4fe43002013-05-22 12:51:29 +0000574 Whitespaces.replaceWhitespace(Current, NewLines, State.Column,
575 State.Column, Line.InPPDirective);
Manuel Klimekb69e3c62013-01-02 18:33:23 +0000576 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000577
Daniel Jasper400adc62013-02-08 15:28:42 +0000578 State.Stack.back().LastSpace = State.Column;
Daniel Jasperbca4bbe2013-05-28 11:30:49 +0000579 if (Current.isOneOf(tok::arrow, tok::period) &&
580 Current.Type != TT_DesignatedInitializerPeriod)
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000581 State.Stack.back().LastSpace += Current.CodePointCount;
Daniel Jasper40c36c52013-02-18 11:05:07 +0000582 State.StartOfLineLevel = State.ParenLevel;
Daniel Jasper0e90c3d2013-07-05 09:14:35 +0000583 State.LowestLevelOnLine = State.ParenLevel;
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000584
585 // Any break on this level means that the parent level has been broken
586 // and we need to avoid bin packing there.
587 for (unsigned i = 0, e = State.Stack.size() - 1; i != e; ++i) {
588 State.Stack[i].BreakBeforeParameter = true;
589 }
Alexander Kornienko1efe0a02013-07-04 14:47:51 +0000590 const FormatToken *TokenBefore = Current.getPreviousNonComment();
Daniel Jasper1b8e76f2013-04-15 22:36:37 +0000591 if (TokenBefore && !TokenBefore->isOneOf(tok::comma, tok::semi) &&
Daniel Jasperc6fbc212013-05-15 09:35:08 +0000592 TokenBefore->Type != TT_TemplateCloser &&
Daniel Jasperd69fc772013-05-08 14:12:04 +0000593 TokenBefore->Type != TT_BinaryOperator && !TokenBefore->opensScope())
Daniel Jasper2cf17bf2013-02-27 09:47:53 +0000594 State.Stack.back().BreakBeforeParameter = true;
595
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000596 // If we break after {, we should also break before the corresponding }.
597 if (Previous.is(tok::l_brace))
598 State.Stack.back().BreakBeforeClosingBrace = true;
599
600 if (State.Stack.back().AvoidBinPacking) {
601 // If we are breaking after '(', '{', '<', this is not bin packing
602 // unless AllowAllParametersOfDeclarationOnNextLine is false.
Daniel Jasper571f1af2013-05-14 20:39:56 +0000603 if (!(Previous.isOneOf(tok::l_paren, tok::l_brace) ||
604 Previous.Type == TT_BinaryOperator) ||
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000605 (!Style.AllowAllParametersOfDeclarationOnNextLine &&
606 Line.MustBeDeclaration))
607 State.Stack.back().BreakBeforeParameter = true;
608 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000609 } else {
Daniel Jasper62e68172013-02-25 15:59:54 +0000610 if (Current.is(tok::equal) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000611 (RootToken->is(tok::kw_for) || State.ParenLevel == 0) &&
Daniel Jasper31c96b92013-04-05 09:38:50 +0000612 State.Stack.back().VariablePos == 0) {
613 State.Stack.back().VariablePos = State.Column;
614 // Move over * and & if they are bound to the variable name.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000615 const FormatToken *Tok = &Previous;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000616 while (Tok && State.Stack.back().VariablePos >= Tok->CodePointCount) {
617 State.Stack.back().VariablePos -= Tok->CodePointCount;
Daniel Jasper31c96b92013-04-05 09:38:50 +0000618 if (Tok->SpacesRequiredBefore != 0)
619 break;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000620 Tok = Tok->Previous;
Daniel Jasper31c96b92013-04-05 09:38:50 +0000621 }
Daniel Jaspera628c982013-04-03 13:36:17 +0000622 if (Previous.PartOfMultiVariableDeclStmt)
623 State.Stack.back().LastSpace = State.Stack.back().VariablePos;
624 }
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000625
Daniel Jaspereef30492013-02-11 12:36:37 +0000626 unsigned Spaces = State.NextToken->SpacesRequiredBefore;
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000627
Daniel Jasperf7935112012-12-03 18:12:45 +0000628 if (!DryRun)
Manuel Klimek4fe43002013-05-22 12:51:29 +0000629 Whitespaces.replaceWhitespace(Current, 0, Spaces,
630 State.Column + Spaces);
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000631
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000632 if (Current.Type == TT_ObjCSelectorName &&
633 State.Stack.back().ColonPos == 0) {
634 if (State.Stack.back().Indent + Current.LongestObjCSelectorName >
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000635 State.Column + Spaces + Current.CodePointCount)
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000636 State.Stack.back().ColonPos =
637 State.Stack.back().Indent + Current.LongestObjCSelectorName;
638 else
639 State.Stack.back().ColonPos =
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000640 State.Column + Spaces + Current.CodePointCount;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000641 }
642
Daniel Jasperc04baae2013-04-10 09:49:49 +0000643 if (Previous.opensScope() && Previous.Type != TT_ObjCMethodExpr &&
Daniel Jasper6bee6822013-04-08 20:33:42 +0000644 Current.Type != TT_LineComment)
Daniel Jasper400adc62013-02-08 15:28:42 +0000645 State.Stack.back().Indent = State.Column + Spaces;
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000646 if (Previous.is(tok::comma) && !Current.isTrailingComment() &&
647 State.Stack.back().AvoidBinPacking)
648 State.Stack.back().NoLineBreak = true;
Daniel Jasper9278eb92013-01-16 14:59:02 +0000649
Daniel Jaspere9de2602012-12-06 09:56:08 +0000650 State.Column += Spaces;
Daniel Jaspera628c982013-04-03 13:36:17 +0000651 if (Current.is(tok::l_paren) && Previous.isOneOf(tok::kw_if, tok::kw_for))
Daniel Jasper39e27382013-01-23 20:41:06 +0000652 // Treat the condition inside an if as if it was a second function
653 // parameter, i.e. let nested calls have an indent of 4.
654 State.Stack.back().LastSpace = State.Column + 1; // 1 is length of "(".
Daniel Jasperd1ae3582013-03-20 12:37:50 +0000655 else if (Previous.is(tok::comma))
Daniel Jasper39e27382013-01-23 20:41:06 +0000656 State.Stack.back().LastSpace = State.Column;
Daniel Jasperca6623b2013-01-28 12:45:14 +0000657 else if ((Previous.Type == TT_BinaryOperator ||
Daniel Jasper65585ed2013-01-28 13:31:35 +0000658 Previous.Type == TT_ConditionalExpr ||
659 Previous.Type == TT_CtorInitializerColon) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000660 !(Previous.getPrecedence() == prec::Assignment &&
Daniel Jasper7b27a102013-05-27 12:45:09 +0000661 Current.FakeLParens.empty()))
662 // Always indent relative to the RHS of the expression unless this is a
663 // simple assignment without binary expression on the RHS.
Daniel Jasper20b09ef2013-01-28 09:35:24 +0000664 State.Stack.back().LastSpace = State.Column;
Daniel Jaspereead02b2013-02-14 08:42:54 +0000665 else if (Previous.Type == TT_InheritanceColon)
666 State.Stack.back().Indent = State.Column;
Daniel Jasperd69fc772013-05-08 14:12:04 +0000667 else if (Previous.opensScope() && !Current.FakeLParens.empty())
668 // If this function has multiple parameters or a binary expression
669 // parameter, indent nested calls from the start of the first parameter.
Daniel Jasper7b5773e92013-01-28 07:35:34 +0000670 State.Stack.back().LastSpace = State.Column;
Daniel Jasperf7935112012-12-03 18:12:45 +0000671 }
Daniel Jasper9278eb92013-01-16 14:59:02 +0000672
Manuel Klimek1998ea22013-02-20 10:15:13 +0000673 return moveStateToNextToken(State, DryRun);
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000674 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000675
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000676 /// \brief Mark the next token as consumed in \p State and modify its stacks
677 /// accordingly.
Manuel Klimek1998ea22013-02-20 10:15:13 +0000678 unsigned moveStateToNextToken(LineState &State, bool DryRun) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000679 const FormatToken &Current = *State.NextToken;
Daniel Jasper337816e2013-01-11 10:22:12 +0000680 assert(State.Stack.size());
Daniel Jaspere9de2602012-12-06 09:56:08 +0000681
Daniel Jaspereead02b2013-02-14 08:42:54 +0000682 if (Current.Type == TT_InheritanceColon)
683 State.Stack.back().AvoidBinPacking = true;
Daniel Jasper337816e2013-01-11 10:22:12 +0000684 if (Current.is(tok::lessless) && State.Stack.back().FirstLessLess == 0)
685 State.Stack.back().FirstLessLess = State.Column;
Daniel Jasperca6623b2013-01-28 12:45:14 +0000686 if (Current.is(tok::question))
687 State.Stack.back().QuestionColumn = State.Column;
Daniel Jasper0e90c3d2013-07-05 09:14:35 +0000688 if (!Current.opensScope() && !Current.closesScope())
689 State.LowestLevelOnLine =
690 std::min(State.LowestLevelOnLine, State.ParenLevel);
691 if (Current.isOneOf(tok::period, tok::arrow) &&
692 Line.Type == LT_BuilderTypeCall && State.ParenLevel == 0)
693 State.Stack.back().StartOfFunctionCall =
694 Current.LastInChainOfCalls ? 0
695 : State.Column + Current.CodePointCount;
Daniel Jasper37905f72013-02-21 15:00:29 +0000696 if (Current.Type == TT_CtorInitializerColon) {
Manuel Klimek13b97d82013-05-13 08:42:42 +0000697 // Indent 2 from the column, so:
698 // SomeClass::SomeClass()
699 // : First(...), ...
700 // Next(...)
701 // ^ line up here.
Daniel Jasper6bee6822013-04-08 20:33:42 +0000702 State.Stack.back().Indent = State.Column + 2;
Daniel Jasper37905f72013-02-21 15:00:29 +0000703 if (Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
704 State.Stack.back().AvoidBinPacking = true;
705 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000706 }
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000707
Daniel Jasper6bee6822013-04-08 20:33:42 +0000708 // If return returns a binary expression, align after it.
709 if (Current.is(tok::kw_return) && !Current.FakeLParens.empty())
710 State.Stack.back().LastSpace = State.Column + 7;
711
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000712 // In ObjC method declaration we align on the ":" of parameters, but we need
713 // to ensure that we indent parameters on subsequent lines by at least 4.
Daniel Jasperc238c872013-04-02 14:33:13 +0000714 if (Current.Type == TT_ObjCMethodSpecifier)
715 State.Stack.back().Indent += 4;
Daniel Jaspere9de2602012-12-06 09:56:08 +0000716
Daniel Jasper400adc62013-02-08 15:28:42 +0000717 // Insert scopes created by fake parenthesis.
Alexander Kornienko1efe0a02013-07-04 14:47:51 +0000718 const FormatToken *Previous = Current.getPreviousNonComment();
Daniel Jasper6bee6822013-04-08 20:33:42 +0000719 // Don't add extra indentation for the first fake parenthesis after
720 // 'return', assignements or opening <({[. The indentation for these cases
721 // is special cased.
722 bool SkipFirstExtraIndent =
723 Current.is(tok::kw_return) ||
Daniel Jasperc04baae2013-04-10 09:49:49 +0000724 (Previous && (Previous->opensScope() ||
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000725 Previous->getPrecedence() == prec::Assignment));
Daniel Jasper6bee6822013-04-08 20:33:42 +0000726 for (SmallVector<prec::Level, 4>::const_reverse_iterator
727 I = Current.FakeLParens.rbegin(),
728 E = Current.FakeLParens.rend();
729 I != E; ++I) {
Daniel Jasper400adc62013-02-08 15:28:42 +0000730 ParenState NewParenState = State.Stack.back();
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000731 NewParenState.ForFakeParenthesis = true;
Daniel Jasper6bee6822013-04-08 20:33:42 +0000732 NewParenState.Indent =
733 std::max(std::max(State.Column, NewParenState.Indent),
734 State.Stack.back().LastSpace);
735
736 // Always indent conditional expressions. Never indent expression where
737 // the 'operator' is ',', ';' or an assignment (i.e. *I <=
738 // prec::Assignment) as those have different indentation rules. Indent
739 // other expression, unless the indentation needs to be skipped.
740 if (*I == prec::Conditional ||
741 (!SkipFirstExtraIndent && *I > prec::Assignment))
742 NewParenState.Indent += 4;
Daniel Jasperc04baae2013-04-10 09:49:49 +0000743 if (Previous && !Previous->opensScope())
Daniel Jasper6bee6822013-04-08 20:33:42 +0000744 NewParenState.BreakBeforeParameter = false;
Daniel Jasper400adc62013-02-08 15:28:42 +0000745 State.Stack.push_back(NewParenState);
Daniel Jasper6bee6822013-04-08 20:33:42 +0000746 SkipFirstExtraIndent = false;
Daniel Jasper400adc62013-02-08 15:28:42 +0000747 }
748
Daniel Jasper2eda23e2012-12-24 13:43:52 +0000749 // If we encounter an opening (, [, { or <, we add a level to our stacks to
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000750 // prepare for the following tokens.
Daniel Jasperc04baae2013-04-10 09:49:49 +0000751 if (Current.opensScope()) {
Daniel Jasper337816e2013-01-11 10:22:12 +0000752 unsigned NewIndent;
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000753 unsigned LastSpace = State.Stack.back().LastSpace;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000754 bool AvoidBinPacking;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000755 if (Current.is(tok::l_brace)) {
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000756 NewIndent = Style.IndentWidth + LastSpace;
Alexander Kornienko1efe0a02013-07-04 14:47:51 +0000757 const FormatToken *NextNoComment = Current.getNextNonComment();
Daniel Jasperbca4bbe2013-05-28 11:30:49 +0000758 AvoidBinPacking = NextNoComment &&
759 NextNoComment->Type == TT_DesignatedInitializerPeriod;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000760 } else {
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000761 NewIndent =
762 4 + std::max(LastSpace, State.Stack.back().StartOfFunctionCall);
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000763 AvoidBinPacking = !Style.BinPackParameters;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000764 }
Daniel Jaspere3c0e012013-04-25 13:31:51 +0000765
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000766 State.Stack.push_back(ParenState(NewIndent, LastSpace, AvoidBinPacking,
767 State.Stack.back().NoLineBreak));
Daniel Jasper400adc62013-02-08 15:28:42 +0000768 ++State.ParenLevel;
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000769 }
770
Daniel Jasperacc33662013-02-08 08:22:00 +0000771 // If this '[' opens an ObjC call, determine whether all parameters fit into
772 // one line and put one per line if they don't.
773 if (Current.is(tok::l_square) && Current.Type == TT_ObjCMethodExpr &&
774 Current.MatchingParen != NULL) {
775 if (getLengthToMatchingParen(Current) + State.Column > getColumnLimit())
776 State.Stack.back().BreakBeforeParameter = true;
777 }
778
Daniel Jasper2eda23e2012-12-24 13:43:52 +0000779 // If we encounter a closing ), ], } or >, we can remove a level from our
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000780 // stacks.
Alexander Kornienko62b85b92013-03-13 14:41:29 +0000781 if (Current.isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000782 (Current.is(tok::r_brace) && State.NextToken != RootToken) ||
Daniel Jasper7c85fde2013-01-08 14:56:18 +0000783 State.NextToken->Type == TT_TemplateCloser) {
Daniel Jasper337816e2013-01-11 10:22:12 +0000784 State.Stack.pop_back();
Daniel Jasper400adc62013-02-08 15:28:42 +0000785 --State.ParenLevel;
786 }
787
788 // Remove scopes created by fake parenthesis.
789 for (unsigned i = 0, e = Current.FakeRParens; i != e; ++i) {
Daniel Jasper6daabe32013-04-04 19:31:00 +0000790 unsigned VariablePos = State.Stack.back().VariablePos;
Daniel Jasper400adc62013-02-08 15:28:42 +0000791 State.Stack.pop_back();
Daniel Jasper6daabe32013-04-04 19:31:00 +0000792 State.Stack.back().VariablePos = VariablePos;
Daniel Jasperf7935112012-12-03 18:12:45 +0000793 }
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000794
Daniel Jasper47a04442013-05-13 20:50:15 +0000795 if (Current.is(tok::string_literal) && State.StartOfStringLiteral == 0) {
Manuel Klimek02f640a2013-02-20 15:25:48 +0000796 State.StartOfStringLiteral = State.Column;
Daniel Jasper47a04442013-05-13 20:50:15 +0000797 } else if (!Current.isOneOf(tok::comment, tok::identifier, tok::hash,
798 tok::string_literal)) {
Daniel Jasper7dd22c51b2013-05-16 04:26:02 +0000799 State.StartOfStringLiteral = 0;
Manuel Klimek02f640a2013-02-20 15:25:48 +0000800 }
801
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000802 State.Column += Current.CodePointCount;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000803
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000804 State.NextToken = State.NextToken->Next;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000805
Manuel Klimek1998ea22013-02-20 10:15:13 +0000806 return breakProtrudingToken(Current, State, DryRun);
807 }
808
809 /// \brief If the current token sticks out over the end of the line, break
810 /// it if possible.
Manuel Klimek5ecb5fd2013-05-14 09:04:24 +0000811 ///
812 /// \returns An extra penalty if a token was broken, otherwise 0.
813 ///
Alexander Kornienkoaa620e12013-07-01 13:42:42 +0000814 /// The returned penalty will cover the cost of the additional line breaks and
815 /// column limit violation in all lines except for the last one. The penalty
816 /// for the column limit violation in the last line (and in single line
817 /// tokens) is handled in \c addNextStateToQueue.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000818 unsigned breakProtrudingToken(const FormatToken &Current, LineState &State,
Manuel Klimek4fe43002013-05-22 12:51:29 +0000819 bool DryRun) {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000820 llvm::OwningPtr<BreakableToken> Token;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000821 unsigned StartColumn = State.Column - Current.CodePointCount;
Manuel Klimek591ab5a2013-05-28 13:42:28 +0000822 unsigned OriginalStartColumn =
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000823 SourceMgr.getSpellingColumnNumber(Current.getStartOfNonWhitespace()) -
Manuel Klimek591ab5a2013-05-28 13:42:28 +0000824 1;
Manuel Klimek9043c742013-05-27 15:23:34 +0000825
Daniel Jasper8bb99e82013-05-16 12:59:13 +0000826 if (Current.is(tok::string_literal) &&
827 Current.Type != TT_ImplicitStringLiteral) {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000828 // Only break up default narrow strings.
Alexander Kornienkobe633902013-06-14 11:46:10 +0000829 if (!Current.TokenText.startswith("\""))
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000830 return 0;
831
Alexander Kornienkobe633902013-06-14 11:46:10 +0000832 Token.reset(new BreakableStringLiteral(Current, StartColumn,
833 Line.InPPDirective, Encoding));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000834 } else if (Current.Type == TT_BlockComment) {
Alexander Kornienkobe633902013-06-14 11:46:10 +0000835 Token.reset(new BreakableBlockComment(
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000836 Style, Current, StartColumn, OriginalStartColumn, !Current.Previous,
Alexander Kornienkobe633902013-06-14 11:46:10 +0000837 Line.InPPDirective, Encoding));
Daniel Jasper4a4be012013-05-06 10:24:51 +0000838 } else if (Current.Type == TT_LineComment &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000839 (Current.Previous == NULL ||
840 Current.Previous->Type != TT_ImplicitStringLiteral)) {
Alexander Kornienkobe633902013-06-14 11:46:10 +0000841 Token.reset(new BreakableLineComment(Current, StartColumn,
842 Line.InPPDirective, Encoding));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000843 } else {
Manuel Klimek4fe43002013-05-22 12:51:29 +0000844 return 0;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000845 }
Alexander Kornienkobe633902013-06-14 11:46:10 +0000846 if (Current.UnbreakableTailLength >= getColumnLimit())
Manuel Klimek5ecb5fd2013-05-14 09:04:24 +0000847 return 0;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000848
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000849 unsigned RemainingSpace = getColumnLimit() - Current.UnbreakableTailLength;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000850 bool BreakInserted = false;
851 unsigned Penalty = 0;
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000852 unsigned RemainingTokenColumns = 0;
Manuel Klimek9043c742013-05-27 15:23:34 +0000853 for (unsigned LineIndex = 0, EndIndex = Token->getLineCount();
854 LineIndex != EndIndex; ++LineIndex) {
Alexander Kornienkobe633902013-06-14 11:46:10 +0000855 if (!DryRun)
856 Token->replaceWhitespaceBefore(LineIndex, Whitespaces);
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000857 unsigned TailOffset = 0;
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000858 RemainingTokenColumns = Token->getLineLengthAfterSplit(
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000859 LineIndex, TailOffset, StringRef::npos);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000860 while (RemainingTokenColumns > RemainingSpace) {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000861 BreakableToken::Split Split =
Manuel Klimek4fe43002013-05-22 12:51:29 +0000862 Token->getSplit(LineIndex, TailOffset, getColumnLimit());
Alexander Kornienkoaa620e12013-07-01 13:42:42 +0000863 if (Split.first == StringRef::npos) {
864 // The last line's penalty is handled in addNextStateToQueue().
865 if (LineIndex < EndIndex - 1)
866 Penalty += Style.PenaltyExcessCharacter *
867 (RemainingTokenColumns - RemainingSpace);
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000868 break;
Alexander Kornienkoaa620e12013-07-01 13:42:42 +0000869 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000870 assert(Split.first != 0);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000871 unsigned NewRemainingTokenColumns = Token->getLineLengthAfterSplit(
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000872 LineIndex, TailOffset + Split.first + Split.second,
873 StringRef::npos);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000874 assert(NewRemainingTokenColumns < RemainingTokenColumns);
Alexander Kornienkobe633902013-06-14 11:46:10 +0000875 if (!DryRun)
876 Token->insertBreak(LineIndex, TailOffset, Split, Whitespaces);
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000877 Penalty += Current.is(tok::string_literal) ? Style.PenaltyBreakString
878 : Style.PenaltyBreakComment;
879 unsigned ColumnsUsed =
880 Token->getLineLengthAfterSplit(LineIndex, TailOffset, Split.first);
881 if (ColumnsUsed > getColumnLimit()) {
882 Penalty +=
883 Style.PenaltyExcessCharacter * (ColumnsUsed - getColumnLimit());
884 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000885 TailOffset += Split.first + Split.second;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000886 RemainingTokenColumns = NewRemainingTokenColumns;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000887 BreakInserted = true;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000888 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000889 }
890
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000891 State.Column = RemainingTokenColumns;
892
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000893 if (BreakInserted) {
Alexander Kornienko4d26b6e2013-06-17 12:59:44 +0000894 // If we break the token inside a parameter list, we need to break before
895 // the next parameter on all levels, so that the next parameter is clearly
896 // visible. Line comments already introduce a break.
897 if (Current.Type != TT_LineComment) {
898 for (unsigned i = 0, e = State.Stack.size(); i != e; ++i)
899 State.Stack[i].BreakBeforeParameter = true;
900 }
901
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000902 State.Stack.back().LastSpace = StartColumn;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000903 }
Manuel Klimek1998ea22013-02-20 10:15:13 +0000904 return Penalty;
905 }
906
Daniel Jasper2df93312013-01-09 10:16:05 +0000907 unsigned getColumnLimit() {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000908 // In preprocessor directives reserve two chars for trailing " \"
909 return Style.ColumnLimit - (Line.InPPDirective ? 2 : 0);
Daniel Jasper2df93312013-01-09 10:16:05 +0000910 }
911
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000912 /// \brief An edge in the solution space from \c Previous->State to \c State,
913 /// inserting a newline dependent on the \c NewLine.
914 struct StateNode {
915 StateNode(const LineState &State, bool NewLine, StateNode *Previous)
Daniel Jasper12ef4e52013-02-21 21:33:55 +0000916 : State(State), NewLine(NewLine), Previous(Previous) {}
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000917 LineState State;
918 bool NewLine;
919 StateNode *Previous;
920 };
Daniel Jasper4b866272013-02-01 11:00:45 +0000921
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000922 /// \brief A pair of <penalty, count> that is used to prioritize the BFS on.
923 ///
924 /// In case of equal penalties, we want to prefer states that were inserted
925 /// first. During state generation we make sure that we insert states first
926 /// that break the line as late as possible.
927 typedef std::pair<unsigned, unsigned> OrderedPenalty;
928
929 /// \brief An item in the prioritized BFS search queue. The \c StateNode's
930 /// \c State has the given \c OrderedPenalty.
931 typedef std::pair<OrderedPenalty, StateNode *> QueueItem;
932
933 /// \brief The BFS queue type.
934 typedef std::priority_queue<QueueItem, std::vector<QueueItem>,
935 std::greater<QueueItem> > QueueType;
Daniel Jasper4b866272013-02-01 11:00:45 +0000936
937 /// \brief Analyze the entire solution space starting from \p InitialState.
Daniel Jasperf7935112012-12-03 18:12:45 +0000938 ///
Daniel Jasper4b866272013-02-01 11:00:45 +0000939 /// This implements a variant of Dijkstra's algorithm on the graph that spans
940 /// the solution space (\c LineStates are the nodes). The algorithm tries to
941 /// find the shortest path (the one with lowest penalty) from \p InitialState
942 /// to a state where all tokens are placed.
Manuel Klimek4fe43002013-05-22 12:51:29 +0000943 void analyzeSolutionSpace(LineState &InitialState) {
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000944 std::set<LineState> Seen;
945
Daniel Jasper4b866272013-02-01 11:00:45 +0000946 // Insert start element into queue.
Daniel Jasper687af3b2013-02-14 14:26:07 +0000947 StateNode *Node =
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000948 new (Allocator.Allocate()) StateNode(InitialState, false, NULL);
949 Queue.push(QueueItem(OrderedPenalty(0, Count), Node));
950 ++Count;
Daniel Jasper4b866272013-02-01 11:00:45 +0000951
952 // While not empty, take first element and follow edges.
953 while (!Queue.empty()) {
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000954 unsigned Penalty = Queue.top().first.first;
Daniel Jasper687af3b2013-02-14 14:26:07 +0000955 StateNode *Node = Queue.top().second;
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000956 if (Node->State.NextToken == NULL) {
Alexander Kornienko49149672013-05-10 11:56:10 +0000957 DEBUG(llvm::dbgs() << "\n---\nPenalty for line: " << Penalty << "\n");
Daniel Jasper4b866272013-02-01 11:00:45 +0000958 break;
Daniel Jasper3a9370c2013-02-04 07:21:18 +0000959 }
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000960 Queue.pop();
Daniel Jasper4b866272013-02-01 11:00:45 +0000961
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000962 // Cut off the analysis of certain solutions if the analysis gets too
963 // complex. See description of IgnoreStackForComparison.
964 if (Count > 10000)
965 Node->State.IgnoreStackForComparison = true;
966
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000967 if (!Seen.insert(Node->State).second)
968 // State already examined with lower penalty.
969 continue;
Daniel Jasper4b866272013-02-01 11:00:45 +0000970
Nico Weber9096fc02013-06-26 00:30:14 +0000971 addNextStateToQueue(Penalty, Node, /*NewLine=*/false);
972 addNextStateToQueue(Penalty, Node, /*NewLine=*/true);
Daniel Jasper4b866272013-02-01 11:00:45 +0000973 }
974
975 if (Queue.empty())
976 // We were unable to find a solution, do nothing.
977 // FIXME: Add diagnostic?
Manuel Klimek4fe43002013-05-22 12:51:29 +0000978 return;
Daniel Jasperf7935112012-12-03 18:12:45 +0000979
Daniel Jasper4b866272013-02-01 11:00:45 +0000980 // Reconstruct the solution.
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000981 reconstructPath(InitialState, Queue.top().second);
Alexander Kornienko49149672013-05-10 11:56:10 +0000982 DEBUG(llvm::dbgs() << "Total number of analyzed states: " << Count << "\n");
983 DEBUG(llvm::dbgs() << "---\n");
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000984 }
985
986 void reconstructPath(LineState &State, StateNode *Current) {
Manuel Klimek4c5c28b2013-05-29 15:10:11 +0000987 std::deque<StateNode *> Path;
988 // We do not need a break before the initial token.
989 while (Current->Previous) {
990 Path.push_front(Current);
991 Current = Current->Previous;
992 }
993 for (std::deque<StateNode *>::iterator I = Path.begin(), E = Path.end();
994 I != E; ++I) {
995 DEBUG({
996 if ((*I)->NewLine) {
997 llvm::dbgs() << "Penalty for splitting before "
998 << (*I)->Previous->State.NextToken->Tok.getName() << ": "
999 << (*I)->Previous->State.NextToken->SplitPenalty << "\n";
1000 }
1001 });
1002 addTokenToState((*I)->NewLine, false, State);
1003 }
Daniel Jasper4b866272013-02-01 11:00:45 +00001004 }
1005
Manuel Klimekaf491072013-02-13 10:54:19 +00001006 /// \brief Add the following state to the analysis queue \c Queue.
Daniel Jasper4b866272013-02-01 11:00:45 +00001007 ///
Manuel Klimekaf491072013-02-13 10:54:19 +00001008 /// Assume the current state is \p PreviousNode and has been reached with a
Daniel Jasper4b866272013-02-01 11:00:45 +00001009 /// penalty of \p Penalty. Insert a line break if \p NewLine is \c true.
Manuel Klimekaf491072013-02-13 10:54:19 +00001010 void addNextStateToQueue(unsigned Penalty, StateNode *PreviousNode,
1011 bool NewLine) {
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001012 if (NewLine && !canBreak(PreviousNode->State))
Daniel Jasper4b866272013-02-01 11:00:45 +00001013 return;
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001014 if (!NewLine && mustBreak(PreviousNode->State))
Daniel Jasper4b866272013-02-01 11:00:45 +00001015 return;
Daniel Jasper20b09ef2013-01-28 09:35:24 +00001016 if (NewLine)
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001017 Penalty += PreviousNode->State.NextToken->SplitPenalty;
1018
1019 StateNode *Node = new (Allocator.Allocate())
1020 StateNode(PreviousNode->State, NewLine, PreviousNode);
Manuel Klimek1998ea22013-02-20 10:15:13 +00001021 Penalty += addTokenToState(NewLine, true, Node->State);
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001022 if (Node->State.Column > getColumnLimit()) {
1023 unsigned ExcessCharacters = Node->State.Column - getColumnLimit();
Daniel Jasper3a9370c2013-02-04 07:21:18 +00001024 Penalty += Style.PenaltyExcessCharacter * ExcessCharacters;
Daniel Jasper2df93312013-01-09 10:16:05 +00001025 }
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001026
1027 Queue.push(QueueItem(OrderedPenalty(Penalty, Count), Node));
1028 ++Count;
Daniel Jasper4b866272013-02-01 11:00:45 +00001029 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001030
Daniel Jasper4b866272013-02-01 11:00:45 +00001031 /// \brief Returns \c true, if a line break after \p State is allowed.
1032 bool canBreak(const LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001033 const FormatToken &Current = *State.NextToken;
1034 const FormatToken &Previous = *Current.Previous;
1035 assert(&Previous == Current.Previous);
Daniel Jasper473c62c2013-05-17 09:35:01 +00001036 if (!Current.CanBreakBefore &&
1037 !(Current.is(tok::r_brace) &&
Daniel Jasper4b866272013-02-01 11:00:45 +00001038 State.Stack.back().BreakBeforeClosingBrace))
1039 return false;
Daniel Jasper473c62c2013-05-17 09:35:01 +00001040 // The opening "{" of a braced list has to be on the same line as the first
1041 // element if it is nested in another braced init list or function call.
1042 if (!Current.MustBreakBefore && Previous.is(tok::l_brace) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001043 Previous.Previous &&
1044 Previous.Previous->isOneOf(tok::l_brace, tok::l_paren, tok::comma))
Daniel Jasper473c62c2013-05-17 09:35:01 +00001045 return false;
Daniel Jasper32a796b2013-05-27 11:50:16 +00001046 // This prevents breaks like:
1047 // ...
1048 // SomeParameter, OtherParameter).DoSomething(
1049 // ...
1050 // As they hide "DoSomething" and are generally bad for readability.
Daniel Jasper0e90c3d2013-07-05 09:14:35 +00001051 if (Previous.opensScope() &&
1052 State.LowestLevelOnLine < State.StartOfLineLevel)
Daniel Jasper32a796b2013-05-27 11:50:16 +00001053 return false;
Daniel Jaspercc960fa2013-04-22 07:59:53 +00001054 return !State.Stack.back().NoLineBreak;
Daniel Jasper4b866272013-02-01 11:00:45 +00001055 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001056
Daniel Jasper4b866272013-02-01 11:00:45 +00001057 /// \brief Returns \c true, if a line break after \p State is mandatory.
1058 bool mustBreak(const LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001059 const FormatToken &Current = *State.NextToken;
1060 const FormatToken &Previous = *Current.Previous;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001061 if (Current.MustBreakBefore || Current.Type == TT_InlineASMColon)
Daniel Jasper4b866272013-02-01 11:00:45 +00001062 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001063 if (Current.is(tok::r_brace) && State.Stack.back().BreakBeforeClosingBrace)
Daniel Jasper4b866272013-02-01 11:00:45 +00001064 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001065 if (Previous.is(tok::semi) && State.LineContainsContinuedForLoopSection)
Daniel Jasper4b866272013-02-01 11:00:45 +00001066 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001067 if ((Previous.isOneOf(tok::comma, tok::semi) || Current.is(tok::question) ||
1068 Current.Type == TT_ConditionalExpr) &&
Daniel Jasperacc33662013-02-08 08:22:00 +00001069 State.Stack.back().BreakBeforeParameter &&
Daniel Jasperd69fc772013-05-08 14:12:04 +00001070 !Current.isTrailingComment() &&
1071 !Current.isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper4b866272013-02-01 11:00:45 +00001072 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001073
1074 // If we need to break somewhere inside the LHS of a binary expression, we
Daniel Jasper7ae41cd2013-07-03 10:34:47 +00001075 // should also break after the operator. Otherwise, the formatting would
1076 // hide the operator precedence, e.g. in:
1077 // if (aaaaaaaaaaaaaa ==
1078 // bbbbbbbbbbbbbb && c) {..
1079 // For comparisons, we only apply this rule, if the LHS is a binary
1080 // expression itself as otherwise, the line breaks seem superfluous.
1081 // We need special cases for ">>" which we have split into two ">" while
1082 // lexing in order to make template parsing easier.
1083 bool IsComparison = (Previous.getPrecedence() == prec::Relational ||
1084 Previous.getPrecedence() == prec::Equality) &&
1085 Previous.Previous &&
1086 Previous.Previous->Type != TT_BinaryOperator; // For >>.
1087 bool LHSIsBinaryExpr =
1088 Previous.Previous && Previous.Previous->FakeRParens > 0;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001089 if (Previous.Type == TT_BinaryOperator &&
Daniel Jasper7ae41cd2013-07-03 10:34:47 +00001090 (!IsComparison || LHSIsBinaryExpr) &&
1091 Current.Type != TT_BinaryOperator && // For >>.
Daniel Jasper68d888c2013-06-03 08:42:05 +00001092 !Current.isTrailingComment() &&
Daniel Jasperd69fc772013-05-08 14:12:04 +00001093 !Previous.isOneOf(tok::lessless, tok::question) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001094 Previous.getPrecedence() != prec::Assignment &&
Daniel Jasperacc33662013-02-08 08:22:00 +00001095 State.Stack.back().BreakBeforeParameter)
Daniel Jasper1ac3e052013-02-05 10:07:47 +00001096 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001097
1098 // FIXME: Comparing LongestObjCSelectorName to 0 is a hacky way of finding
1099 // out whether it is the first parameter. Clean this up.
1100 if (Current.Type == TT_ObjCSelectorName &&
1101 Current.LongestObjCSelectorName == 0 &&
1102 State.Stack.back().BreakBeforeParameter)
Daniel Jasper4b866272013-02-01 11:00:45 +00001103 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001104 if ((Current.Type == TT_CtorInitializerColon ||
1105 (Previous.ClosesTemplateDeclaration && State.ParenLevel == 0)))
Daniel Jasper40aacf42013-03-14 13:45:21 +00001106 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001107
Daniel Jasperc6fbc212013-05-15 09:35:08 +00001108 if (Current.Type == TT_StartOfName && Line.MightBeFunctionDecl &&
1109 State.Stack.back().BreakBeforeParameter && State.ParenLevel == 0)
1110 return true;
Daniel Jasper4b866272013-02-01 11:00:45 +00001111 return false;
Daniel Jasperf7935112012-12-03 18:12:45 +00001112 }
1113
Daniel Jasper9b334242013-03-15 14:57:30 +00001114 // Returns the total number of columns required for the remaining tokens.
1115 unsigned getRemainingLength(const LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001116 if (State.NextToken && State.NextToken->Previous)
1117 return Line.Last->TotalLength - State.NextToken->Previous->TotalLength;
Daniel Jasper9b334242013-03-15 14:57:30 +00001118 return 0;
1119 }
1120
Daniel Jasperf7935112012-12-03 18:12:45 +00001121 FormatStyle Style;
1122 SourceManager &SourceMgr;
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001123 const AnnotatedLine &Line;
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001124 const unsigned FirstIndent;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001125 const FormatToken *RootToken;
Daniel Jasperaa701fa2013-01-18 08:44:07 +00001126 WhitespaceManager &Whitespaces;
Manuel Klimekaf491072013-02-13 10:54:19 +00001127
1128 llvm::SpecificBumpPtrAllocator<StateNode> Allocator;
1129 QueueType Queue;
1130 // Increasing count of \c StateNode items we have created. This is used
1131 // to create a deterministic order independent of the container.
1132 unsigned Count;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001133 encoding::Encoding Encoding;
Daniel Jasperf7935112012-12-03 18:12:45 +00001134};
1135
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001136class FormatTokenLexer {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001137public:
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001138 FormatTokenLexer(Lexer &Lex, SourceManager &SourceMgr,
1139 encoding::Encoding Encoding)
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001140 : FormatTok(NULL), GreaterStashed(false), TrailingWhitespace(0), Lex(Lex),
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001141 SourceMgr(SourceMgr), IdentTable(Lex.getLangOpts()),
1142 Encoding(Encoding) {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001143 Lex.SetKeepWhitespaceMode(true);
1144 }
1145
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001146 ArrayRef<FormatToken *> lex() {
1147 assert(Tokens.empty());
1148 do {
1149 Tokens.push_back(getNextToken());
1150 } while (Tokens.back()->Tok.isNot(tok::eof));
1151 return Tokens;
1152 }
1153
1154 IdentifierTable &getIdentTable() { return IdentTable; }
1155
1156private:
1157 FormatToken *getNextToken() {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001158 if (GreaterStashed) {
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001159 // Create a synthesized second '>' token.
1160 Token Greater = FormatTok->Tok;
1161 FormatTok = new (Allocator.Allocate()) FormatToken;
1162 FormatTok->Tok = Greater;
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001163 SourceLocation GreaterLocation =
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001164 FormatTok->Tok.getLocation().getLocWithOffset(1);
1165 FormatTok->WhitespaceRange =
1166 SourceRange(GreaterLocation, GreaterLocation);
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001167 FormatTok->TokenText = ">";
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001168 FormatTok->CodePointCount = 1;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001169 GreaterStashed = false;
1170 return FormatTok;
1171 }
1172
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001173 FormatTok = new (Allocator.Allocate()) FormatToken;
1174 Lex.LexFromRawLexer(FormatTok->Tok);
1175 StringRef Text = rawTokenText(FormatTok->Tok);
Manuel Klimek9043c742013-05-27 15:23:34 +00001176 SourceLocation WhitespaceStart =
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001177 FormatTok->Tok.getLocation().getLocWithOffset(-TrailingWhitespace);
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001178 if (SourceMgr.getFileOffset(WhitespaceStart) == 0)
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001179 FormatTok->IsFirst = true;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001180
1181 // Consume and record whitespace until we find a significant token.
Manuel Klimek9043c742013-05-27 15:23:34 +00001182 unsigned WhitespaceLength = TrailingWhitespace;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001183 while (FormatTok->Tok.is(tok::unknown)) {
Manuel Klimek0c137952013-02-11 12:33:24 +00001184 unsigned Newlines = Text.count('\n');
Daniel Jasper973c9422013-03-04 13:43:19 +00001185 if (Newlines > 0)
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001186 FormatTok->LastNewlineOffset = WhitespaceLength + Text.rfind('\n') + 1;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001187 FormatTok->NewlinesBefore += Newlines;
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001188 unsigned EscapedNewlines = Text.count("\\\n");
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001189 FormatTok->HasUnescapedNewline |= EscapedNewlines != Newlines;
1190 WhitespaceLength += FormatTok->Tok.getLength();
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001191
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001192 Lex.LexFromRawLexer(FormatTok->Tok);
1193 Text = rawTokenText(FormatTok->Tok);
Manuel Klimek1abf7892013-01-04 23:34:14 +00001194 }
Manuel Klimekef920692013-01-07 07:56:50 +00001195
Manuel Klimek1abf7892013-01-04 23:34:14 +00001196 // In case the token starts with escaped newlines, we want to
1197 // take them into account as whitespace - this pattern is quite frequent
1198 // in macro definitions.
1199 // FIXME: What do we want to do with other escaped spaces, and escaped
1200 // spaces or newlines in the middle of tokens?
1201 // FIXME: Add a more explicit test.
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001202 while (Text.size() > 1 && Text[0] == '\\' && Text[1] == '\n') {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001203 // FIXME: ++FormatTok->NewlinesBefore is missing...
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001204 WhitespaceLength += 2;
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001205 Text = Text.substr(2);
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001206 }
1207
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001208 TrailingWhitespace = 0;
1209 if (FormatTok->Tok.is(tok::comment)) {
1210 StringRef UntrimmedText = Text;
1211 Text = Text.rtrim();
1212 TrailingWhitespace = UntrimmedText.size() - Text.size();
1213 } else if (FormatTok->Tok.is(tok::raw_identifier)) {
Manuel Klimek1abf7892013-01-04 23:34:14 +00001214 IdentifierInfo &Info = IdentTable.get(Text);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001215 FormatTok->Tok.setIdentifierInfo(&Info);
1216 FormatTok->Tok.setKind(Info.getTokenID());
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001217 } else if (FormatTok->Tok.is(tok::greatergreater)) {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001218 FormatTok->Tok.setKind(tok::greater);
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001219 Text = Text.substr(0, 1);
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001220 GreaterStashed = true;
1221 }
1222
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001223 // Now FormatTok is the next non-whitespace token.
1224 FormatTok->TokenText = Text;
1225 FormatTok->CodePointCount = encoding::getCodePointCount(Text, Encoding);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001226
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001227 FormatTok->WhitespaceRange = SourceRange(
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001228 WhitespaceStart, WhitespaceStart.getLocWithOffset(WhitespaceLength));
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001229 return FormatTok;
1230 }
1231
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001232 FormatToken *FormatTok;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001233 bool GreaterStashed;
Manuel Klimek9043c742013-05-27 15:23:34 +00001234 unsigned TrailingWhitespace;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001235 Lexer &Lex;
1236 SourceManager &SourceMgr;
1237 IdentifierTable IdentTable;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001238 encoding::Encoding Encoding;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001239 llvm::SpecificBumpPtrAllocator<FormatToken> Allocator;
1240 SmallVector<FormatToken *, 16> Tokens;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001241
1242 /// Returns the text of \c FormatTok.
Manuel Klimekef920692013-01-07 07:56:50 +00001243 StringRef rawTokenText(Token &Tok) {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001244 return StringRef(SourceMgr.getCharacterData(Tok.getLocation()),
1245 Tok.getLength());
1246 }
1247};
1248
Daniel Jasperf7935112012-12-03 18:12:45 +00001249class Formatter : public UnwrappedLineConsumer {
1250public:
Daniel Jasperd2ae41a2013-05-15 08:14:19 +00001251 Formatter(const FormatStyle &Style, Lexer &Lex, SourceManager &SourceMgr,
Daniel Jasperf7935112012-12-03 18:12:45 +00001252 const std::vector<CharSourceRange> &Ranges)
Daniel Jasperd2ae41a2013-05-15 08:14:19 +00001253 : Style(Style), Lex(Lex), SourceMgr(SourceMgr),
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001254 Whitespaces(SourceMgr, Style), Ranges(Ranges),
1255 Encoding(encoding::detectEncoding(Lex.getBuffer())) {
1256 DEBUG(llvm::dbgs()
1257 << "File encoding: "
1258 << (Encoding == encoding::Encoding_UTF8 ? "UTF8" : "unknown")
1259 << "\n");
1260 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001261
Daniel Jasperfd8c4b12013-01-11 14:23:32 +00001262 virtual ~Formatter() {}
Daniel Jasper61bd3a12012-12-04 21:05:31 +00001263
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001264 tooling::Replacements format() {
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001265 FormatTokenLexer Tokens(Lex, SourceMgr, Encoding);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001266
1267 UnwrappedLineParser Parser(Style, Tokens.lex(), *this);
Manuel Klimek1a18c402013-04-12 14:13:36 +00001268 bool StructuralError = Parser.parse();
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001269 TokenAnnotator Annotator(Style, Tokens.getIdentTable().get("in"));
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001270 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1271 Annotator.annotate(AnnotatedLines[i]);
1272 }
1273 deriveLocalStyle();
1274 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1275 Annotator.calculateFormattingInformation(AnnotatedLines[i]);
1276 }
Daniel Jasperb67cc422013-04-09 17:46:55 +00001277
1278 // Adapt level to the next line if this is a comment.
1279 // FIXME: Can/should this be done in the UnwrappedLineParser?
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001280 const AnnotatedLine *NextNonCommentLine = NULL;
Daniel Jasperb67cc422013-04-09 17:46:55 +00001281 for (unsigned i = AnnotatedLines.size() - 1; i > 0; --i) {
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001282 if (NextNonCommentLine && AnnotatedLines[i].First->is(tok::comment) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001283 !AnnotatedLines[i].First->Next)
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001284 AnnotatedLines[i].Level = NextNonCommentLine->Level;
Daniel Jasperb67cc422013-04-09 17:46:55 +00001285 else
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001286 NextNonCommentLine =
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001287 AnnotatedLines[i].First->isNot(tok::r_brace) ? &AnnotatedLines[i]
1288 : NULL;
Daniel Jasperb67cc422013-04-09 17:46:55 +00001289 }
1290
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001291 std::vector<int> IndentForLevel;
1292 bool PreviousLineWasTouched = false;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001293 const FormatToken *PreviousLineLastToken = 0;
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001294 bool FormatPPDirective = false;
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001295 for (std::vector<AnnotatedLine>::iterator I = AnnotatedLines.begin(),
1296 E = AnnotatedLines.end();
1297 I != E; ++I) {
1298 const AnnotatedLine &TheLine = *I;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001299 const FormatToken *FirstTok = TheLine.First;
1300 int Offset = getIndentOffset(*TheLine.First);
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001301
1302 // Check whether this line is part of a formatted preprocessor directive.
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001303 if (FirstTok->HasUnescapedNewline)
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001304 FormatPPDirective = false;
1305 if (!FormatPPDirective && TheLine.InPPDirective &&
1306 (touchesLine(TheLine) || touchesPPDirective(I + 1, E)))
1307 FormatPPDirective = true;
1308
Daniel Jasper12f9d8e2013-05-14 09:30:02 +00001309 // Determine indent and try to merge multiple unwrapped lines.
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001310 while (IndentForLevel.size() <= TheLine.Level)
1311 IndentForLevel.push_back(-1);
1312 IndentForLevel.resize(TheLine.Level + 1);
Daniel Jasper12f9d8e2013-05-14 09:30:02 +00001313 unsigned Indent = getIndent(IndentForLevel, TheLine.Level);
1314 if (static_cast<int>(Indent) + Offset >= 0)
1315 Indent += Offset;
1316 tryFitMultipleLinesInOne(Indent, I, E);
1317
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001318 bool WasMoved = PreviousLineWasTouched && FirstTok->NewlinesBefore == 0;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001319 if (TheLine.First->is(tok::eof)) {
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001320 if (PreviousLineWasTouched) {
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001321 unsigned NewLines = std::min(FirstTok->NewlinesBefore, 1u);
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001322 Whitespaces.replaceWhitespace(*TheLine.First, NewLines, /*Indent*/ 0,
Manuel Klimek4fe43002013-05-22 12:51:29 +00001323 /*TargetColumn*/ 0);
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001324 }
1325 } else if (TheLine.Type != LT_Invalid &&
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001326 (WasMoved || FormatPPDirective || touchesLine(TheLine))) {
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001327 unsigned LevelIndent = getIndent(IndentForLevel, TheLine.Level);
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001328 if (FirstTok->WhitespaceRange.isValid() &&
Manuel Klimek1a18c402013-04-12 14:13:36 +00001329 // Insert a break even if there is a structural error in case where
1330 // we break apart a line consisting of multiple unwrapped lines.
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001331 (FirstTok->NewlinesBefore == 0 || !StructuralError)) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001332 formatFirstToken(*TheLine.First, PreviousLineLastToken, Indent,
Manuel Klimek4fe43002013-05-22 12:51:29 +00001333 TheLine.InPPDirective);
Manuel Klimek1a18c402013-04-12 14:13:36 +00001334 } else {
1335 Indent = LevelIndent =
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001336 SourceMgr.getSpellingColumnNumber(FirstTok->Tok.getLocation()) -
1337 1;
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001338 }
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001339 UnwrappedLineFormatter Formatter(Style, SourceMgr, TheLine, Indent,
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001340 TheLine.First, Whitespaces, Encoding);
Manuel Klimek4fe43002013-05-22 12:51:29 +00001341 Formatter.format(I + 1 != E ? &*(I + 1) : NULL);
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001342 IndentForLevel[TheLine.Level] = LevelIndent;
1343 PreviousLineWasTouched = true;
1344 } else {
Manuel Klimek4fe43002013-05-22 12:51:29 +00001345 // Format the first token if necessary, and notify the WhitespaceManager
1346 // about the unchanged whitespace.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001347 for (const FormatToken *Tok = TheLine.First; Tok != NULL;
1348 Tok = Tok->Next) {
1349 if (Tok == TheLine.First &&
1350 (Tok->NewlinesBefore > 0 || Tok->IsFirst)) {
1351 unsigned LevelIndent =
1352 SourceMgr.getSpellingColumnNumber(Tok->Tok.getLocation()) - 1;
Manuel Klimek4fe43002013-05-22 12:51:29 +00001353 // Remove trailing whitespace of the previous line if it was
1354 // touched.
1355 if (PreviousLineWasTouched || touchesEmptyLineBefore(TheLine)) {
1356 formatFirstToken(*Tok, PreviousLineLastToken, LevelIndent,
1357 TheLine.InPPDirective);
1358 } else {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001359 Whitespaces.addUntouchableToken(*Tok, TheLine.InPPDirective);
Manuel Klimek4fe43002013-05-22 12:51:29 +00001360 }
Daniel Jasper12f9d8e2013-05-14 09:30:02 +00001361
Manuel Klimek4fe43002013-05-22 12:51:29 +00001362 if (static_cast<int>(LevelIndent) - Offset >= 0)
1363 LevelIndent -= Offset;
1364 if (Tok->isNot(tok::comment))
1365 IndentForLevel[TheLine.Level] = LevelIndent;
1366 } else {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001367 Whitespaces.addUntouchableToken(*Tok, TheLine.InPPDirective);
Manuel Klimek4fe43002013-05-22 12:51:29 +00001368 }
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001369 }
1370 // If we did not reformat this unwrapped line, the column at the end of
1371 // the last token is unchanged - thus, we can calculate the end of the
1372 // last token.
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001373 PreviousLineWasTouched = false;
1374 }
Alexander Kornienkofd433362013-03-27 17:08:02 +00001375 PreviousLineLastToken = I->Last;
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001376 }
1377 return Whitespaces.generateReplacements();
1378 }
1379
1380private:
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001381 void deriveLocalStyle() {
1382 unsigned CountBoundToVariable = 0;
1383 unsigned CountBoundToType = 0;
1384 bool HasCpp03IncompatibleFormat = false;
1385 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001386 if (!AnnotatedLines[i].First->Next)
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001387 continue;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001388 FormatToken *Tok = AnnotatedLines[i].First->Next;
1389 while (Tok->Next) {
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001390 if (Tok->Type == TT_PointerOrReference) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001391 bool SpacesBefore =
1392 Tok->WhitespaceRange.getBegin() != Tok->WhitespaceRange.getEnd();
1393 bool SpacesAfter = Tok->Next->WhitespaceRange.getBegin() !=
1394 Tok->Next->WhitespaceRange.getEnd();
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001395 if (SpacesBefore && !SpacesAfter)
1396 ++CountBoundToVariable;
1397 else if (!SpacesBefore && SpacesAfter)
1398 ++CountBoundToType;
1399 }
1400
Daniel Jasper400adc62013-02-08 15:28:42 +00001401 if (Tok->Type == TT_TemplateCloser &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001402 Tok->Previous->Type == TT_TemplateCloser &&
1403 Tok->WhitespaceRange.getBegin() == Tok->WhitespaceRange.getEnd())
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001404 HasCpp03IncompatibleFormat = true;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001405 Tok = Tok->Next;
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001406 }
1407 }
1408 if (Style.DerivePointerBinding) {
1409 if (CountBoundToType > CountBoundToVariable)
1410 Style.PointerBindsToType = true;
1411 else if (CountBoundToType < CountBoundToVariable)
1412 Style.PointerBindsToType = false;
1413 }
1414 if (Style.Standard == FormatStyle::LS_Auto) {
1415 Style.Standard = HasCpp03IncompatibleFormat ? FormatStyle::LS_Cpp11
1416 : FormatStyle::LS_Cpp03;
1417 }
1418 }
1419
Manuel Klimekb95f5452013-02-08 17:38:27 +00001420 /// \brief Get the indent of \p Level from \p IndentForLevel.
1421 ///
1422 /// \p IndentForLevel must contain the indent for the level \c l
1423 /// at \p IndentForLevel[l], or a value < 0 if the indent for
1424 /// that level is unknown.
Daniel Jasper687af3b2013-02-14 14:26:07 +00001425 unsigned getIndent(const std::vector<int> IndentForLevel, unsigned Level) {
Manuel Klimekb95f5452013-02-08 17:38:27 +00001426 if (IndentForLevel[Level] != -1)
1427 return IndentForLevel[Level];
Manuel Klimekd076dcd2013-02-08 19:53:32 +00001428 if (Level == 0)
1429 return 0;
Manuel Klimek13b97d82013-05-13 08:42:42 +00001430 return getIndent(IndentForLevel, Level - 1) + Style.IndentWidth;
Manuel Klimekb95f5452013-02-08 17:38:27 +00001431 }
1432
1433 /// \brief Get the offset of the line relatively to the level.
1434 ///
1435 /// For example, 'public:' labels in classes are offset by 1 or 2
1436 /// characters to the left from their level.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001437 int getIndentOffset(const FormatToken &RootToken) {
Alexander Kornienkofd433362013-03-27 17:08:02 +00001438 if (RootToken.isAccessSpecifier(false) || RootToken.isObjCAccessSpecifier())
Manuel Klimekb95f5452013-02-08 17:38:27 +00001439 return Style.AccessModifierOffset;
1440 return 0;
1441 }
1442
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001443 /// \brief Tries to merge lines into one.
1444 ///
1445 /// This will change \c Line and \c AnnotatedLine to contain the merged line,
1446 /// if possible; note that \c I will be incremented when lines are merged.
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001447 void tryFitMultipleLinesInOne(unsigned Indent,
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001448 std::vector<AnnotatedLine>::iterator &I,
1449 std::vector<AnnotatedLine>::iterator E) {
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001450 // We can never merge stuff if there are trailing line comments.
1451 if (I->Last->Type == TT_LineComment)
1452 return;
1453
Daniel Jasperc22f5b42013-02-28 11:05:57 +00001454 unsigned Limit = Style.ColumnLimit - Indent;
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001455 // If we already exceed the column limit, we set 'Limit' to 0. The different
1456 // tryMerge..() functions can then decide whether to still do merging.
1457 Limit = I->Last->TotalLength > Limit ? 0 : Limit - I->Last->TotalLength;
Daniel Jasperc36492b2013-01-16 07:02:34 +00001458
Daniel Jasperd41ee2d2013-01-21 14:18:28 +00001459 if (I + 1 == E || (I + 1)->Type == LT_Invalid)
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001460 return;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001461
Daniel Jasperabca58c2013-05-15 14:09:55 +00001462 if (I->Last->is(tok::l_brace)) {
Daniel Jasper25837aa2013-01-14 14:14:23 +00001463 tryMergeSimpleBlock(I, E, Limit);
Daniel Jasper3a685df2013-05-16 12:12:21 +00001464 } else if (Style.AllowShortIfStatementsOnASingleLine &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001465 I->First->is(tok::kw_if)) {
Daniel Jasper3a685df2013-05-16 12:12:21 +00001466 tryMergeSimpleControlStatement(I, E, Limit);
1467 } else if (Style.AllowShortLoopsOnASingleLine &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001468 I->First->isOneOf(tok::kw_for, tok::kw_while)) {
Daniel Jasper3a685df2013-05-16 12:12:21 +00001469 tryMergeSimpleControlStatement(I, E, Limit);
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001470 } else if (I->InPPDirective &&
1471 (I->First->HasUnescapedNewline || I->First->IsFirst)) {
Daniel Jasper39825ea2013-01-14 15:40:57 +00001472 tryMergeSimplePPDirective(I, E, Limit);
Daniel Jasper25837aa2013-01-14 14:14:23 +00001473 }
Daniel Jasper25837aa2013-01-14 14:14:23 +00001474 }
1475
Daniel Jasper39825ea2013-01-14 15:40:57 +00001476 void tryMergeSimplePPDirective(std::vector<AnnotatedLine>::iterator &I,
1477 std::vector<AnnotatedLine>::iterator E,
1478 unsigned Limit) {
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001479 if (Limit == 0)
1480 return;
Daniel Jasper39825ea2013-01-14 15:40:57 +00001481 AnnotatedLine &Line = *I;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001482 if (!(I + 1)->InPPDirective || (I + 1)->First->HasUnescapedNewline)
Daniel Jasper2ab0d012013-01-14 15:52:06 +00001483 return;
Daniel Jasper39825ea2013-01-14 15:40:57 +00001484 if (I + 2 != E && (I + 2)->InPPDirective &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001485 !(I + 2)->First->HasUnescapedNewline)
Daniel Jasper39825ea2013-01-14 15:40:57 +00001486 return;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001487 if (1 + (I + 1)->Last->TotalLength > Limit)
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001488 return;
Daniel Jasper39825ea2013-01-14 15:40:57 +00001489 join(Line, *(++I));
1490 }
1491
Daniel Jasper3a685df2013-05-16 12:12:21 +00001492 void tryMergeSimpleControlStatement(std::vector<AnnotatedLine>::iterator &I,
1493 std::vector<AnnotatedLine>::iterator E,
1494 unsigned Limit) {
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001495 if (Limit == 0)
1496 return;
Manuel Klimekda087612013-01-18 14:46:43 +00001497 if ((I + 1)->InPPDirective != I->InPPDirective ||
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001498 ((I + 1)->InPPDirective && (I + 1)->First->HasUnescapedNewline))
Manuel Klimekda087612013-01-18 14:46:43 +00001499 return;
Daniel Jasper25837aa2013-01-14 14:14:23 +00001500 AnnotatedLine &Line = *I;
Daniel Jasperc36492b2013-01-16 07:02:34 +00001501 if (Line.Last->isNot(tok::r_paren))
1502 return;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001503 if (1 + (I + 1)->Last->TotalLength > Limit)
Daniel Jasper25837aa2013-01-14 14:14:23 +00001504 return;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001505 if ((I + 1)->First->isOneOf(tok::semi, tok::kw_if, tok::kw_for,
1506 tok::kw_while) ||
1507 (I + 1)->First->Type == TT_LineComment)
Daniel Jasper25837aa2013-01-14 14:14:23 +00001508 return;
1509 // Only inline simple if's (no nested if or else).
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001510 if (I + 2 != E && Line.First->is(tok::kw_if) &&
1511 (I + 2)->First->is(tok::kw_else))
Daniel Jasper25837aa2013-01-14 14:14:23 +00001512 return;
1513 join(Line, *(++I));
1514 }
1515
1516 void tryMergeSimpleBlock(std::vector<AnnotatedLine>::iterator &I,
Daniel Jasperbbc84152013-01-29 11:27:30 +00001517 std::vector<AnnotatedLine>::iterator E,
1518 unsigned Limit) {
Daniel Jasperabca58c2013-05-15 14:09:55 +00001519 // No merging if the brace already is on the next line.
1520 if (Style.BreakBeforeBraces != FormatStyle::BS_Attach)
1521 return;
1522
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001523 // First, check that the current line allows merging. This is the case if
1524 // we're not in a control flow statement and the last token is an opening
1525 // brace.
Daniel Jasper25837aa2013-01-14 14:14:23 +00001526 AnnotatedLine &Line = *I;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001527 if (Line.First->isOneOf(tok::kw_if, tok::kw_while, tok::kw_do, tok::r_brace,
1528 tok::kw_else, tok::kw_try, tok::kw_catch,
Daniel Jaspera9eb2aa2013-05-31 14:56:20 +00001529 tok::kw_for,
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001530 // This gets rid of all ObjC @ keywords and methods.
1531 tok::at, tok::minus, tok::plus))
Daniel Jasper25837aa2013-01-14 14:14:23 +00001532 return;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001533
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001534 FormatToken *Tok = (I + 1)->First;
Daniel Jaspera9eb2aa2013-05-31 14:56:20 +00001535 if (Tok->is(tok::r_brace) && !Tok->MustBreakBefore &&
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001536 (Tok->getNextNonComment() == NULL ||
1537 Tok->getNextNonComment()->is(tok::semi))) {
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001538 // We merge empty blocks even if the line exceeds the column limit.
Daniel Jaspereef30492013-02-11 12:36:37 +00001539 Tok->SpacesRequiredBefore = 0;
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001540 Tok->CanBreakBefore = true;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001541 join(Line, *(I + 1));
1542 I += 1;
Daniel Jaspera9eb2aa2013-05-31 14:56:20 +00001543 } else if (Limit != 0 && Line.First->isNot(tok::kw_namespace)) {
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001544 // Check that we still have three lines and they fit into the limit.
1545 if (I + 2 == E || (I + 2)->Type == LT_Invalid ||
1546 !nextTwoLinesFitInto(I, Limit))
Daniel Jasper25837aa2013-01-14 14:14:23 +00001547 return;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001548
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001549 // Second, check that the next line does not contain any braces - if it
1550 // does, readability declines when putting it into a single line.
1551 if ((I + 1)->Last->Type == TT_LineComment || Tok->MustBreakBefore)
1552 return;
1553 do {
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001554 if (Tok->isOneOf(tok::l_brace, tok::r_brace))
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001555 return;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001556 Tok = Tok->Next;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001557 } while (Tok != NULL);
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001558
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001559 // Last, check that the third line contains a single closing brace.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001560 Tok = (I + 2)->First;
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001561 if (Tok->getNextNonComment() != NULL || Tok->isNot(tok::r_brace) ||
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001562 Tok->MustBreakBefore)
1563 return;
1564
1565 join(Line, *(I + 1));
1566 join(Line, *(I + 2));
1567 I += 2;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001568 }
Daniel Jasper25837aa2013-01-14 14:14:23 +00001569 }
1570
1571 bool nextTwoLinesFitInto(std::vector<AnnotatedLine>::iterator I,
1572 unsigned Limit) {
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001573 return 1 + (I + 1)->Last->TotalLength + 1 + (I + 2)->Last->TotalLength <=
1574 Limit;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001575 }
1576
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001577 void join(AnnotatedLine &A, const AnnotatedLine &B) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001578 assert(!A.Last->Next);
1579 assert(!B.First->Previous);
1580 A.Last->Next = B.First;
1581 B.First->Previous = A.Last;
1582 unsigned LengthA = A.Last->TotalLength + B.First->SpacesRequiredBefore;
1583 for (FormatToken *Tok = B.First; Tok; Tok = Tok->Next) {
1584 Tok->TotalLength += LengthA;
1585 A.Last = Tok;
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001586 }
Manuel Klimek51bd6ec2013-01-10 19:49:59 +00001587 }
1588
Daniel Jasper97b89482013-03-13 07:49:51 +00001589 bool touchesRanges(const CharSourceRange &Range) {
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001590 for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
1591 if (!SourceMgr.isBeforeInTranslationUnit(Range.getEnd(),
1592 Ranges[i].getBegin()) &&
1593 !SourceMgr.isBeforeInTranslationUnit(Ranges[i].getEnd(),
1594 Range.getBegin()))
1595 return true;
1596 }
1597 return false;
1598 }
1599
1600 bool touchesLine(const AnnotatedLine &TheLine) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001601 const FormatToken *First = TheLine.First;
1602 const FormatToken *Last = TheLine.Last;
Daniel Jaspercdd06622013-05-14 10:31:09 +00001603 CharSourceRange LineRange = CharSourceRange::getCharRange(
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001604 First->WhitespaceRange.getBegin().getLocWithOffset(
1605 First->LastNewlineOffset),
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001606 Last->Tok.getLocation().getLocWithOffset(Last->TokenText.size() - 1));
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001607 return touchesRanges(LineRange);
1608 }
1609
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001610 bool touchesPPDirective(std::vector<AnnotatedLine>::iterator I,
1611 std::vector<AnnotatedLine>::iterator E) {
1612 for (; I != E; ++I) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001613 if (I->First->HasUnescapedNewline)
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001614 return false;
1615 if (touchesLine(*I))
1616 return true;
1617 }
1618 return false;
1619 }
1620
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001621 bool touchesEmptyLineBefore(const AnnotatedLine &TheLine) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001622 const FormatToken *First = TheLine.First;
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001623 CharSourceRange LineRange = CharSourceRange::getCharRange(
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001624 First->WhitespaceRange.getBegin(),
1625 First->WhitespaceRange.getBegin().getLocWithOffset(
1626 First->LastNewlineOffset));
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001627 return touchesRanges(LineRange);
Manuel Klimek51bd6ec2013-01-10 19:49:59 +00001628 }
1629
1630 virtual void consumeUnwrappedLine(const UnwrappedLine &TheLine) {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00001631 AnnotatedLines.push_back(AnnotatedLine(TheLine));
Daniel Jasperf7935112012-12-03 18:12:45 +00001632 }
1633
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001634 /// \brief Add a new line and the required indent before the first Token
1635 /// of the \c UnwrappedLine if there was no structural parsing error.
1636 /// Returns the indent level of the \c UnwrappedLine.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001637 void formatFirstToken(const FormatToken &RootToken,
1638 const FormatToken *PreviousToken, unsigned Indent,
Manuel Klimek4fe43002013-05-22 12:51:29 +00001639 bool InPPDirective) {
Daniel Jasperbbc84152013-01-29 11:27:30 +00001640 unsigned Newlines =
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001641 std::min(RootToken.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1);
Daniel Jasper1027c6e2013-06-03 16:16:41 +00001642 // Remove empty lines before "}" where applicable.
1643 if (RootToken.is(tok::r_brace) &&
1644 (!RootToken.Next ||
1645 (RootToken.Next->is(tok::semi) && !RootToken.Next->Next)))
1646 Newlines = std::min(Newlines, 1u);
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001647 if (Newlines == 0 && !RootToken.IsFirst)
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001648 Newlines = 1;
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001649
Manuel Klimek4fe43002013-05-22 12:51:29 +00001650 // Insert extra new line before access specifiers.
1651 if (PreviousToken && PreviousToken->isOneOf(tok::semi, tok::r_brace) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001652 RootToken.isAccessSpecifier() && RootToken.NewlinesBefore == 1)
Manuel Klimek4fe43002013-05-22 12:51:29 +00001653 ++Newlines;
Alexander Kornienkofd433362013-03-27 17:08:02 +00001654
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001655 Whitespaces.replaceWhitespace(
1656 RootToken, Newlines, Indent, Indent,
1657 InPPDirective && !RootToken.HasUnescapedNewline);
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001658 }
1659
Daniel Jasperf7935112012-12-03 18:12:45 +00001660 FormatStyle Style;
1661 Lexer &Lex;
1662 SourceManager &SourceMgr;
Daniel Jasperaa701fa2013-01-18 08:44:07 +00001663 WhitespaceManager Whitespaces;
Daniel Jasperf7935112012-12-03 18:12:45 +00001664 std::vector<CharSourceRange> Ranges;
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001665 std::vector<AnnotatedLine> AnnotatedLines;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001666
1667 encoding::Encoding Encoding;
Daniel Jasperf7935112012-12-03 18:12:45 +00001668};
1669
Craig Topperaf35e852013-06-30 22:29:28 +00001670} // end anonymous namespace
1671
Alexander Kornienkocb45bc12013-04-15 14:28:00 +00001672tooling::Replacements reformat(const FormatStyle &Style, Lexer &Lex,
1673 SourceManager &SourceMgr,
Daniel Jasperd2ae41a2013-05-15 08:14:19 +00001674 std::vector<CharSourceRange> Ranges) {
1675 Formatter formatter(Style, Lex, SourceMgr, Ranges);
Daniel Jasperf7935112012-12-03 18:12:45 +00001676 return formatter.format();
1677}
1678
Daniel Jasperec04c0d2013-05-16 10:40:07 +00001679tooling::Replacements reformat(const FormatStyle &Style, StringRef Code,
1680 std::vector<tooling::Range> Ranges,
1681 StringRef FileName) {
1682 FileManager Files((FileSystemOptions()));
1683 DiagnosticsEngine Diagnostics(
1684 IntrusiveRefCntPtr<DiagnosticIDs>(new DiagnosticIDs),
1685 new DiagnosticOptions);
1686 SourceManager SourceMgr(Diagnostics, Files);
1687 llvm::MemoryBuffer *Buf = llvm::MemoryBuffer::getMemBuffer(Code, FileName);
1688 const clang::FileEntry *Entry =
1689 Files.getVirtualFile(FileName, Buf->getBufferSize(), 0);
1690 SourceMgr.overrideFileContents(Entry, Buf);
1691 FileID ID =
1692 SourceMgr.createFileID(Entry, SourceLocation(), clang::SrcMgr::C_User);
Alexander Kornienko1e808872013-06-28 12:51:24 +00001693 Lexer Lex(ID, SourceMgr.getBuffer(ID), SourceMgr,
1694 getFormattingLangOpts(Style.Standard));
Daniel Jasperec04c0d2013-05-16 10:40:07 +00001695 SourceLocation StartOfFile = SourceMgr.getLocForStartOfFile(ID);
1696 std::vector<CharSourceRange> CharRanges;
1697 for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
1698 SourceLocation Start = StartOfFile.getLocWithOffset(Ranges[i].getOffset());
1699 SourceLocation End = Start.getLocWithOffset(Ranges[i].getLength());
1700 CharRanges.push_back(CharSourceRange::getCharRange(Start, End));
1701 }
1702 return reformat(Style, Lex, SourceMgr, CharRanges);
1703}
1704
Alexander Kornienko1e808872013-06-28 12:51:24 +00001705LangOptions getFormattingLangOpts(FormatStyle::LanguageStandard Standard) {
Daniel Jasperc1fa2812013-01-10 13:08:12 +00001706 LangOptions LangOpts;
1707 LangOpts.CPlusPlus = 1;
Alexander Kornienko1e808872013-06-28 12:51:24 +00001708 LangOpts.CPlusPlus11 = Standard == FormatStyle::LS_Cpp03 ? 0 : 1;
Daniel Jasper55213652013-03-22 10:01:29 +00001709 LangOpts.LineComment = 1;
Daniel Jasperc1fa2812013-01-10 13:08:12 +00001710 LangOpts.Bool = 1;
1711 LangOpts.ObjC1 = 1;
1712 LangOpts.ObjC2 = 1;
1713 return LangOpts;
1714}
1715
Daniel Jasper8d1832e2013-01-07 13:26:07 +00001716} // namespace format
1717} // namespace clang