blob: e5a8ad383b36bef9b4d9d50bf8927913bfddf6f6 [file] [log] [blame]
Daniel Jasperf7935112012-12-03 18:12:45 +00001//===--- Format.cpp - Format C++ code -------------------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements functions declared in Format.h. This will be
12/// split into separate files as we go.
13///
Daniel Jasperf7935112012-12-03 18:12:45 +000014//===----------------------------------------------------------------------===//
15
Manuel Klimek24998102013-01-16 14:55:28 +000016#define DEBUG_TYPE "format-formatter"
17
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000018#include "BreakableToken.h"
Daniel Jasper7a6d09b2013-01-29 21:01:14 +000019#include "TokenAnnotator.h"
Chandler Carruth3a022472012-12-04 09:13:33 +000020#include "UnwrappedLineParser.h"
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000021#include "WhitespaceManager.h"
Daniel Jasperec04c0d2013-05-16 10:40:07 +000022#include "clang/Basic/Diagnostic.h"
Daniel Jasperab7654e2012-12-21 10:20:02 +000023#include "clang/Basic/OperatorPrecedence.h"
Chandler Carruth44eb4f62013-01-02 10:28:36 +000024#include "clang/Basic/SourceManager.h"
Manuel Klimek24998102013-01-16 14:55:28 +000025#include "clang/Format/Format.h"
Daniel Jasperf7935112012-12-03 18:12:45 +000026#include "clang/Lex/Lexer.h"
Alexander Kornienkoffd6d042013-03-27 11:52:18 +000027#include "llvm/ADT/STLExtras.h"
Manuel Klimek2ef908e2013-02-13 10:46:36 +000028#include "llvm/Support/Allocator.h"
Manuel Klimek24998102013-01-16 14:55:28 +000029#include "llvm/Support/Debug.h"
Alexander Kornienkod6538332013-05-07 15:32:14 +000030#include "llvm/Support/YAMLTraits.h"
Manuel Klimek2ef908e2013-02-13 10:46:36 +000031#include <queue>
Daniel Jasper8b529712012-12-04 13:02:32 +000032#include <string>
33
Alexander Kornienkod6538332013-05-07 15:32:14 +000034namespace llvm {
35namespace yaml {
36template <>
37struct ScalarEnumerationTraits<clang::format::FormatStyle::LanguageStandard> {
Manuel Klimeka8eb9142013-05-13 12:51:40 +000038 static void enumeration(IO &IO,
39 clang::format::FormatStyle::LanguageStandard &Value) {
40 IO.enumCase(Value, "C++03", clang::format::FormatStyle::LS_Cpp03);
41 IO.enumCase(Value, "C++11", clang::format::FormatStyle::LS_Cpp11);
42 IO.enumCase(Value, "Auto", clang::format::FormatStyle::LS_Auto);
43 }
44};
45
Daniel Jasper12f9d8e2013-05-14 09:30:02 +000046template <>
Manuel Klimeka8eb9142013-05-13 12:51:40 +000047struct ScalarEnumerationTraits<clang::format::FormatStyle::BraceBreakingStyle> {
48 static void
49 enumeration(IO &IO, clang::format::FormatStyle::BraceBreakingStyle &Value) {
50 IO.enumCase(Value, "Attach", clang::format::FormatStyle::BS_Attach);
51 IO.enumCase(Value, "Linux", clang::format::FormatStyle::BS_Linux);
52 IO.enumCase(Value, "Stroustrup", clang::format::FormatStyle::BS_Stroustrup);
Alexander Kornienkod6538332013-05-07 15:32:14 +000053 }
54};
55
56template <> struct MappingTraits<clang::format::FormatStyle> {
57 static void mapping(llvm::yaml::IO &IO, clang::format::FormatStyle &Style) {
Alexander Kornienko49149672013-05-10 11:56:10 +000058 if (IO.outputting()) {
59 StringRef StylesArray[] = { "LLVM", "Google", "Chromium", "Mozilla" };
60 ArrayRef<StringRef> Styles(StylesArray);
61 for (size_t i = 0, e = Styles.size(); i < e; ++i) {
62 StringRef StyleName(Styles[i]);
Alexander Kornienko006b5c82013-05-19 00:53:30 +000063 clang::format::FormatStyle PredefinedStyle;
64 if (clang::format::getPredefinedStyle(StyleName, &PredefinedStyle) &&
65 Style == PredefinedStyle) {
Alexander Kornienko49149672013-05-10 11:56:10 +000066 IO.mapOptional("# BasedOnStyle", StyleName);
67 break;
68 }
69 }
70 } else {
Alexander Kornienkod6538332013-05-07 15:32:14 +000071 StringRef BasedOnStyle;
72 IO.mapOptional("BasedOnStyle", BasedOnStyle);
Alexander Kornienkod6538332013-05-07 15:32:14 +000073 if (!BasedOnStyle.empty())
Alexander Kornienko006b5c82013-05-19 00:53:30 +000074 if (!clang::format::getPredefinedStyle(BasedOnStyle, &Style)) {
75 IO.setError(Twine("Unknown value for BasedOnStyle: ", BasedOnStyle));
76 return;
77 }
Alexander Kornienkod6538332013-05-07 15:32:14 +000078 }
79
80 IO.mapOptional("AccessModifierOffset", Style.AccessModifierOffset);
81 IO.mapOptional("AlignEscapedNewlinesLeft", Style.AlignEscapedNewlinesLeft);
82 IO.mapOptional("AllowAllParametersOfDeclarationOnNextLine",
83 Style.AllowAllParametersOfDeclarationOnNextLine);
84 IO.mapOptional("AllowShortIfStatementsOnASingleLine",
85 Style.AllowShortIfStatementsOnASingleLine);
Daniel Jasper3a685df2013-05-16 12:12:21 +000086 IO.mapOptional("AllowShortLoopsOnASingleLine",
87 Style.AllowShortLoopsOnASingleLine);
Daniel Jasper61e6bbf2013-05-29 12:07:31 +000088 IO.mapOptional("AlwaysBreakTemplateDeclarations",
89 Style.AlwaysBreakTemplateDeclarations);
Alexander Kornienko58611712013-07-04 12:02:44 +000090 IO.mapOptional("AlwaysBreakBeforeMultilineStrings",
91 Style.AlwaysBreakBeforeMultilineStrings);
Alexander Kornienkod6538332013-05-07 15:32:14 +000092 IO.mapOptional("BinPackParameters", Style.BinPackParameters);
93 IO.mapOptional("ColumnLimit", Style.ColumnLimit);
94 IO.mapOptional("ConstructorInitializerAllOnOneLineOrOnePerLine",
95 Style.ConstructorInitializerAllOnOneLineOrOnePerLine);
96 IO.mapOptional("DerivePointerBinding", Style.DerivePointerBinding);
97 IO.mapOptional("IndentCaseLabels", Style.IndentCaseLabels);
98 IO.mapOptional("MaxEmptyLinesToKeep", Style.MaxEmptyLinesToKeep);
99 IO.mapOptional("ObjCSpaceBeforeProtocolList",
100 Style.ObjCSpaceBeforeProtocolList);
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000101 IO.mapOptional("PenaltyBreakComment", Style.PenaltyBreakComment);
102 IO.mapOptional("PenaltyBreakString", Style.PenaltyBreakString);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000103 IO.mapOptional("PenaltyExcessCharacter", Style.PenaltyExcessCharacter);
104 IO.mapOptional("PenaltyReturnTypeOnItsOwnLine",
105 Style.PenaltyReturnTypeOnItsOwnLine);
106 IO.mapOptional("PointerBindsToType", Style.PointerBindsToType);
107 IO.mapOptional("SpacesBeforeTrailingComments",
108 Style.SpacesBeforeTrailingComments);
Daniel Jasper5bd0b9e2013-05-23 18:05:18 +0000109 IO.mapOptional("SpacesInBracedLists", Style.SpacesInBracedLists);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000110 IO.mapOptional("Standard", Style.Standard);
Manuel Klimek13b97d82013-05-13 08:42:42 +0000111 IO.mapOptional("IndentWidth", Style.IndentWidth);
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000112 IO.mapOptional("UseTab", Style.UseTab);
Manuel Klimeka8eb9142013-05-13 12:51:40 +0000113 IO.mapOptional("BreakBeforeBraces", Style.BreakBeforeBraces);
Manuel Klimek836c2862013-06-21 17:25:42 +0000114 IO.mapOptional("IndentFunctionDeclarationAfterType",
115 Style.IndentFunctionDeclarationAfterType);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000116 }
117};
118}
119}
120
Daniel Jasperf7935112012-12-03 18:12:45 +0000121namespace clang {
122namespace format {
123
Daniel Jasperf7935112012-12-03 18:12:45 +0000124FormatStyle getLLVMStyle() {
125 FormatStyle LLVMStyle;
Daniel Jasperf7935112012-12-03 18:12:45 +0000126 LLVMStyle.AccessModifierOffset = -2;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000127 LLVMStyle.AlignEscapedNewlinesLeft = false;
Daniel Jasperf7db4332013-01-29 16:03:49 +0000128 LLVMStyle.AllowAllParametersOfDeclarationOnNextLine = true;
Daniel Jasper1b750ed2013-01-14 16:24:39 +0000129 LLVMStyle.AllowShortIfStatementsOnASingleLine = false;
Daniel Jasper3a685df2013-05-16 12:12:21 +0000130 LLVMStyle.AllowShortLoopsOnASingleLine = false;
Daniel Jasper61e6bbf2013-05-29 12:07:31 +0000131 LLVMStyle.AlwaysBreakTemplateDeclarations = false;
Alexander Kornienko58611712013-07-04 12:02:44 +0000132 LLVMStyle.AlwaysBreakBeforeMultilineStrings = false;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000133 LLVMStyle.BinPackParameters = true;
134 LLVMStyle.ColumnLimit = 80;
135 LLVMStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = false;
136 LLVMStyle.DerivePointerBinding = false;
137 LLVMStyle.IndentCaseLabels = false;
138 LLVMStyle.MaxEmptyLinesToKeep = 1;
Nico Webera6087752013-01-10 20:12:55 +0000139 LLVMStyle.ObjCSpaceBeforeProtocolList = true;
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000140 LLVMStyle.PenaltyBreakComment = 45;
141 LLVMStyle.PenaltyBreakString = 1000;
Daniel Jasper3a9370c2013-02-04 07:21:18 +0000142 LLVMStyle.PenaltyExcessCharacter = 1000000;
Daniel Jasper6728fc12013-04-11 14:29:13 +0000143 LLVMStyle.PenaltyReturnTypeOnItsOwnLine = 75;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000144 LLVMStyle.PointerBindsToType = false;
145 LLVMStyle.SpacesBeforeTrailingComments = 1;
Daniel Jaspere5777d22013-05-23 10:15:45 +0000146 LLVMStyle.SpacesInBracedLists = true;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000147 LLVMStyle.Standard = FormatStyle::LS_Cpp03;
Manuel Klimek13b97d82013-05-13 08:42:42 +0000148 LLVMStyle.IndentWidth = 2;
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000149 LLVMStyle.UseTab = false;
Manuel Klimeka8eb9142013-05-13 12:51:40 +0000150 LLVMStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
Manuel Klimek836c2862013-06-21 17:25:42 +0000151 LLVMStyle.IndentFunctionDeclarationAfterType = false;
Daniel Jasperf7935112012-12-03 18:12:45 +0000152 return LLVMStyle;
153}
154
155FormatStyle getGoogleStyle() {
156 FormatStyle GoogleStyle;
Daniel Jasperf7935112012-12-03 18:12:45 +0000157 GoogleStyle.AccessModifierOffset = -1;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000158 GoogleStyle.AlignEscapedNewlinesLeft = true;
Daniel Jasperf7db4332013-01-29 16:03:49 +0000159 GoogleStyle.AllowAllParametersOfDeclarationOnNextLine = true;
Daniel Jasper085a2ed2013-04-24 13:46:00 +0000160 GoogleStyle.AllowShortIfStatementsOnASingleLine = true;
Daniel Jasper5bd0b9e2013-05-23 18:05:18 +0000161 GoogleStyle.AllowShortLoopsOnASingleLine = true;
Daniel Jasper61e6bbf2013-05-29 12:07:31 +0000162 GoogleStyle.AlwaysBreakTemplateDeclarations = true;
Alexander Kornienko58611712013-07-04 12:02:44 +0000163 GoogleStyle.AlwaysBreakBeforeMultilineStrings = true;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000164 GoogleStyle.BinPackParameters = true;
165 GoogleStyle.ColumnLimit = 80;
166 GoogleStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
167 GoogleStyle.DerivePointerBinding = true;
168 GoogleStyle.IndentCaseLabels = true;
169 GoogleStyle.MaxEmptyLinesToKeep = 1;
Nico Webera6087752013-01-10 20:12:55 +0000170 GoogleStyle.ObjCSpaceBeforeProtocolList = false;
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000171 GoogleStyle.PenaltyBreakComment = 45;
172 GoogleStyle.PenaltyBreakString = 1000;
Daniel Jasper3a9370c2013-02-04 07:21:18 +0000173 GoogleStyle.PenaltyExcessCharacter = 1000000;
Daniel Jasper6728fc12013-04-11 14:29:13 +0000174 GoogleStyle.PenaltyReturnTypeOnItsOwnLine = 200;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000175 GoogleStyle.PointerBindsToType = true;
176 GoogleStyle.SpacesBeforeTrailingComments = 2;
Daniel Jaspere5777d22013-05-23 10:15:45 +0000177 GoogleStyle.SpacesInBracedLists = false;
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000178 GoogleStyle.Standard = FormatStyle::LS_Auto;
Manuel Klimek13b97d82013-05-13 08:42:42 +0000179 GoogleStyle.IndentWidth = 2;
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000180 GoogleStyle.UseTab = false;
Manuel Klimeka8eb9142013-05-13 12:51:40 +0000181 GoogleStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
Manuel Klimek836c2862013-06-21 17:25:42 +0000182 GoogleStyle.IndentFunctionDeclarationAfterType = true;
Daniel Jasperf7935112012-12-03 18:12:45 +0000183 return GoogleStyle;
184}
185
Daniel Jasper1b750ed2013-01-14 16:24:39 +0000186FormatStyle getChromiumStyle() {
187 FormatStyle ChromiumStyle = getGoogleStyle();
Daniel Jasperf7db4332013-01-29 16:03:49 +0000188 ChromiumStyle.AllowAllParametersOfDeclarationOnNextLine = false;
Daniel Jasper085a2ed2013-04-24 13:46:00 +0000189 ChromiumStyle.AllowShortIfStatementsOnASingleLine = false;
Daniel Jasper3a685df2013-05-16 12:12:21 +0000190 ChromiumStyle.AllowShortLoopsOnASingleLine = false;
Daniel Jasper2cf17bf2013-02-27 09:47:53 +0000191 ChromiumStyle.BinPackParameters = false;
Daniel Jasper7fce3ab2013-02-06 14:22:40 +0000192 ChromiumStyle.Standard = FormatStyle::LS_Cpp03;
193 ChromiumStyle.DerivePointerBinding = false;
Daniel Jasper1b750ed2013-01-14 16:24:39 +0000194 return ChromiumStyle;
195}
196
Alexander Kornienkoc8602662013-05-06 14:11:27 +0000197FormatStyle getMozillaStyle() {
198 FormatStyle MozillaStyle = getLLVMStyle();
199 MozillaStyle.AllowAllParametersOfDeclarationOnNextLine = false;
200 MozillaStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
201 MozillaStyle.DerivePointerBinding = true;
202 MozillaStyle.IndentCaseLabels = true;
203 MozillaStyle.ObjCSpaceBeforeProtocolList = false;
204 MozillaStyle.PenaltyReturnTypeOnItsOwnLine = 200;
205 MozillaStyle.PointerBindsToType = true;
206 return MozillaStyle;
207}
208
Alexander Kornienko006b5c82013-05-19 00:53:30 +0000209bool getPredefinedStyle(StringRef Name, FormatStyle *Style) {
Alexander Kornienkod6538332013-05-07 15:32:14 +0000210 if (Name.equals_lower("llvm"))
Alexander Kornienko006b5c82013-05-19 00:53:30 +0000211 *Style = getLLVMStyle();
212 else if (Name.equals_lower("chromium"))
213 *Style = getChromiumStyle();
214 else if (Name.equals_lower("mozilla"))
215 *Style = getMozillaStyle();
216 else if (Name.equals_lower("google"))
217 *Style = getGoogleStyle();
218 else
219 return false;
Alexander Kornienkod6538332013-05-07 15:32:14 +0000220
Alexander Kornienko006b5c82013-05-19 00:53:30 +0000221 return true;
Alexander Kornienkod6538332013-05-07 15:32:14 +0000222}
223
224llvm::error_code parseConfiguration(StringRef Text, FormatStyle *Style) {
Alexander Kornienko06e00332013-05-20 15:18:01 +0000225 if (Text.trim().empty())
226 return llvm::make_error_code(llvm::errc::invalid_argument);
Alexander Kornienkod6538332013-05-07 15:32:14 +0000227 llvm::yaml::Input Input(Text);
228 Input >> *Style;
229 return Input.error();
230}
231
232std::string configurationAsText(const FormatStyle &Style) {
233 std::string Text;
234 llvm::raw_string_ostream Stream(Text);
235 llvm::yaml::Output Output(Stream);
236 // We use the same mapping method for input and output, so we need a non-const
237 // reference here.
238 FormatStyle NonConstStyle = Style;
239 Output << NonConstStyle;
Alexander Kornienko9a38ec22013-05-13 12:56:35 +0000240 return Stream.str();
Alexander Kornienkod6538332013-05-07 15:32:14 +0000241}
242
Daniel Jasperacc33662013-02-08 08:22:00 +0000243// Returns the length of everything up to the first possible line break after
244// the ), ], } or > matching \c Tok.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000245static unsigned getLengthToMatchingParen(const FormatToken &Tok) {
Daniel Jasperacc33662013-02-08 08:22:00 +0000246 if (Tok.MatchingParen == NULL)
247 return 0;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000248 FormatToken *End = Tok.MatchingParen;
249 while (End->Next && !End->Next->CanBreakBefore) {
250 End = End->Next;
Daniel Jasperacc33662013-02-08 08:22:00 +0000251 }
252 return End->TotalLength - Tok.TotalLength + 1;
253}
254
Craig Topperaf35e852013-06-30 22:29:28 +0000255namespace {
256
Daniel Jasperf7935112012-12-03 18:12:45 +0000257class UnwrappedLineFormatter {
258public:
Manuel Klimekb2c6dbe2013-01-10 19:17:33 +0000259 UnwrappedLineFormatter(const FormatStyle &Style, SourceManager &SourceMgr,
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +0000260 const AnnotatedLine &Line, unsigned FirstIndent,
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000261 const FormatToken *RootToken,
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000262 WhitespaceManager &Whitespaces,
263 encoding::Encoding Encoding)
Daniel Jasper2af6bbe2012-12-18 21:05:13 +0000264 : Style(Style), SourceMgr(SourceMgr), Line(Line),
Daniel Jasperaa701fa2013-01-18 08:44:07 +0000265 FirstIndent(FirstIndent), RootToken(RootToken),
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000266 Whitespaces(Whitespaces), Count(0), Encoding(Encoding) {}
Daniel Jasperf7935112012-12-03 18:12:45 +0000267
Manuel Klimek1abf7892013-01-04 23:34:14 +0000268 /// \brief Formats an \c UnwrappedLine.
Manuel Klimek4fe43002013-05-22 12:51:29 +0000269 void format(const AnnotatedLine *NextLine) {
Daniel Jaspere9de2602012-12-06 09:56:08 +0000270 // Initialize state dependent on indent.
Daniel Jasper337816e2013-01-11 10:22:12 +0000271 LineState State;
Manuel Klimek0b689fd2013-01-10 18:45:26 +0000272 State.Column = FirstIndent;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000273 State.NextToken = RootToken;
Daniel Jasper97b89482013-03-13 07:49:51 +0000274 State.Stack.push_back(
Nico Weber9096fc02013-06-26 00:30:14 +0000275 ParenState(FirstIndent, FirstIndent, /*AvoidBinPacking=*/false,
276 /*NoLineBreak=*/false));
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000277 State.LineContainsContinuedForLoopSection = false;
Daniel Jasper400adc62013-02-08 15:28:42 +0000278 State.ParenLevel = 0;
Manuel Klimek02f640a2013-02-20 15:25:48 +0000279 State.StartOfStringLiteral = 0;
Daniel Jasper40c36c52013-02-18 11:05:07 +0000280 State.StartOfLineLevel = State.ParenLevel;
Daniel Jasper80503952013-06-03 09:54:46 +0000281 State.LowestCallLevel = State.ParenLevel;
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000282 State.IgnoreStackForComparison = false;
Daniel Jaspere9de2602012-12-06 09:56:08 +0000283
284 // The first token has already been indented and thus consumed.
Nico Weber9096fc02013-06-26 00:30:14 +0000285 moveStateToNextToken(State, /*DryRun=*/false);
Daniel Jasperf7935112012-12-03 18:12:45 +0000286
Daniel Jasper4b866272013-02-01 11:00:45 +0000287 // If everything fits on a single line, just put it there.
Daniel Jasperc22f5b42013-02-28 11:05:57 +0000288 unsigned ColumnLimit = Style.ColumnLimit;
289 if (NextLine && NextLine->InPPDirective &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000290 !NextLine->First->HasUnescapedNewline)
Daniel Jasperc22f5b42013-02-28 11:05:57 +0000291 ColumnLimit = getColumnLimit();
292 if (Line.Last->TotalLength <= ColumnLimit - FirstIndent) {
Daniel Jasper4b866272013-02-01 11:00:45 +0000293 while (State.NextToken != NULL) {
Daniel Jasper2af6bbe2012-12-18 21:05:13 +0000294 addTokenToState(false, false, State);
Daniel Jasper2af6bbe2012-12-18 21:05:13 +0000295 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000296 }
Daniel Jasper4b866272013-02-01 11:00:45 +0000297
Daniel Jasperacc33662013-02-08 08:22:00 +0000298 // If the ObjC method declaration does not fit on a line, we should format
299 // it with one arg per line.
300 if (Line.Type == LT_ObjCMethodDecl)
301 State.Stack.back().BreakBeforeParameter = true;
302
Daniel Jasper4b866272013-02-01 11:00:45 +0000303 // Find best solution in solution space.
Manuel Klimek4fe43002013-05-22 12:51:29 +0000304 analyzeSolutionSpace(State);
Daniel Jasperf7935112012-12-03 18:12:45 +0000305 }
306
307private:
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000308 void DebugTokenState(const FormatToken &FormatTok) {
309 const Token &Tok = FormatTok.Tok;
Alexander Kornienko49149672013-05-10 11:56:10 +0000310 llvm::dbgs() << StringRef(SourceMgr.getCharacterData(Tok.getLocation()),
Daniel Jasperbbc84152013-01-29 11:27:30 +0000311 Tok.getLength());
Alexander Kornienko49149672013-05-10 11:56:10 +0000312 llvm::dbgs();
Manuel Klimek24998102013-01-16 14:55:28 +0000313 }
314
Daniel Jasper337816e2013-01-11 10:22:12 +0000315 struct ParenState {
Daniel Jasperb9ebd5d2013-02-05 09:41:21 +0000316 ParenState(unsigned Indent, unsigned LastSpace, bool AvoidBinPacking,
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000317 bool NoLineBreak)
Daniel Jasper400adc62013-02-08 15:28:42 +0000318 : Indent(Indent), LastSpace(LastSpace), FirstLessLess(0),
319 BreakBeforeClosingBrace(false), QuestionColumn(0),
Daniel Jasperacc33662013-02-08 08:22:00 +0000320 AvoidBinPacking(AvoidBinPacking), BreakBeforeParameter(false),
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000321 NoLineBreak(NoLineBreak), ColonPos(0), StartOfFunctionCall(0),
322 NestedNameSpecifierContinuation(0), CallContinuation(0),
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000323 VariablePos(0), ForFakeParenthesis(false) {}
Daniel Jasper6d822722012-12-24 16:43:00 +0000324
Daniel Jasperf7935112012-12-03 18:12:45 +0000325 /// \brief The position to which a specific parenthesis level needs to be
326 /// indented.
Daniel Jasper337816e2013-01-11 10:22:12 +0000327 unsigned Indent;
Daniel Jasperf7935112012-12-03 18:12:45 +0000328
Daniel Jaspere9de2602012-12-06 09:56:08 +0000329 /// \brief The position of the last space on each level.
330 ///
331 /// Used e.g. to break like:
332 /// functionCall(Parameter, otherCall(
333 /// OtherParameter));
Daniel Jasper337816e2013-01-11 10:22:12 +0000334 unsigned LastSpace;
Daniel Jasperf7935112012-12-03 18:12:45 +0000335
Daniel Jaspere9de2602012-12-06 09:56:08 +0000336 /// \brief The position the first "<<" operator encountered on each level.
337 ///
338 /// Used to align "<<" operators. 0 if no such operator has been encountered
339 /// on a level.
Daniel Jasper337816e2013-01-11 10:22:12 +0000340 unsigned FirstLessLess;
Daniel Jaspere9de2602012-12-06 09:56:08 +0000341
Manuel Klimek0ddd57a2013-01-10 15:58:26 +0000342 /// \brief Whether a newline needs to be inserted before the block's closing
343 /// brace.
344 ///
345 /// We only want to insert a newline before the closing brace if there also
346 /// was a newline after the beginning left brace.
Daniel Jasper337816e2013-01-11 10:22:12 +0000347 bool BreakBeforeClosingBrace;
348
Daniel Jasperca6623b2013-01-28 12:45:14 +0000349 /// \brief The column of a \c ? in a conditional expression;
350 unsigned QuestionColumn;
351
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000352 /// \brief Avoid bin packing, i.e. multiple parameters/elements on multiple
353 /// lines, in this context.
354 bool AvoidBinPacking;
355
356 /// \brief Break after the next comma (or all the commas in this context if
357 /// \c AvoidBinPacking is \c true).
Daniel Jasperacc33662013-02-08 08:22:00 +0000358 bool BreakBeforeParameter;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000359
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000360 /// \brief Line breaking in this context would break a formatting rule.
361 bool NoLineBreak;
Daniel Jasper2408a8c2013-01-11 11:37:55 +0000362
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000363 /// \brief The position of the colon in an ObjC method declaration/call.
364 unsigned ColonPos;
Daniel Jasperdc7d5812013-02-20 12:56:39 +0000365
Daniel Jasperf9a84b52013-03-01 16:48:32 +0000366 /// \brief The start of the most recent function in a builder-type call.
367 unsigned StartOfFunctionCall;
368
Daniel Jasperc238c872013-04-02 14:33:13 +0000369 /// \brief If a nested name specifier was broken over multiple lines, this
370 /// contains the start column of the second line. Otherwise 0.
371 unsigned NestedNameSpecifierContinuation;
372
373 /// \brief If a call expression was broken over multiple lines, this
374 /// contains the start column of the second line. Otherwise 0.
375 unsigned CallContinuation;
376
Daniel Jaspera628c982013-04-03 13:36:17 +0000377 /// \brief The column of the first variable name in a variable declaration.
378 ///
379 /// Used to align further variables if necessary.
380 unsigned VariablePos;
381
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000382 /// \brief \c true if this \c ParenState was created for a fake parenthesis.
383 ///
384 /// Does not need to be considered for memoization / the comparison function
385 /// as otherwise identical states will have the same fake/non-fake
386 /// \c ParenStates.
387 bool ForFakeParenthesis;
388
Daniel Jasper337816e2013-01-11 10:22:12 +0000389 bool operator<(const ParenState &Other) const {
390 if (Indent != Other.Indent)
Daniel Jasperfd8c4b12013-01-11 14:23:32 +0000391 return Indent < Other.Indent;
Daniel Jasper337816e2013-01-11 10:22:12 +0000392 if (LastSpace != Other.LastSpace)
393 return LastSpace < Other.LastSpace;
394 if (FirstLessLess != Other.FirstLessLess)
395 return FirstLessLess < Other.FirstLessLess;
Daniel Jasper2408a8c2013-01-11 11:37:55 +0000396 if (BreakBeforeClosingBrace != Other.BreakBeforeClosingBrace)
397 return BreakBeforeClosingBrace;
Daniel Jasperca6623b2013-01-28 12:45:14 +0000398 if (QuestionColumn != Other.QuestionColumn)
399 return QuestionColumn < Other.QuestionColumn;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000400 if (AvoidBinPacking != Other.AvoidBinPacking)
401 return AvoidBinPacking;
Daniel Jasperacc33662013-02-08 08:22:00 +0000402 if (BreakBeforeParameter != Other.BreakBeforeParameter)
403 return BreakBeforeParameter;
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000404 if (NoLineBreak != Other.NoLineBreak)
405 return NoLineBreak;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000406 if (ColonPos != Other.ColonPos)
407 return ColonPos < Other.ColonPos;
Daniel Jasperf9a84b52013-03-01 16:48:32 +0000408 if (StartOfFunctionCall != Other.StartOfFunctionCall)
409 return StartOfFunctionCall < Other.StartOfFunctionCall;
Daniel Jasperc238c872013-04-02 14:33:13 +0000410 if (CallContinuation != Other.CallContinuation)
411 return CallContinuation < Other.CallContinuation;
Daniel Jaspera628c982013-04-03 13:36:17 +0000412 if (VariablePos != Other.VariablePos)
413 return VariablePos < Other.VariablePos;
Daniel Jasper7b7877a2013-01-12 07:36:22 +0000414 return false;
Daniel Jasper337816e2013-01-11 10:22:12 +0000415 }
416 };
417
418 /// \brief The current state when indenting a unwrapped line.
419 ///
420 /// As the indenting tries different combinations this is copied by value.
421 struct LineState {
422 /// \brief The number of used columns in the current line.
423 unsigned Column;
424
425 /// \brief The token that needs to be next formatted.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000426 const FormatToken *NextToken;
Daniel Jasper337816e2013-01-11 10:22:12 +0000427
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000428 /// \brief \c true if this line contains a continued for-loop section.
429 bool LineContainsContinuedForLoopSection;
430
Daniel Jasper400adc62013-02-08 15:28:42 +0000431 /// \brief The level of nesting inside (), [], <> and {}.
432 unsigned ParenLevel;
433
Daniel Jasper40c36c52013-02-18 11:05:07 +0000434 /// \brief The \c ParenLevel at the start of this line.
435 unsigned StartOfLineLevel;
436
Daniel Jasper80503952013-06-03 09:54:46 +0000437 /// \brief The lowest \c ParenLevel of "." or "->" on the current line.
438 unsigned LowestCallLevel;
Daniel Jasper32a796b2013-05-27 11:50:16 +0000439
Manuel Klimek02f640a2013-02-20 15:25:48 +0000440 /// \brief The start column of the string literal, if we're in a string
441 /// literal sequence, 0 otherwise.
442 unsigned StartOfStringLiteral;
443
Daniel Jasper337816e2013-01-11 10:22:12 +0000444 /// \brief A stack keeping track of properties applying to parenthesis
445 /// levels.
446 std::vector<ParenState> Stack;
447
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000448 /// \brief Ignore the stack of \c ParenStates for state comparison.
449 ///
450 /// In long and deeply nested unwrapped lines, the current algorithm can
451 /// be insufficient for finding the best formatting with a reasonable amount
452 /// of time and memory. Setting this flag will effectively lead to the
453 /// algorithm not analyzing some combinations. However, these combinations
454 /// rarely contain the optimal solution: In short, accepting a higher
455 /// penalty early would need to lead to different values in the \c
456 /// ParenState stack (in an otherwise identical state) and these different
457 /// values would need to lead to a significant amount of avoided penalty
458 /// later.
459 ///
460 /// FIXME: Come up with a better algorithm instead.
461 bool IgnoreStackForComparison;
462
Daniel Jasper337816e2013-01-11 10:22:12 +0000463 /// \brief Comparison operator to be able to used \c LineState in \c map.
464 bool operator<(const LineState &Other) const {
Daniel Jasper58f427e2013-02-19 09:28:55 +0000465 if (NextToken != Other.NextToken)
466 return NextToken < Other.NextToken;
467 if (Column != Other.Column)
468 return Column < Other.Column;
Daniel Jasper58f427e2013-02-19 09:28:55 +0000469 if (LineContainsContinuedForLoopSection !=
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000470 Other.LineContainsContinuedForLoopSection)
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000471 return LineContainsContinuedForLoopSection;
Daniel Jasper58f427e2013-02-19 09:28:55 +0000472 if (ParenLevel != Other.ParenLevel)
473 return ParenLevel < Other.ParenLevel;
474 if (StartOfLineLevel != Other.StartOfLineLevel)
475 return StartOfLineLevel < Other.StartOfLineLevel;
Daniel Jasper80503952013-06-03 09:54:46 +0000476 if (LowestCallLevel != Other.LowestCallLevel)
477 return LowestCallLevel < Other.LowestCallLevel;
Manuel Klimek02f640a2013-02-20 15:25:48 +0000478 if (StartOfStringLiteral != Other.StartOfStringLiteral)
479 return StartOfStringLiteral < Other.StartOfStringLiteral;
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000480 if (IgnoreStackForComparison || Other.IgnoreStackForComparison)
481 return false;
Daniel Jasper58f427e2013-02-19 09:28:55 +0000482 return Stack < Other.Stack;
Daniel Jasperf7935112012-12-03 18:12:45 +0000483 }
484 };
485
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000486 /// \brief Appends the next token to \p State and updates information
487 /// necessary for indentation.
488 ///
Nico Weberf579ab32013-06-26 02:42:46 +0000489 /// Puts the token on the current line if \p Newline is \c false and adds a
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000490 /// line break and necessary indentation otherwise.
491 ///
492 /// If \p DryRun is \c false, also creates and stores the required
493 /// \c Replacement.
Manuel Klimek1998ea22013-02-20 10:15:13 +0000494 unsigned addTokenToState(bool Newline, bool DryRun, LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000495 const FormatToken &Current = *State.NextToken;
496 const FormatToken &Previous = *State.NextToken->Previous;
Daniel Jasperf7935112012-12-03 18:12:45 +0000497
Daniel Jasper291f9362013-03-20 15:58:10 +0000498 if (State.Stack.size() == 0 || Current.Type == TT_ImplicitStringLiteral) {
Manuel Klimek5c24cca2013-05-23 10:56:37 +0000499 // FIXME: Is this correct?
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000500 int WhitespaceLength = SourceMgr.getSpellingColumnNumber(
501 State.NextToken->WhitespaceRange.getEnd()) -
502 SourceMgr.getSpellingColumnNumber(
503 State.NextToken->WhitespaceRange.getBegin());
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000504 State.Column += WhitespaceLength + State.NextToken->CodePointCount;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000505 State.NextToken = State.NextToken->Next;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000506 return 0;
Daniel Jasper4b866272013-02-01 11:00:45 +0000507 }
508
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000509 // If we are continuing an expression, we want to indent an extra 4 spaces.
510 unsigned ContinuationIndent =
Daniel Jasperc238c872013-04-02 14:33:13 +0000511 std::max(State.Stack.back().LastSpace, State.Stack.back().Indent) + 4;
Daniel Jasperf7935112012-12-03 18:12:45 +0000512 if (Newline) {
Manuel Klimek8e07a1b2013-01-10 11:52:21 +0000513 if (Current.is(tok::r_brace)) {
Manuel Klimek13b97d82013-05-13 08:42:42 +0000514 State.Column = Line.Level * Style.IndentWidth;
Daniel Jasper399d24b2013-01-09 07:06:56 +0000515 } else if (Current.is(tok::string_literal) &&
Manuel Klimek02f640a2013-02-20 15:25:48 +0000516 State.StartOfStringLiteral != 0) {
517 State.Column = State.StartOfStringLiteral;
Daniel Jasper2ec3ffb82013-02-18 11:59:17 +0000518 State.Stack.back().BreakBeforeParameter = true;
Daniel Jasper399d24b2013-01-09 07:06:56 +0000519 } else if (Current.is(tok::lessless) &&
Daniel Jasper400adc62013-02-08 15:28:42 +0000520 State.Stack.back().FirstLessLess != 0) {
521 State.Column = State.Stack.back().FirstLessLess;
Daniel Jasperbca4bbe2013-05-28 11:30:49 +0000522 } else if (Current.isOneOf(tok::period, tok::arrow) &&
523 Current.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000524 if (State.Stack.back().CallContinuation == 0) {
525 State.Column = ContinuationIndent;
Daniel Jasperc238c872013-04-02 14:33:13 +0000526 State.Stack.back().CallContinuation = State.Column;
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000527 } else {
528 State.Column = State.Stack.back().CallContinuation;
529 }
Daniel Jasperca6623b2013-01-28 12:45:14 +0000530 } else if (Current.Type == TT_ConditionalExpr) {
531 State.Column = State.Stack.back().QuestionColumn;
Daniel Jaspera628c982013-04-03 13:36:17 +0000532 } else if (Previous.is(tok::comma) &&
533 State.Stack.back().VariablePos != 0) {
534 State.Column = State.Stack.back().VariablePos;
Daniel Jasper26d1b1d2013-02-24 18:54:32 +0000535 } else if (Previous.ClosesTemplateDeclaration ||
Daniel Jasper8e357692013-05-06 08:27:33 +0000536 (Current.Type == TT_StartOfName && State.ParenLevel == 0 &&
Manuel Klimek836c2862013-06-21 17:25:42 +0000537 (!Style.IndentFunctionDeclarationAfterType ||
538 Line.StartsDefinition))) {
Daniel Jasperc238c872013-04-02 14:33:13 +0000539 State.Column = State.Stack.back().Indent;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000540 } else if (Current.Type == TT_ObjCSelectorName) {
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000541 if (State.Stack.back().ColonPos > Current.CodePointCount) {
542 State.Column = State.Stack.back().ColonPos - Current.CodePointCount;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000543 } else {
544 State.Column = State.Stack.back().Indent;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000545 State.Stack.back().ColonPos = State.Column + Current.CodePointCount;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000546 }
Daniel Jasper0f0234e2013-05-08 10:00:18 +0000547 } else if (Current.Type == TT_StartOfName ||
548 Previous.isOneOf(tok::coloncolon, tok::equal) ||
Daniel Jasperc238c872013-04-02 14:33:13 +0000549 Previous.Type == TT_ObjCMethodExpr) {
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000550 State.Column = ContinuationIndent;
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000551 } else {
Daniel Jasper400adc62013-02-08 15:28:42 +0000552 State.Column = State.Stack.back().Indent;
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000553 // Ensure that we fall back to indenting 4 spaces instead of just
554 // flushing continuations left.
Daniel Jasperc238c872013-04-02 14:33:13 +0000555 if (State.Column == FirstIndent)
556 State.Column += 4;
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000557 }
558
Daniel Jasper54a86022013-02-15 11:07:25 +0000559 if (Current.is(tok::question))
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000560 State.Stack.back().BreakBeforeParameter = true;
Daniel Jasperd69fc772013-05-08 14:12:04 +0000561 if ((Previous.isOneOf(tok::comma, tok::semi) &&
562 !State.Stack.back().AvoidBinPacking) ||
563 Previous.Type == TT_BinaryOperator)
Daniel Jasperacc33662013-02-08 08:22:00 +0000564 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasperc6fbc212013-05-15 09:35:08 +0000565 if (Previous.Type == TT_TemplateCloser && State.ParenLevel == 0)
566 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000567
Manuel Klimekb69e3c62013-01-02 18:33:23 +0000568 if (!DryRun) {
Daniel Jasperfb5e2412013-02-26 13:10:34 +0000569 unsigned NewLines = 1;
Alexander Kornienkof370ad92013-06-12 19:04:12 +0000570 if (Current.is(tok::comment))
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000571 NewLines = std::max(
572 NewLines,
573 std::min(Current.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1));
Manuel Klimek4fe43002013-05-22 12:51:29 +0000574 Whitespaces.replaceWhitespace(Current, NewLines, State.Column,
575 State.Column, Line.InPPDirective);
Manuel Klimekb69e3c62013-01-02 18:33:23 +0000576 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000577
Daniel Jasper400adc62013-02-08 15:28:42 +0000578 State.Stack.back().LastSpace = State.Column;
Daniel Jasperbca4bbe2013-05-28 11:30:49 +0000579 if (Current.isOneOf(tok::arrow, tok::period) &&
580 Current.Type != TT_DesignatedInitializerPeriod)
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000581 State.Stack.back().LastSpace += Current.CodePointCount;
Daniel Jasper40c36c52013-02-18 11:05:07 +0000582 State.StartOfLineLevel = State.ParenLevel;
Daniel Jasper80503952013-06-03 09:54:46 +0000583 State.LowestCallLevel = State.ParenLevel;
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000584
585 // Any break on this level means that the parent level has been broken
586 // and we need to avoid bin packing there.
587 for (unsigned i = 0, e = State.Stack.size() - 1; i != e; ++i) {
588 State.Stack[i].BreakBeforeParameter = true;
589 }
Alexander Kornienko1efe0a02013-07-04 14:47:51 +0000590 const FormatToken *TokenBefore = Current.getPreviousNonComment();
Daniel Jasper1b8e76f2013-04-15 22:36:37 +0000591 if (TokenBefore && !TokenBefore->isOneOf(tok::comma, tok::semi) &&
Daniel Jasperc6fbc212013-05-15 09:35:08 +0000592 TokenBefore->Type != TT_TemplateCloser &&
Daniel Jasperd69fc772013-05-08 14:12:04 +0000593 TokenBefore->Type != TT_BinaryOperator && !TokenBefore->opensScope())
Daniel Jasper2cf17bf2013-02-27 09:47:53 +0000594 State.Stack.back().BreakBeforeParameter = true;
595
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000596 // If we break after {, we should also break before the corresponding }.
597 if (Previous.is(tok::l_brace))
598 State.Stack.back().BreakBeforeClosingBrace = true;
599
600 if (State.Stack.back().AvoidBinPacking) {
601 // If we are breaking after '(', '{', '<', this is not bin packing
602 // unless AllowAllParametersOfDeclarationOnNextLine is false.
Daniel Jasper571f1af2013-05-14 20:39:56 +0000603 if (!(Previous.isOneOf(tok::l_paren, tok::l_brace) ||
604 Previous.Type == TT_BinaryOperator) ||
Daniel Jaspercd8599e2013-02-23 21:01:55 +0000605 (!Style.AllowAllParametersOfDeclarationOnNextLine &&
606 Line.MustBeDeclaration))
607 State.Stack.back().BreakBeforeParameter = true;
608 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000609 } else {
Daniel Jasper62e68172013-02-25 15:59:54 +0000610 if (Current.is(tok::equal) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000611 (RootToken->is(tok::kw_for) || State.ParenLevel == 0) &&
Daniel Jasper31c96b92013-04-05 09:38:50 +0000612 State.Stack.back().VariablePos == 0) {
613 State.Stack.back().VariablePos = State.Column;
614 // Move over * and & if they are bound to the variable name.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000615 const FormatToken *Tok = &Previous;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000616 while (Tok && State.Stack.back().VariablePos >= Tok->CodePointCount) {
617 State.Stack.back().VariablePos -= Tok->CodePointCount;
Daniel Jasper31c96b92013-04-05 09:38:50 +0000618 if (Tok->SpacesRequiredBefore != 0)
619 break;
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000620 Tok = Tok->Previous;
Daniel Jasper31c96b92013-04-05 09:38:50 +0000621 }
Daniel Jaspera628c982013-04-03 13:36:17 +0000622 if (Previous.PartOfMultiVariableDeclStmt)
623 State.Stack.back().LastSpace = State.Stack.back().VariablePos;
624 }
Daniel Jasperfbde69e2012-12-21 14:37:20 +0000625
Daniel Jaspereef30492013-02-11 12:36:37 +0000626 unsigned Spaces = State.NextToken->SpacesRequiredBefore;
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000627
Daniel Jasperf7935112012-12-03 18:12:45 +0000628 if (!DryRun)
Manuel Klimek4fe43002013-05-22 12:51:29 +0000629 Whitespaces.replaceWhitespace(Current, 0, Spaces,
630 State.Column + Spaces);
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000631
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000632 if (Current.Type == TT_ObjCSelectorName &&
633 State.Stack.back().ColonPos == 0) {
634 if (State.Stack.back().Indent + Current.LongestObjCSelectorName >
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000635 State.Column + Spaces + Current.CodePointCount)
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000636 State.Stack.back().ColonPos =
637 State.Stack.back().Indent + Current.LongestObjCSelectorName;
638 else
639 State.Stack.back().ColonPos =
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000640 State.Column + Spaces + Current.CodePointCount;
Daniel Jasper1ac3e052013-02-05 10:07:47 +0000641 }
642
Daniel Jasperc04baae2013-04-10 09:49:49 +0000643 if (Previous.opensScope() && Previous.Type != TT_ObjCMethodExpr &&
Daniel Jasper6bee6822013-04-08 20:33:42 +0000644 Current.Type != TT_LineComment)
Daniel Jasper400adc62013-02-08 15:28:42 +0000645 State.Stack.back().Indent = State.Column + Spaces;
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000646 if (Previous.is(tok::comma) && !Current.isTrailingComment() &&
647 State.Stack.back().AvoidBinPacking)
648 State.Stack.back().NoLineBreak = true;
Daniel Jasper9278eb92013-01-16 14:59:02 +0000649
Daniel Jaspere9de2602012-12-06 09:56:08 +0000650 State.Column += Spaces;
Daniel Jaspera628c982013-04-03 13:36:17 +0000651 if (Current.is(tok::l_paren) && Previous.isOneOf(tok::kw_if, tok::kw_for))
Daniel Jasper39e27382013-01-23 20:41:06 +0000652 // Treat the condition inside an if as if it was a second function
653 // parameter, i.e. let nested calls have an indent of 4.
654 State.Stack.back().LastSpace = State.Column + 1; // 1 is length of "(".
Daniel Jasperd1ae3582013-03-20 12:37:50 +0000655 else if (Previous.is(tok::comma))
Daniel Jasper39e27382013-01-23 20:41:06 +0000656 State.Stack.back().LastSpace = State.Column;
Daniel Jasperca6623b2013-01-28 12:45:14 +0000657 else if ((Previous.Type == TT_BinaryOperator ||
Daniel Jasper65585ed2013-01-28 13:31:35 +0000658 Previous.Type == TT_ConditionalExpr ||
659 Previous.Type == TT_CtorInitializerColon) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000660 !(Previous.getPrecedence() == prec::Assignment &&
Daniel Jasper7b27a102013-05-27 12:45:09 +0000661 Current.FakeLParens.empty()))
662 // Always indent relative to the RHS of the expression unless this is a
663 // simple assignment without binary expression on the RHS.
Daniel Jasper20b09ef2013-01-28 09:35:24 +0000664 State.Stack.back().LastSpace = State.Column;
Daniel Jaspereead02b2013-02-14 08:42:54 +0000665 else if (Previous.Type == TT_InheritanceColon)
666 State.Stack.back().Indent = State.Column;
Daniel Jasperd69fc772013-05-08 14:12:04 +0000667 else if (Previous.opensScope() && !Current.FakeLParens.empty())
668 // If this function has multiple parameters or a binary expression
669 // parameter, indent nested calls from the start of the first parameter.
Daniel Jasper7b5773e92013-01-28 07:35:34 +0000670 State.Stack.back().LastSpace = State.Column;
Daniel Jasperf7935112012-12-03 18:12:45 +0000671 }
Daniel Jasper9278eb92013-01-16 14:59:02 +0000672
Manuel Klimek1998ea22013-02-20 10:15:13 +0000673 return moveStateToNextToken(State, DryRun);
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000674 }
Daniel Jasperf7935112012-12-03 18:12:45 +0000675
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000676 /// \brief Mark the next token as consumed in \p State and modify its stacks
677 /// accordingly.
Manuel Klimek1998ea22013-02-20 10:15:13 +0000678 unsigned moveStateToNextToken(LineState &State, bool DryRun) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000679 const FormatToken &Current = *State.NextToken;
Daniel Jasper337816e2013-01-11 10:22:12 +0000680 assert(State.Stack.size());
Daniel Jaspere9de2602012-12-06 09:56:08 +0000681
Daniel Jaspereead02b2013-02-14 08:42:54 +0000682 if (Current.Type == TT_InheritanceColon)
683 State.Stack.back().AvoidBinPacking = true;
Daniel Jasper337816e2013-01-11 10:22:12 +0000684 if (Current.is(tok::lessless) && State.Stack.back().FirstLessLess == 0)
685 State.Stack.back().FirstLessLess = State.Column;
Daniel Jasperca6623b2013-01-28 12:45:14 +0000686 if (Current.is(tok::question))
687 State.Stack.back().QuestionColumn = State.Column;
Daniel Jasper80503952013-06-03 09:54:46 +0000688 if (Current.isOneOf(tok::period, tok::arrow)) {
689 State.LowestCallLevel = std::min(State.LowestCallLevel, State.ParenLevel);
690 if (Line.Type == LT_BuilderTypeCall && State.ParenLevel == 0)
691 State.Stack.back().StartOfFunctionCall =
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000692 Current.LastInChainOfCalls ? 0
693 : State.Column + Current.CodePointCount;
Daniel Jasper80503952013-06-03 09:54:46 +0000694 }
Daniel Jasper37905f72013-02-21 15:00:29 +0000695 if (Current.Type == TT_CtorInitializerColon) {
Manuel Klimek13b97d82013-05-13 08:42:42 +0000696 // Indent 2 from the column, so:
697 // SomeClass::SomeClass()
698 // : First(...), ...
699 // Next(...)
700 // ^ line up here.
Daniel Jasper6bee6822013-04-08 20:33:42 +0000701 State.Stack.back().Indent = State.Column + 2;
Daniel Jasper37905f72013-02-21 15:00:29 +0000702 if (Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
703 State.Stack.back().AvoidBinPacking = true;
704 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000705 }
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000706
Daniel Jasper6bee6822013-04-08 20:33:42 +0000707 // If return returns a binary expression, align after it.
708 if (Current.is(tok::kw_return) && !Current.FakeLParens.empty())
709 State.Stack.back().LastSpace = State.Column + 7;
710
Daniel Jasper5188e6b2013-04-03 07:21:51 +0000711 // In ObjC method declaration we align on the ":" of parameters, but we need
712 // to ensure that we indent parameters on subsequent lines by at least 4.
Daniel Jasperc238c872013-04-02 14:33:13 +0000713 if (Current.Type == TT_ObjCMethodSpecifier)
714 State.Stack.back().Indent += 4;
Daniel Jaspere9de2602012-12-06 09:56:08 +0000715
Daniel Jasper400adc62013-02-08 15:28:42 +0000716 // Insert scopes created by fake parenthesis.
Alexander Kornienko1efe0a02013-07-04 14:47:51 +0000717 const FormatToken *Previous = Current.getPreviousNonComment();
Daniel Jasper6bee6822013-04-08 20:33:42 +0000718 // Don't add extra indentation for the first fake parenthesis after
719 // 'return', assignements or opening <({[. The indentation for these cases
720 // is special cased.
721 bool SkipFirstExtraIndent =
722 Current.is(tok::kw_return) ||
Daniel Jasperc04baae2013-04-10 09:49:49 +0000723 (Previous && (Previous->opensScope() ||
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000724 Previous->getPrecedence() == prec::Assignment));
Daniel Jasper6bee6822013-04-08 20:33:42 +0000725 for (SmallVector<prec::Level, 4>::const_reverse_iterator
726 I = Current.FakeLParens.rbegin(),
727 E = Current.FakeLParens.rend();
728 I != E; ++I) {
Daniel Jasper400adc62013-02-08 15:28:42 +0000729 ParenState NewParenState = State.Stack.back();
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000730 NewParenState.ForFakeParenthesis = true;
Daniel Jasper6bee6822013-04-08 20:33:42 +0000731 NewParenState.Indent =
732 std::max(std::max(State.Column, NewParenState.Indent),
733 State.Stack.back().LastSpace);
734
735 // Always indent conditional expressions. Never indent expression where
736 // the 'operator' is ',', ';' or an assignment (i.e. *I <=
737 // prec::Assignment) as those have different indentation rules. Indent
738 // other expression, unless the indentation needs to be skipped.
739 if (*I == prec::Conditional ||
740 (!SkipFirstExtraIndent && *I > prec::Assignment))
741 NewParenState.Indent += 4;
Daniel Jasperc04baae2013-04-10 09:49:49 +0000742 if (Previous && !Previous->opensScope())
Daniel Jasper6bee6822013-04-08 20:33:42 +0000743 NewParenState.BreakBeforeParameter = false;
Daniel Jasper400adc62013-02-08 15:28:42 +0000744 State.Stack.push_back(NewParenState);
Daniel Jasper6bee6822013-04-08 20:33:42 +0000745 SkipFirstExtraIndent = false;
Daniel Jasper400adc62013-02-08 15:28:42 +0000746 }
747
Daniel Jasper2eda23e2012-12-24 13:43:52 +0000748 // If we encounter an opening (, [, { or <, we add a level to our stacks to
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000749 // prepare for the following tokens.
Daniel Jasperc04baae2013-04-10 09:49:49 +0000750 if (Current.opensScope()) {
Daniel Jasper337816e2013-01-11 10:22:12 +0000751 unsigned NewIndent;
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000752 unsigned LastSpace = State.Stack.back().LastSpace;
Daniel Jasper8a8ce242013-01-31 14:59:26 +0000753 bool AvoidBinPacking;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000754 if (Current.is(tok::l_brace)) {
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000755 NewIndent = Style.IndentWidth + LastSpace;
Alexander Kornienko1efe0a02013-07-04 14:47:51 +0000756 const FormatToken *NextNoComment = Current.getNextNonComment();
Daniel Jasperbca4bbe2013-05-28 11:30:49 +0000757 AvoidBinPacking = NextNoComment &&
758 NextNoComment->Type == TT_DesignatedInitializerPeriod;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000759 } else {
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000760 NewIndent =
761 4 + std::max(LastSpace, State.Stack.back().StartOfFunctionCall);
Daniel Jaspercc960fa2013-04-22 07:59:53 +0000762 AvoidBinPacking = !Style.BinPackParameters;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000763 }
Daniel Jaspere3c0e012013-04-25 13:31:51 +0000764
Daniel Jaspercc3044c2013-05-13 09:19:24 +0000765 State.Stack.push_back(ParenState(NewIndent, LastSpace, AvoidBinPacking,
766 State.Stack.back().NoLineBreak));
Daniel Jasper400adc62013-02-08 15:28:42 +0000767 ++State.ParenLevel;
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000768 }
769
Daniel Jasperacc33662013-02-08 08:22:00 +0000770 // If this '[' opens an ObjC call, determine whether all parameters fit into
771 // one line and put one per line if they don't.
772 if (Current.is(tok::l_square) && Current.Type == TT_ObjCMethodExpr &&
773 Current.MatchingParen != NULL) {
774 if (getLengthToMatchingParen(Current) + State.Column > getColumnLimit())
775 State.Stack.back().BreakBeforeParameter = true;
776 }
777
Daniel Jasper2eda23e2012-12-24 13:43:52 +0000778 // If we encounter a closing ), ], } or >, we can remove a level from our
Daniel Jasper6021c4a2012-12-04 14:54:30 +0000779 // stacks.
Alexander Kornienko62b85b92013-03-13 14:41:29 +0000780 if (Current.isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000781 (Current.is(tok::r_brace) && State.NextToken != RootToken) ||
Daniel Jasper7c85fde2013-01-08 14:56:18 +0000782 State.NextToken->Type == TT_TemplateCloser) {
Daniel Jasper337816e2013-01-11 10:22:12 +0000783 State.Stack.pop_back();
Daniel Jasper400adc62013-02-08 15:28:42 +0000784 --State.ParenLevel;
785 }
786
787 // Remove scopes created by fake parenthesis.
788 for (unsigned i = 0, e = Current.FakeRParens; i != e; ++i) {
Daniel Jasper6daabe32013-04-04 19:31:00 +0000789 unsigned VariablePos = State.Stack.back().VariablePos;
Daniel Jasper400adc62013-02-08 15:28:42 +0000790 State.Stack.pop_back();
Daniel Jasper6daabe32013-04-04 19:31:00 +0000791 State.Stack.back().VariablePos = VariablePos;
Daniel Jasperf7935112012-12-03 18:12:45 +0000792 }
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000793
Daniel Jasper47a04442013-05-13 20:50:15 +0000794 if (Current.is(tok::string_literal) && State.StartOfStringLiteral == 0) {
Manuel Klimek02f640a2013-02-20 15:25:48 +0000795 State.StartOfStringLiteral = State.Column;
Daniel Jasper47a04442013-05-13 20:50:15 +0000796 } else if (!Current.isOneOf(tok::comment, tok::identifier, tok::hash,
797 tok::string_literal)) {
Daniel Jasper7dd22c51b2013-05-16 04:26:02 +0000798 State.StartOfStringLiteral = 0;
Manuel Klimek02f640a2013-02-20 15:25:48 +0000799 }
800
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000801 State.Column += Current.CodePointCount;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000802
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000803 State.NextToken = State.NextToken->Next;
Manuel Klimek73a2fdf2013-01-10 14:36:46 +0000804
Manuel Klimek1998ea22013-02-20 10:15:13 +0000805 return breakProtrudingToken(Current, State, DryRun);
806 }
807
808 /// \brief If the current token sticks out over the end of the line, break
809 /// it if possible.
Manuel Klimek5ecb5fd2013-05-14 09:04:24 +0000810 ///
811 /// \returns An extra penalty if a token was broken, otherwise 0.
812 ///
Alexander Kornienkoaa620e12013-07-01 13:42:42 +0000813 /// The returned penalty will cover the cost of the additional line breaks and
814 /// column limit violation in all lines except for the last one. The penalty
815 /// for the column limit violation in the last line (and in single line
816 /// tokens) is handled in \c addNextStateToQueue.
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000817 unsigned breakProtrudingToken(const FormatToken &Current, LineState &State,
Manuel Klimek4fe43002013-05-22 12:51:29 +0000818 bool DryRun) {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000819 llvm::OwningPtr<BreakableToken> Token;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000820 unsigned StartColumn = State.Column - Current.CodePointCount;
Manuel Klimek591ab5a2013-05-28 13:42:28 +0000821 unsigned OriginalStartColumn =
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000822 SourceMgr.getSpellingColumnNumber(Current.getStartOfNonWhitespace()) -
Manuel Klimek591ab5a2013-05-28 13:42:28 +0000823 1;
Manuel Klimek9043c742013-05-27 15:23:34 +0000824
Daniel Jasper8bb99e82013-05-16 12:59:13 +0000825 if (Current.is(tok::string_literal) &&
826 Current.Type != TT_ImplicitStringLiteral) {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000827 // Only break up default narrow strings.
Alexander Kornienkobe633902013-06-14 11:46:10 +0000828 if (!Current.TokenText.startswith("\""))
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000829 return 0;
830
Alexander Kornienkobe633902013-06-14 11:46:10 +0000831 Token.reset(new BreakableStringLiteral(Current, StartColumn,
832 Line.InPPDirective, Encoding));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000833 } else if (Current.Type == TT_BlockComment) {
Alexander Kornienkobe633902013-06-14 11:46:10 +0000834 Token.reset(new BreakableBlockComment(
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000835 Style, Current, StartColumn, OriginalStartColumn, !Current.Previous,
Alexander Kornienkobe633902013-06-14 11:46:10 +0000836 Line.InPPDirective, Encoding));
Daniel Jasper4a4be012013-05-06 10:24:51 +0000837 } else if (Current.Type == TT_LineComment &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +0000838 (Current.Previous == NULL ||
839 Current.Previous->Type != TT_ImplicitStringLiteral)) {
Alexander Kornienkobe633902013-06-14 11:46:10 +0000840 Token.reset(new BreakableLineComment(Current, StartColumn,
841 Line.InPPDirective, Encoding));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000842 } else {
Manuel Klimek4fe43002013-05-22 12:51:29 +0000843 return 0;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000844 }
Alexander Kornienkobe633902013-06-14 11:46:10 +0000845 if (Current.UnbreakableTailLength >= getColumnLimit())
Manuel Klimek5ecb5fd2013-05-14 09:04:24 +0000846 return 0;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000847
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000848 unsigned RemainingSpace = getColumnLimit() - Current.UnbreakableTailLength;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000849 bool BreakInserted = false;
850 unsigned Penalty = 0;
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000851 unsigned RemainingTokenColumns = 0;
Manuel Klimek9043c742013-05-27 15:23:34 +0000852 for (unsigned LineIndex = 0, EndIndex = Token->getLineCount();
853 LineIndex != EndIndex; ++LineIndex) {
Alexander Kornienkobe633902013-06-14 11:46:10 +0000854 if (!DryRun)
855 Token->replaceWhitespaceBefore(LineIndex, Whitespaces);
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000856 unsigned TailOffset = 0;
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000857 RemainingTokenColumns = Token->getLineLengthAfterSplit(
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000858 LineIndex, TailOffset, StringRef::npos);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000859 while (RemainingTokenColumns > RemainingSpace) {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000860 BreakableToken::Split Split =
Manuel Klimek4fe43002013-05-22 12:51:29 +0000861 Token->getSplit(LineIndex, TailOffset, getColumnLimit());
Alexander Kornienkoaa620e12013-07-01 13:42:42 +0000862 if (Split.first == StringRef::npos) {
863 // The last line's penalty is handled in addNextStateToQueue().
864 if (LineIndex < EndIndex - 1)
865 Penalty += Style.PenaltyExcessCharacter *
866 (RemainingTokenColumns - RemainingSpace);
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000867 break;
Alexander Kornienkoaa620e12013-07-01 13:42:42 +0000868 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000869 assert(Split.first != 0);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000870 unsigned NewRemainingTokenColumns = Token->getLineLengthAfterSplit(
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000871 LineIndex, TailOffset + Split.first + Split.second,
872 StringRef::npos);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000873 assert(NewRemainingTokenColumns < RemainingTokenColumns);
Alexander Kornienkobe633902013-06-14 11:46:10 +0000874 if (!DryRun)
875 Token->insertBreak(LineIndex, TailOffset, Split, Whitespaces);
Alexander Kornienkodd7ece52013-06-07 16:02:52 +0000876 Penalty += Current.is(tok::string_literal) ? Style.PenaltyBreakString
877 : Style.PenaltyBreakComment;
878 unsigned ColumnsUsed =
879 Token->getLineLengthAfterSplit(LineIndex, TailOffset, Split.first);
880 if (ColumnsUsed > getColumnLimit()) {
881 Penalty +=
882 Style.PenaltyExcessCharacter * (ColumnsUsed - getColumnLimit());
883 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000884 TailOffset += Split.first + Split.second;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +0000885 RemainingTokenColumns = NewRemainingTokenColumns;
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000886 BreakInserted = true;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000887 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000888 }
889
Alexander Kornienkoa3555e22013-06-19 19:50:11 +0000890 State.Column = RemainingTokenColumns;
891
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000892 if (BreakInserted) {
Alexander Kornienko4d26b6e2013-06-17 12:59:44 +0000893 // If we break the token inside a parameter list, we need to break before
894 // the next parameter on all levels, so that the next parameter is clearly
895 // visible. Line comments already introduce a break.
896 if (Current.Type != TT_LineComment) {
897 for (unsigned i = 0, e = State.Stack.size(); i != e; ++i)
898 State.Stack[i].BreakBeforeParameter = true;
899 }
900
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000901 State.Stack.back().LastSpace = StartColumn;
Manuel Klimek1998ea22013-02-20 10:15:13 +0000902 }
Manuel Klimek1998ea22013-02-20 10:15:13 +0000903 return Penalty;
904 }
905
Daniel Jasper2df93312013-01-09 10:16:05 +0000906 unsigned getColumnLimit() {
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000907 // In preprocessor directives reserve two chars for trailing " \"
908 return Style.ColumnLimit - (Line.InPPDirective ? 2 : 0);
Daniel Jasper2df93312013-01-09 10:16:05 +0000909 }
910
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000911 /// \brief An edge in the solution space from \c Previous->State to \c State,
912 /// inserting a newline dependent on the \c NewLine.
913 struct StateNode {
914 StateNode(const LineState &State, bool NewLine, StateNode *Previous)
Daniel Jasper12ef4e52013-02-21 21:33:55 +0000915 : State(State), NewLine(NewLine), Previous(Previous) {}
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000916 LineState State;
917 bool NewLine;
918 StateNode *Previous;
919 };
Daniel Jasper4b866272013-02-01 11:00:45 +0000920
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000921 /// \brief A pair of <penalty, count> that is used to prioritize the BFS on.
922 ///
923 /// In case of equal penalties, we want to prefer states that were inserted
924 /// first. During state generation we make sure that we insert states first
925 /// that break the line as late as possible.
926 typedef std::pair<unsigned, unsigned> OrderedPenalty;
927
928 /// \brief An item in the prioritized BFS search queue. The \c StateNode's
929 /// \c State has the given \c OrderedPenalty.
930 typedef std::pair<OrderedPenalty, StateNode *> QueueItem;
931
932 /// \brief The BFS queue type.
933 typedef std::priority_queue<QueueItem, std::vector<QueueItem>,
934 std::greater<QueueItem> > QueueType;
Daniel Jasper4b866272013-02-01 11:00:45 +0000935
936 /// \brief Analyze the entire solution space starting from \p InitialState.
Daniel Jasperf7935112012-12-03 18:12:45 +0000937 ///
Daniel Jasper4b866272013-02-01 11:00:45 +0000938 /// This implements a variant of Dijkstra's algorithm on the graph that spans
939 /// the solution space (\c LineStates are the nodes). The algorithm tries to
940 /// find the shortest path (the one with lowest penalty) from \p InitialState
941 /// to a state where all tokens are placed.
Manuel Klimek4fe43002013-05-22 12:51:29 +0000942 void analyzeSolutionSpace(LineState &InitialState) {
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000943 std::set<LineState> Seen;
944
Daniel Jasper4b866272013-02-01 11:00:45 +0000945 // Insert start element into queue.
Daniel Jasper687af3b2013-02-14 14:26:07 +0000946 StateNode *Node =
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000947 new (Allocator.Allocate()) StateNode(InitialState, false, NULL);
948 Queue.push(QueueItem(OrderedPenalty(0, Count), Node));
949 ++Count;
Daniel Jasper4b866272013-02-01 11:00:45 +0000950
951 // While not empty, take first element and follow edges.
952 while (!Queue.empty()) {
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000953 unsigned Penalty = Queue.top().first.first;
Daniel Jasper687af3b2013-02-14 14:26:07 +0000954 StateNode *Node = Queue.top().second;
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000955 if (Node->State.NextToken == NULL) {
Alexander Kornienko49149672013-05-10 11:56:10 +0000956 DEBUG(llvm::dbgs() << "\n---\nPenalty for line: " << Penalty << "\n");
Daniel Jasper4b866272013-02-01 11:00:45 +0000957 break;
Daniel Jasper3a9370c2013-02-04 07:21:18 +0000958 }
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000959 Queue.pop();
Daniel Jasper4b866272013-02-01 11:00:45 +0000960
Daniel Jasperf8114cf2013-05-22 05:27:42 +0000961 // Cut off the analysis of certain solutions if the analysis gets too
962 // complex. See description of IgnoreStackForComparison.
963 if (Count > 10000)
964 Node->State.IgnoreStackForComparison = true;
965
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000966 if (!Seen.insert(Node->State).second)
967 // State already examined with lower penalty.
968 continue;
Daniel Jasper4b866272013-02-01 11:00:45 +0000969
Nico Weber9096fc02013-06-26 00:30:14 +0000970 addNextStateToQueue(Penalty, Node, /*NewLine=*/false);
971 addNextStateToQueue(Penalty, Node, /*NewLine=*/true);
Daniel Jasper4b866272013-02-01 11:00:45 +0000972 }
973
974 if (Queue.empty())
975 // We were unable to find a solution, do nothing.
976 // FIXME: Add diagnostic?
Manuel Klimek4fe43002013-05-22 12:51:29 +0000977 return;
Daniel Jasperf7935112012-12-03 18:12:45 +0000978
Daniel Jasper4b866272013-02-01 11:00:45 +0000979 // Reconstruct the solution.
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000980 reconstructPath(InitialState, Queue.top().second);
Alexander Kornienko49149672013-05-10 11:56:10 +0000981 DEBUG(llvm::dbgs() << "Total number of analyzed states: " << Count << "\n");
982 DEBUG(llvm::dbgs() << "---\n");
Manuel Klimek2ef908e2013-02-13 10:46:36 +0000983 }
984
985 void reconstructPath(LineState &State, StateNode *Current) {
Manuel Klimek4c5c28b2013-05-29 15:10:11 +0000986 std::deque<StateNode *> Path;
987 // We do not need a break before the initial token.
988 while (Current->Previous) {
989 Path.push_front(Current);
990 Current = Current->Previous;
991 }
992 for (std::deque<StateNode *>::iterator I = Path.begin(), E = Path.end();
993 I != E; ++I) {
994 DEBUG({
995 if ((*I)->NewLine) {
996 llvm::dbgs() << "Penalty for splitting before "
997 << (*I)->Previous->State.NextToken->Tok.getName() << ": "
998 << (*I)->Previous->State.NextToken->SplitPenalty << "\n";
999 }
1000 });
1001 addTokenToState((*I)->NewLine, false, State);
1002 }
Daniel Jasper4b866272013-02-01 11:00:45 +00001003 }
1004
Manuel Klimekaf491072013-02-13 10:54:19 +00001005 /// \brief Add the following state to the analysis queue \c Queue.
Daniel Jasper4b866272013-02-01 11:00:45 +00001006 ///
Manuel Klimekaf491072013-02-13 10:54:19 +00001007 /// Assume the current state is \p PreviousNode and has been reached with a
Daniel Jasper4b866272013-02-01 11:00:45 +00001008 /// penalty of \p Penalty. Insert a line break if \p NewLine is \c true.
Manuel Klimekaf491072013-02-13 10:54:19 +00001009 void addNextStateToQueue(unsigned Penalty, StateNode *PreviousNode,
1010 bool NewLine) {
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001011 if (NewLine && !canBreak(PreviousNode->State))
Daniel Jasper4b866272013-02-01 11:00:45 +00001012 return;
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001013 if (!NewLine && mustBreak(PreviousNode->State))
Daniel Jasper4b866272013-02-01 11:00:45 +00001014 return;
Daniel Jasper20b09ef2013-01-28 09:35:24 +00001015 if (NewLine)
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001016 Penalty += PreviousNode->State.NextToken->SplitPenalty;
1017
1018 StateNode *Node = new (Allocator.Allocate())
1019 StateNode(PreviousNode->State, NewLine, PreviousNode);
Manuel Klimek1998ea22013-02-20 10:15:13 +00001020 Penalty += addTokenToState(NewLine, true, Node->State);
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001021 if (Node->State.Column > getColumnLimit()) {
1022 unsigned ExcessCharacters = Node->State.Column - getColumnLimit();
Daniel Jasper3a9370c2013-02-04 07:21:18 +00001023 Penalty += Style.PenaltyExcessCharacter * ExcessCharacters;
Daniel Jasper2df93312013-01-09 10:16:05 +00001024 }
Manuel Klimek2ef908e2013-02-13 10:46:36 +00001025
1026 Queue.push(QueueItem(OrderedPenalty(Penalty, Count), Node));
1027 ++Count;
Daniel Jasper4b866272013-02-01 11:00:45 +00001028 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001029
Daniel Jasper4b866272013-02-01 11:00:45 +00001030 /// \brief Returns \c true, if a line break after \p State is allowed.
1031 bool canBreak(const LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001032 const FormatToken &Current = *State.NextToken;
1033 const FormatToken &Previous = *Current.Previous;
1034 assert(&Previous == Current.Previous);
Daniel Jasper473c62c2013-05-17 09:35:01 +00001035 if (!Current.CanBreakBefore &&
1036 !(Current.is(tok::r_brace) &&
Daniel Jasper4b866272013-02-01 11:00:45 +00001037 State.Stack.back().BreakBeforeClosingBrace))
1038 return false;
Daniel Jasper473c62c2013-05-17 09:35:01 +00001039 // The opening "{" of a braced list has to be on the same line as the first
1040 // element if it is nested in another braced init list or function call.
1041 if (!Current.MustBreakBefore && Previous.is(tok::l_brace) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001042 Previous.Previous &&
1043 Previous.Previous->isOneOf(tok::l_brace, tok::l_paren, tok::comma))
Daniel Jasper473c62c2013-05-17 09:35:01 +00001044 return false;
Daniel Jasper32a796b2013-05-27 11:50:16 +00001045 // This prevents breaks like:
1046 // ...
1047 // SomeParameter, OtherParameter).DoSomething(
1048 // ...
1049 // As they hide "DoSomething" and are generally bad for readability.
Daniel Jasper80503952013-06-03 09:54:46 +00001050 if (Previous.opensScope() && State.LowestCallLevel < State.StartOfLineLevel)
Daniel Jasper32a796b2013-05-27 11:50:16 +00001051 return false;
Daniel Jaspercc960fa2013-04-22 07:59:53 +00001052 return !State.Stack.back().NoLineBreak;
Daniel Jasper4b866272013-02-01 11:00:45 +00001053 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001054
Daniel Jasper4b866272013-02-01 11:00:45 +00001055 /// \brief Returns \c true, if a line break after \p State is mandatory.
1056 bool mustBreak(const LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001057 const FormatToken &Current = *State.NextToken;
1058 const FormatToken &Previous = *Current.Previous;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001059 if (Current.MustBreakBefore || Current.Type == TT_InlineASMColon)
Daniel Jasper4b866272013-02-01 11:00:45 +00001060 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001061 if (Current.is(tok::r_brace) && State.Stack.back().BreakBeforeClosingBrace)
Daniel Jasper4b866272013-02-01 11:00:45 +00001062 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001063 if (Previous.is(tok::semi) && State.LineContainsContinuedForLoopSection)
Daniel Jasper4b866272013-02-01 11:00:45 +00001064 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001065 if ((Previous.isOneOf(tok::comma, tok::semi) || Current.is(tok::question) ||
1066 Current.Type == TT_ConditionalExpr) &&
Daniel Jasperacc33662013-02-08 08:22:00 +00001067 State.Stack.back().BreakBeforeParameter &&
Daniel Jasperd69fc772013-05-08 14:12:04 +00001068 !Current.isTrailingComment() &&
1069 !Current.isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper4b866272013-02-01 11:00:45 +00001070 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001071
1072 // If we need to break somewhere inside the LHS of a binary expression, we
Daniel Jasper7ae41cd2013-07-03 10:34:47 +00001073 // should also break after the operator. Otherwise, the formatting would
1074 // hide the operator precedence, e.g. in:
1075 // if (aaaaaaaaaaaaaa ==
1076 // bbbbbbbbbbbbbb && c) {..
1077 // For comparisons, we only apply this rule, if the LHS is a binary
1078 // expression itself as otherwise, the line breaks seem superfluous.
1079 // We need special cases for ">>" which we have split into two ">" while
1080 // lexing in order to make template parsing easier.
1081 bool IsComparison = (Previous.getPrecedence() == prec::Relational ||
1082 Previous.getPrecedence() == prec::Equality) &&
1083 Previous.Previous &&
1084 Previous.Previous->Type != TT_BinaryOperator; // For >>.
1085 bool LHSIsBinaryExpr =
1086 Previous.Previous && Previous.Previous->FakeRParens > 0;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001087 if (Previous.Type == TT_BinaryOperator &&
Daniel Jasper7ae41cd2013-07-03 10:34:47 +00001088 (!IsComparison || LHSIsBinaryExpr) &&
1089 Current.Type != TT_BinaryOperator && // For >>.
Daniel Jasper68d888c2013-06-03 08:42:05 +00001090 !Current.isTrailingComment() &&
Daniel Jasperd69fc772013-05-08 14:12:04 +00001091 !Previous.isOneOf(tok::lessless, tok::question) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001092 Previous.getPrecedence() != prec::Assignment &&
Daniel Jasperacc33662013-02-08 08:22:00 +00001093 State.Stack.back().BreakBeforeParameter)
Daniel Jasper1ac3e052013-02-05 10:07:47 +00001094 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001095
1096 // FIXME: Comparing LongestObjCSelectorName to 0 is a hacky way of finding
1097 // out whether it is the first parameter. Clean this up.
1098 if (Current.Type == TT_ObjCSelectorName &&
1099 Current.LongestObjCSelectorName == 0 &&
1100 State.Stack.back().BreakBeforeParameter)
Daniel Jasper4b866272013-02-01 11:00:45 +00001101 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001102 if ((Current.Type == TT_CtorInitializerColon ||
1103 (Previous.ClosesTemplateDeclaration && State.ParenLevel == 0)))
Daniel Jasper40aacf42013-03-14 13:45:21 +00001104 return true;
Daniel Jasperd69fc772013-05-08 14:12:04 +00001105
Daniel Jasperc6fbc212013-05-15 09:35:08 +00001106 if (Current.Type == TT_StartOfName && Line.MightBeFunctionDecl &&
1107 State.Stack.back().BreakBeforeParameter && State.ParenLevel == 0)
1108 return true;
Daniel Jasper4b866272013-02-01 11:00:45 +00001109 return false;
Daniel Jasperf7935112012-12-03 18:12:45 +00001110 }
1111
Daniel Jasper9b334242013-03-15 14:57:30 +00001112 // Returns the total number of columns required for the remaining tokens.
1113 unsigned getRemainingLength(const LineState &State) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001114 if (State.NextToken && State.NextToken->Previous)
1115 return Line.Last->TotalLength - State.NextToken->Previous->TotalLength;
Daniel Jasper9b334242013-03-15 14:57:30 +00001116 return 0;
1117 }
1118
Daniel Jasperf7935112012-12-03 18:12:45 +00001119 FormatStyle Style;
1120 SourceManager &SourceMgr;
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001121 const AnnotatedLine &Line;
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001122 const unsigned FirstIndent;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001123 const FormatToken *RootToken;
Daniel Jasperaa701fa2013-01-18 08:44:07 +00001124 WhitespaceManager &Whitespaces;
Manuel Klimekaf491072013-02-13 10:54:19 +00001125
1126 llvm::SpecificBumpPtrAllocator<StateNode> Allocator;
1127 QueueType Queue;
1128 // Increasing count of \c StateNode items we have created. This is used
1129 // to create a deterministic order independent of the container.
1130 unsigned Count;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001131 encoding::Encoding Encoding;
Daniel Jasperf7935112012-12-03 18:12:45 +00001132};
1133
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001134class FormatTokenLexer {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001135public:
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001136 FormatTokenLexer(Lexer &Lex, SourceManager &SourceMgr,
1137 encoding::Encoding Encoding)
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001138 : FormatTok(NULL), GreaterStashed(false), TrailingWhitespace(0), Lex(Lex),
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001139 SourceMgr(SourceMgr), IdentTable(Lex.getLangOpts()),
1140 Encoding(Encoding) {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001141 Lex.SetKeepWhitespaceMode(true);
1142 }
1143
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001144 ArrayRef<FormatToken *> lex() {
1145 assert(Tokens.empty());
1146 do {
1147 Tokens.push_back(getNextToken());
1148 } while (Tokens.back()->Tok.isNot(tok::eof));
1149 return Tokens;
1150 }
1151
1152 IdentifierTable &getIdentTable() { return IdentTable; }
1153
1154private:
1155 FormatToken *getNextToken() {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001156 if (GreaterStashed) {
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001157 // Create a synthesized second '>' token.
1158 Token Greater = FormatTok->Tok;
1159 FormatTok = new (Allocator.Allocate()) FormatToken;
1160 FormatTok->Tok = Greater;
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001161 SourceLocation GreaterLocation =
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001162 FormatTok->Tok.getLocation().getLocWithOffset(1);
1163 FormatTok->WhitespaceRange =
1164 SourceRange(GreaterLocation, GreaterLocation);
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001165 FormatTok->TokenText = ">";
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001166 FormatTok->CodePointCount = 1;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001167 GreaterStashed = false;
1168 return FormatTok;
1169 }
1170
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001171 FormatTok = new (Allocator.Allocate()) FormatToken;
1172 Lex.LexFromRawLexer(FormatTok->Tok);
1173 StringRef Text = rawTokenText(FormatTok->Tok);
Manuel Klimek9043c742013-05-27 15:23:34 +00001174 SourceLocation WhitespaceStart =
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001175 FormatTok->Tok.getLocation().getLocWithOffset(-TrailingWhitespace);
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001176 if (SourceMgr.getFileOffset(WhitespaceStart) == 0)
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001177 FormatTok->IsFirst = true;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001178
1179 // Consume and record whitespace until we find a significant token.
Manuel Klimek9043c742013-05-27 15:23:34 +00001180 unsigned WhitespaceLength = TrailingWhitespace;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001181 while (FormatTok->Tok.is(tok::unknown)) {
Manuel Klimek0c137952013-02-11 12:33:24 +00001182 unsigned Newlines = Text.count('\n');
Daniel Jasper973c9422013-03-04 13:43:19 +00001183 if (Newlines > 0)
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001184 FormatTok->LastNewlineOffset = WhitespaceLength + Text.rfind('\n') + 1;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001185 FormatTok->NewlinesBefore += Newlines;
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001186 unsigned EscapedNewlines = Text.count("\\\n");
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001187 FormatTok->HasUnescapedNewline |= EscapedNewlines != Newlines;
1188 WhitespaceLength += FormatTok->Tok.getLength();
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001189
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001190 Lex.LexFromRawLexer(FormatTok->Tok);
1191 Text = rawTokenText(FormatTok->Tok);
Manuel Klimek1abf7892013-01-04 23:34:14 +00001192 }
Manuel Klimekef920692013-01-07 07:56:50 +00001193
Manuel Klimek1abf7892013-01-04 23:34:14 +00001194 // In case the token starts with escaped newlines, we want to
1195 // take them into account as whitespace - this pattern is quite frequent
1196 // in macro definitions.
1197 // FIXME: What do we want to do with other escaped spaces, and escaped
1198 // spaces or newlines in the middle of tokens?
1199 // FIXME: Add a more explicit test.
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001200 while (Text.size() > 1 && Text[0] == '\\' && Text[1] == '\n') {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001201 // FIXME: ++FormatTok->NewlinesBefore is missing...
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001202 WhitespaceLength += 2;
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001203 Text = Text.substr(2);
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001204 }
1205
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001206 TrailingWhitespace = 0;
1207 if (FormatTok->Tok.is(tok::comment)) {
1208 StringRef UntrimmedText = Text;
1209 Text = Text.rtrim();
1210 TrailingWhitespace = UntrimmedText.size() - Text.size();
1211 } else if (FormatTok->Tok.is(tok::raw_identifier)) {
Manuel Klimek1abf7892013-01-04 23:34:14 +00001212 IdentifierInfo &Info = IdentTable.get(Text);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001213 FormatTok->Tok.setIdentifierInfo(&Info);
1214 FormatTok->Tok.setKind(Info.getTokenID());
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001215 } else if (FormatTok->Tok.is(tok::greatergreater)) {
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001216 FormatTok->Tok.setKind(tok::greater);
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001217 Text = Text.substr(0, 1);
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001218 GreaterStashed = true;
1219 }
1220
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001221 // Now FormatTok is the next non-whitespace token.
1222 FormatTok->TokenText = Text;
1223 FormatTok->CodePointCount = encoding::getCodePointCount(Text, Encoding);
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001224
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001225 FormatTok->WhitespaceRange = SourceRange(
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001226 WhitespaceStart, WhitespaceStart.getLocWithOffset(WhitespaceLength));
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001227 return FormatTok;
1228 }
1229
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001230 FormatToken *FormatTok;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001231 bool GreaterStashed;
Manuel Klimek9043c742013-05-27 15:23:34 +00001232 unsigned TrailingWhitespace;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001233 Lexer &Lex;
1234 SourceManager &SourceMgr;
1235 IdentifierTable IdentTable;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001236 encoding::Encoding Encoding;
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001237 llvm::SpecificBumpPtrAllocator<FormatToken> Allocator;
1238 SmallVector<FormatToken *, 16> Tokens;
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001239
1240 /// Returns the text of \c FormatTok.
Manuel Klimekef920692013-01-07 07:56:50 +00001241 StringRef rawTokenText(Token &Tok) {
Alexander Kornienkoe3276842012-12-07 16:15:44 +00001242 return StringRef(SourceMgr.getCharacterData(Tok.getLocation()),
1243 Tok.getLength());
1244 }
1245};
1246
Daniel Jasperf7935112012-12-03 18:12:45 +00001247class Formatter : public UnwrappedLineConsumer {
1248public:
Daniel Jasperd2ae41a2013-05-15 08:14:19 +00001249 Formatter(const FormatStyle &Style, Lexer &Lex, SourceManager &SourceMgr,
Daniel Jasperf7935112012-12-03 18:12:45 +00001250 const std::vector<CharSourceRange> &Ranges)
Daniel Jasperd2ae41a2013-05-15 08:14:19 +00001251 : Style(Style), Lex(Lex), SourceMgr(SourceMgr),
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001252 Whitespaces(SourceMgr, Style), Ranges(Ranges),
1253 Encoding(encoding::detectEncoding(Lex.getBuffer())) {
1254 DEBUG(llvm::dbgs()
1255 << "File encoding: "
1256 << (Encoding == encoding::Encoding_UTF8 ? "UTF8" : "unknown")
1257 << "\n");
1258 }
Daniel Jasperf7935112012-12-03 18:12:45 +00001259
Daniel Jasperfd8c4b12013-01-11 14:23:32 +00001260 virtual ~Formatter() {}
Daniel Jasper61bd3a12012-12-04 21:05:31 +00001261
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001262 tooling::Replacements format() {
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001263 FormatTokenLexer Tokens(Lex, SourceMgr, Encoding);
Manuel Klimek15dfe7a2013-05-28 11:55:06 +00001264
1265 UnwrappedLineParser Parser(Style, Tokens.lex(), *this);
Manuel Klimek1a18c402013-04-12 14:13:36 +00001266 bool StructuralError = Parser.parse();
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001267 TokenAnnotator Annotator(Style, Tokens.getIdentTable().get("in"));
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001268 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1269 Annotator.annotate(AnnotatedLines[i]);
1270 }
1271 deriveLocalStyle();
1272 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1273 Annotator.calculateFormattingInformation(AnnotatedLines[i]);
1274 }
Daniel Jasperb67cc422013-04-09 17:46:55 +00001275
1276 // Adapt level to the next line if this is a comment.
1277 // FIXME: Can/should this be done in the UnwrappedLineParser?
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001278 const AnnotatedLine *NextNonCommentLine = NULL;
Daniel Jasperb67cc422013-04-09 17:46:55 +00001279 for (unsigned i = AnnotatedLines.size() - 1; i > 0; --i) {
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001280 if (NextNonCommentLine && AnnotatedLines[i].First->is(tok::comment) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001281 !AnnotatedLines[i].First->Next)
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001282 AnnotatedLines[i].Level = NextNonCommentLine->Level;
Daniel Jasperb67cc422013-04-09 17:46:55 +00001283 else
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001284 NextNonCommentLine =
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001285 AnnotatedLines[i].First->isNot(tok::r_brace) ? &AnnotatedLines[i]
1286 : NULL;
Daniel Jasperb67cc422013-04-09 17:46:55 +00001287 }
1288
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001289 std::vector<int> IndentForLevel;
1290 bool PreviousLineWasTouched = false;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001291 const FormatToken *PreviousLineLastToken = 0;
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001292 bool FormatPPDirective = false;
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001293 for (std::vector<AnnotatedLine>::iterator I = AnnotatedLines.begin(),
1294 E = AnnotatedLines.end();
1295 I != E; ++I) {
1296 const AnnotatedLine &TheLine = *I;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001297 const FormatToken *FirstTok = TheLine.First;
1298 int Offset = getIndentOffset(*TheLine.First);
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001299
1300 // Check whether this line is part of a formatted preprocessor directive.
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001301 if (FirstTok->HasUnescapedNewline)
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001302 FormatPPDirective = false;
1303 if (!FormatPPDirective && TheLine.InPPDirective &&
1304 (touchesLine(TheLine) || touchesPPDirective(I + 1, E)))
1305 FormatPPDirective = true;
1306
Daniel Jasper12f9d8e2013-05-14 09:30:02 +00001307 // Determine indent and try to merge multiple unwrapped lines.
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001308 while (IndentForLevel.size() <= TheLine.Level)
1309 IndentForLevel.push_back(-1);
1310 IndentForLevel.resize(TheLine.Level + 1);
Daniel Jasper12f9d8e2013-05-14 09:30:02 +00001311 unsigned Indent = getIndent(IndentForLevel, TheLine.Level);
1312 if (static_cast<int>(Indent) + Offset >= 0)
1313 Indent += Offset;
1314 tryFitMultipleLinesInOne(Indent, I, E);
1315
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001316 bool WasMoved = PreviousLineWasTouched && FirstTok->NewlinesBefore == 0;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001317 if (TheLine.First->is(tok::eof)) {
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001318 if (PreviousLineWasTouched) {
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001319 unsigned NewLines = std::min(FirstTok->NewlinesBefore, 1u);
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001320 Whitespaces.replaceWhitespace(*TheLine.First, NewLines, /*Indent*/ 0,
Manuel Klimek4fe43002013-05-22 12:51:29 +00001321 /*TargetColumn*/ 0);
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001322 }
1323 } else if (TheLine.Type != LT_Invalid &&
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001324 (WasMoved || FormatPPDirective || touchesLine(TheLine))) {
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001325 unsigned LevelIndent = getIndent(IndentForLevel, TheLine.Level);
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001326 if (FirstTok->WhitespaceRange.isValid() &&
Manuel Klimek1a18c402013-04-12 14:13:36 +00001327 // Insert a break even if there is a structural error in case where
1328 // we break apart a line consisting of multiple unwrapped lines.
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001329 (FirstTok->NewlinesBefore == 0 || !StructuralError)) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001330 formatFirstToken(*TheLine.First, PreviousLineLastToken, Indent,
Manuel Klimek4fe43002013-05-22 12:51:29 +00001331 TheLine.InPPDirective);
Manuel Klimek1a18c402013-04-12 14:13:36 +00001332 } else {
1333 Indent = LevelIndent =
Manuel Klimek591ab5a2013-05-28 13:42:28 +00001334 SourceMgr.getSpellingColumnNumber(FirstTok->Tok.getLocation()) -
1335 1;
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001336 }
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001337 UnwrappedLineFormatter Formatter(Style, SourceMgr, TheLine, Indent,
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001338 TheLine.First, Whitespaces, Encoding);
Manuel Klimek4fe43002013-05-22 12:51:29 +00001339 Formatter.format(I + 1 != E ? &*(I + 1) : NULL);
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001340 IndentForLevel[TheLine.Level] = LevelIndent;
1341 PreviousLineWasTouched = true;
1342 } else {
Manuel Klimek4fe43002013-05-22 12:51:29 +00001343 // Format the first token if necessary, and notify the WhitespaceManager
1344 // about the unchanged whitespace.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001345 for (const FormatToken *Tok = TheLine.First; Tok != NULL;
1346 Tok = Tok->Next) {
1347 if (Tok == TheLine.First &&
1348 (Tok->NewlinesBefore > 0 || Tok->IsFirst)) {
1349 unsigned LevelIndent =
1350 SourceMgr.getSpellingColumnNumber(Tok->Tok.getLocation()) - 1;
Manuel Klimek4fe43002013-05-22 12:51:29 +00001351 // Remove trailing whitespace of the previous line if it was
1352 // touched.
1353 if (PreviousLineWasTouched || touchesEmptyLineBefore(TheLine)) {
1354 formatFirstToken(*Tok, PreviousLineLastToken, LevelIndent,
1355 TheLine.InPPDirective);
1356 } else {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001357 Whitespaces.addUntouchableToken(*Tok, TheLine.InPPDirective);
Manuel Klimek4fe43002013-05-22 12:51:29 +00001358 }
Daniel Jasper12f9d8e2013-05-14 09:30:02 +00001359
Manuel Klimek4fe43002013-05-22 12:51:29 +00001360 if (static_cast<int>(LevelIndent) - Offset >= 0)
1361 LevelIndent -= Offset;
1362 if (Tok->isNot(tok::comment))
1363 IndentForLevel[TheLine.Level] = LevelIndent;
1364 } else {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001365 Whitespaces.addUntouchableToken(*Tok, TheLine.InPPDirective);
Manuel Klimek4fe43002013-05-22 12:51:29 +00001366 }
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001367 }
1368 // If we did not reformat this unwrapped line, the column at the end of
1369 // the last token is unchanged - thus, we can calculate the end of the
1370 // last token.
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001371 PreviousLineWasTouched = false;
1372 }
Alexander Kornienkofd433362013-03-27 17:08:02 +00001373 PreviousLineLastToken = I->Last;
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001374 }
1375 return Whitespaces.generateReplacements();
1376 }
1377
1378private:
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001379 void deriveLocalStyle() {
1380 unsigned CountBoundToVariable = 0;
1381 unsigned CountBoundToType = 0;
1382 bool HasCpp03IncompatibleFormat = false;
1383 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001384 if (!AnnotatedLines[i].First->Next)
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001385 continue;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001386 FormatToken *Tok = AnnotatedLines[i].First->Next;
1387 while (Tok->Next) {
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001388 if (Tok->Type == TT_PointerOrReference) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001389 bool SpacesBefore =
1390 Tok->WhitespaceRange.getBegin() != Tok->WhitespaceRange.getEnd();
1391 bool SpacesAfter = Tok->Next->WhitespaceRange.getBegin() !=
1392 Tok->Next->WhitespaceRange.getEnd();
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001393 if (SpacesBefore && !SpacesAfter)
1394 ++CountBoundToVariable;
1395 else if (!SpacesBefore && SpacesAfter)
1396 ++CountBoundToType;
1397 }
1398
Daniel Jasper400adc62013-02-08 15:28:42 +00001399 if (Tok->Type == TT_TemplateCloser &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001400 Tok->Previous->Type == TT_TemplateCloser &&
1401 Tok->WhitespaceRange.getBegin() == Tok->WhitespaceRange.getEnd())
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001402 HasCpp03IncompatibleFormat = true;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001403 Tok = Tok->Next;
Daniel Jasper7fce3ab2013-02-06 14:22:40 +00001404 }
1405 }
1406 if (Style.DerivePointerBinding) {
1407 if (CountBoundToType > CountBoundToVariable)
1408 Style.PointerBindsToType = true;
1409 else if (CountBoundToType < CountBoundToVariable)
1410 Style.PointerBindsToType = false;
1411 }
1412 if (Style.Standard == FormatStyle::LS_Auto) {
1413 Style.Standard = HasCpp03IncompatibleFormat ? FormatStyle::LS_Cpp11
1414 : FormatStyle::LS_Cpp03;
1415 }
1416 }
1417
Manuel Klimekb95f5452013-02-08 17:38:27 +00001418 /// \brief Get the indent of \p Level from \p IndentForLevel.
1419 ///
1420 /// \p IndentForLevel must contain the indent for the level \c l
1421 /// at \p IndentForLevel[l], or a value < 0 if the indent for
1422 /// that level is unknown.
Daniel Jasper687af3b2013-02-14 14:26:07 +00001423 unsigned getIndent(const std::vector<int> IndentForLevel, unsigned Level) {
Manuel Klimekb95f5452013-02-08 17:38:27 +00001424 if (IndentForLevel[Level] != -1)
1425 return IndentForLevel[Level];
Manuel Klimekd076dcd2013-02-08 19:53:32 +00001426 if (Level == 0)
1427 return 0;
Manuel Klimek13b97d82013-05-13 08:42:42 +00001428 return getIndent(IndentForLevel, Level - 1) + Style.IndentWidth;
Manuel Klimekb95f5452013-02-08 17:38:27 +00001429 }
1430
1431 /// \brief Get the offset of the line relatively to the level.
1432 ///
1433 /// For example, 'public:' labels in classes are offset by 1 or 2
1434 /// characters to the left from their level.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001435 int getIndentOffset(const FormatToken &RootToken) {
Alexander Kornienkofd433362013-03-27 17:08:02 +00001436 if (RootToken.isAccessSpecifier(false) || RootToken.isObjCAccessSpecifier())
Manuel Klimekb95f5452013-02-08 17:38:27 +00001437 return Style.AccessModifierOffset;
1438 return 0;
1439 }
1440
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001441 /// \brief Tries to merge lines into one.
1442 ///
1443 /// This will change \c Line and \c AnnotatedLine to contain the merged line,
1444 /// if possible; note that \c I will be incremented when lines are merged.
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001445 void tryFitMultipleLinesInOne(unsigned Indent,
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001446 std::vector<AnnotatedLine>::iterator &I,
1447 std::vector<AnnotatedLine>::iterator E) {
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001448 // We can never merge stuff if there are trailing line comments.
1449 if (I->Last->Type == TT_LineComment)
1450 return;
1451
Daniel Jasperc22f5b42013-02-28 11:05:57 +00001452 unsigned Limit = Style.ColumnLimit - Indent;
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001453 // If we already exceed the column limit, we set 'Limit' to 0. The different
1454 // tryMerge..() functions can then decide whether to still do merging.
1455 Limit = I->Last->TotalLength > Limit ? 0 : Limit - I->Last->TotalLength;
Daniel Jasperc36492b2013-01-16 07:02:34 +00001456
Daniel Jasperd41ee2d2013-01-21 14:18:28 +00001457 if (I + 1 == E || (I + 1)->Type == LT_Invalid)
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001458 return;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001459
Daniel Jasperabca58c2013-05-15 14:09:55 +00001460 if (I->Last->is(tok::l_brace)) {
Daniel Jasper25837aa2013-01-14 14:14:23 +00001461 tryMergeSimpleBlock(I, E, Limit);
Daniel Jasper3a685df2013-05-16 12:12:21 +00001462 } else if (Style.AllowShortIfStatementsOnASingleLine &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001463 I->First->is(tok::kw_if)) {
Daniel Jasper3a685df2013-05-16 12:12:21 +00001464 tryMergeSimpleControlStatement(I, E, Limit);
1465 } else if (Style.AllowShortLoopsOnASingleLine &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001466 I->First->isOneOf(tok::kw_for, tok::kw_while)) {
Daniel Jasper3a685df2013-05-16 12:12:21 +00001467 tryMergeSimpleControlStatement(I, E, Limit);
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001468 } else if (I->InPPDirective &&
1469 (I->First->HasUnescapedNewline || I->First->IsFirst)) {
Daniel Jasper39825ea2013-01-14 15:40:57 +00001470 tryMergeSimplePPDirective(I, E, Limit);
Daniel Jasper25837aa2013-01-14 14:14:23 +00001471 }
Daniel Jasper25837aa2013-01-14 14:14:23 +00001472 }
1473
Daniel Jasper39825ea2013-01-14 15:40:57 +00001474 void tryMergeSimplePPDirective(std::vector<AnnotatedLine>::iterator &I,
1475 std::vector<AnnotatedLine>::iterator E,
1476 unsigned Limit) {
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001477 if (Limit == 0)
1478 return;
Daniel Jasper39825ea2013-01-14 15:40:57 +00001479 AnnotatedLine &Line = *I;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001480 if (!(I + 1)->InPPDirective || (I + 1)->First->HasUnescapedNewline)
Daniel Jasper2ab0d012013-01-14 15:52:06 +00001481 return;
Daniel Jasper39825ea2013-01-14 15:40:57 +00001482 if (I + 2 != E && (I + 2)->InPPDirective &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001483 !(I + 2)->First->HasUnescapedNewline)
Daniel Jasper39825ea2013-01-14 15:40:57 +00001484 return;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001485 if (1 + (I + 1)->Last->TotalLength > Limit)
Daniel Jaspera67a8f02013-01-16 10:41:46 +00001486 return;
Daniel Jasper39825ea2013-01-14 15:40:57 +00001487 join(Line, *(++I));
1488 }
1489
Daniel Jasper3a685df2013-05-16 12:12:21 +00001490 void tryMergeSimpleControlStatement(std::vector<AnnotatedLine>::iterator &I,
1491 std::vector<AnnotatedLine>::iterator E,
1492 unsigned Limit) {
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001493 if (Limit == 0)
1494 return;
Manuel Klimekda087612013-01-18 14:46:43 +00001495 if ((I + 1)->InPPDirective != I->InPPDirective ||
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001496 ((I + 1)->InPPDirective && (I + 1)->First->HasUnescapedNewline))
Manuel Klimekda087612013-01-18 14:46:43 +00001497 return;
Daniel Jasper25837aa2013-01-14 14:14:23 +00001498 AnnotatedLine &Line = *I;
Daniel Jasperc36492b2013-01-16 07:02:34 +00001499 if (Line.Last->isNot(tok::r_paren))
1500 return;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001501 if (1 + (I + 1)->Last->TotalLength > Limit)
Daniel Jasper25837aa2013-01-14 14:14:23 +00001502 return;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001503 if ((I + 1)->First->isOneOf(tok::semi, tok::kw_if, tok::kw_for,
1504 tok::kw_while) ||
1505 (I + 1)->First->Type == TT_LineComment)
Daniel Jasper25837aa2013-01-14 14:14:23 +00001506 return;
1507 // Only inline simple if's (no nested if or else).
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001508 if (I + 2 != E && Line.First->is(tok::kw_if) &&
1509 (I + 2)->First->is(tok::kw_else))
Daniel Jasper25837aa2013-01-14 14:14:23 +00001510 return;
1511 join(Line, *(++I));
1512 }
1513
1514 void tryMergeSimpleBlock(std::vector<AnnotatedLine>::iterator &I,
Daniel Jasperbbc84152013-01-29 11:27:30 +00001515 std::vector<AnnotatedLine>::iterator E,
1516 unsigned Limit) {
Daniel Jasperabca58c2013-05-15 14:09:55 +00001517 // No merging if the brace already is on the next line.
1518 if (Style.BreakBeforeBraces != FormatStyle::BS_Attach)
1519 return;
1520
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001521 // First, check that the current line allows merging. This is the case if
1522 // we're not in a control flow statement and the last token is an opening
1523 // brace.
Daniel Jasper25837aa2013-01-14 14:14:23 +00001524 AnnotatedLine &Line = *I;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001525 if (Line.First->isOneOf(tok::kw_if, tok::kw_while, tok::kw_do, tok::r_brace,
1526 tok::kw_else, tok::kw_try, tok::kw_catch,
Daniel Jaspera9eb2aa2013-05-31 14:56:20 +00001527 tok::kw_for,
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001528 // This gets rid of all ObjC @ keywords and methods.
1529 tok::at, tok::minus, tok::plus))
Daniel Jasper25837aa2013-01-14 14:14:23 +00001530 return;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001531
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001532 FormatToken *Tok = (I + 1)->First;
Daniel Jaspera9eb2aa2013-05-31 14:56:20 +00001533 if (Tok->is(tok::r_brace) && !Tok->MustBreakBefore &&
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001534 (Tok->getNextNonComment() == NULL ||
1535 Tok->getNextNonComment()->is(tok::semi))) {
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001536 // We merge empty blocks even if the line exceeds the column limit.
Daniel Jaspereef30492013-02-11 12:36:37 +00001537 Tok->SpacesRequiredBefore = 0;
Daniel Jasper12ef4e52013-02-21 21:33:55 +00001538 Tok->CanBreakBefore = true;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001539 join(Line, *(I + 1));
1540 I += 1;
Daniel Jaspera9eb2aa2013-05-31 14:56:20 +00001541 } else if (Limit != 0 && Line.First->isNot(tok::kw_namespace)) {
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001542 // Check that we still have three lines and they fit into the limit.
1543 if (I + 2 == E || (I + 2)->Type == LT_Invalid ||
1544 !nextTwoLinesFitInto(I, Limit))
Daniel Jasper25837aa2013-01-14 14:14:23 +00001545 return;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001546
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001547 // Second, check that the next line does not contain any braces - if it
1548 // does, readability declines when putting it into a single line.
1549 if ((I + 1)->Last->Type == TT_LineComment || Tok->MustBreakBefore)
1550 return;
1551 do {
Alexander Kornienko62b85b92013-03-13 14:41:29 +00001552 if (Tok->isOneOf(tok::l_brace, tok::r_brace))
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001553 return;
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001554 Tok = Tok->Next;
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001555 } while (Tok != NULL);
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001556
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001557 // Last, check that the third line contains a single closing brace.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001558 Tok = (I + 2)->First;
Alexander Kornienko1efe0a02013-07-04 14:47:51 +00001559 if (Tok->getNextNonComment() != NULL || Tok->isNot(tok::r_brace) ||
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001560 Tok->MustBreakBefore)
1561 return;
1562
1563 join(Line, *(I + 1));
1564 join(Line, *(I + 2));
1565 I += 2;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001566 }
Daniel Jasper25837aa2013-01-14 14:14:23 +00001567 }
1568
1569 bool nextTwoLinesFitInto(std::vector<AnnotatedLine>::iterator I,
1570 unsigned Limit) {
Manuel Klimeka4fe1c12013-01-21 16:42:44 +00001571 return 1 + (I + 1)->Last->TotalLength + 1 + (I + 2)->Last->TotalLength <=
1572 Limit;
Manuel Klimekf4ab9ef2013-01-11 17:54:10 +00001573 }
1574
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001575 void join(AnnotatedLine &A, const AnnotatedLine &B) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001576 assert(!A.Last->Next);
1577 assert(!B.First->Previous);
1578 A.Last->Next = B.First;
1579 B.First->Previous = A.Last;
1580 unsigned LengthA = A.Last->TotalLength + B.First->SpacesRequiredBefore;
1581 for (FormatToken *Tok = B.First; Tok; Tok = Tok->Next) {
1582 Tok->TotalLength += LengthA;
1583 A.Last = Tok;
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001584 }
Manuel Klimek51bd6ec2013-01-10 19:49:59 +00001585 }
1586
Daniel Jasper97b89482013-03-13 07:49:51 +00001587 bool touchesRanges(const CharSourceRange &Range) {
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001588 for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
1589 if (!SourceMgr.isBeforeInTranslationUnit(Range.getEnd(),
1590 Ranges[i].getBegin()) &&
1591 !SourceMgr.isBeforeInTranslationUnit(Ranges[i].getEnd(),
1592 Range.getBegin()))
1593 return true;
1594 }
1595 return false;
1596 }
1597
1598 bool touchesLine(const AnnotatedLine &TheLine) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001599 const FormatToken *First = TheLine.First;
1600 const FormatToken *Last = TheLine.Last;
Daniel Jaspercdd06622013-05-14 10:31:09 +00001601 CharSourceRange LineRange = CharSourceRange::getCharRange(
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001602 First->WhitespaceRange.getBegin().getLocWithOffset(
1603 First->LastNewlineOffset),
Alexander Kornienkoee4ca9b2013-06-07 17:45:07 +00001604 Last->Tok.getLocation().getLocWithOffset(Last->TokenText.size() - 1));
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001605 return touchesRanges(LineRange);
1606 }
1607
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001608 bool touchesPPDirective(std::vector<AnnotatedLine>::iterator I,
1609 std::vector<AnnotatedLine>::iterator E) {
1610 for (; I != E; ++I) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001611 if (I->First->HasUnescapedNewline)
Daniel Jasper1cb530f2013-05-10 13:00:49 +00001612 return false;
1613 if (touchesLine(*I))
1614 return true;
1615 }
1616 return false;
1617 }
1618
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001619 bool touchesEmptyLineBefore(const AnnotatedLine &TheLine) {
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001620 const FormatToken *First = TheLine.First;
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001621 CharSourceRange LineRange = CharSourceRange::getCharRange(
Manuel Klimek5c24cca2013-05-23 10:56:37 +00001622 First->WhitespaceRange.getBegin(),
1623 First->WhitespaceRange.getBegin().getLocWithOffset(
1624 First->LastNewlineOffset));
Daniel Jasperf71cf3b2013-03-07 20:50:00 +00001625 return touchesRanges(LineRange);
Manuel Klimek51bd6ec2013-01-10 19:49:59 +00001626 }
1627
1628 virtual void consumeUnwrappedLine(const UnwrappedLine &TheLine) {
Daniel Jasperdaffc0d2013-01-16 09:10:19 +00001629 AnnotatedLines.push_back(AnnotatedLine(TheLine));
Daniel Jasperf7935112012-12-03 18:12:45 +00001630 }
1631
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001632 /// \brief Add a new line and the required indent before the first Token
1633 /// of the \c UnwrappedLine if there was no structural parsing error.
1634 /// Returns the indent level of the \c UnwrappedLine.
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001635 void formatFirstToken(const FormatToken &RootToken,
1636 const FormatToken *PreviousToken, unsigned Indent,
Manuel Klimek4fe43002013-05-22 12:51:29 +00001637 bool InPPDirective) {
Daniel Jasperbbc84152013-01-29 11:27:30 +00001638 unsigned Newlines =
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001639 std::min(RootToken.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1);
Daniel Jasper1027c6e2013-06-03 16:16:41 +00001640 // Remove empty lines before "}" where applicable.
1641 if (RootToken.is(tok::r_brace) &&
1642 (!RootToken.Next ||
1643 (RootToken.Next->is(tok::semi) && !RootToken.Next->Next)))
1644 Newlines = std::min(Newlines, 1u);
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001645 if (Newlines == 0 && !RootToken.IsFirst)
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001646 Newlines = 1;
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001647
Manuel Klimek4fe43002013-05-22 12:51:29 +00001648 // Insert extra new line before access specifiers.
1649 if (PreviousToken && PreviousToken->isOneOf(tok::semi, tok::r_brace) &&
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001650 RootToken.isAccessSpecifier() && RootToken.NewlinesBefore == 1)
Manuel Klimek4fe43002013-05-22 12:51:29 +00001651 ++Newlines;
Alexander Kornienkofd433362013-03-27 17:08:02 +00001652
Manuel Klimek6e6310e2013-05-29 14:47:47 +00001653 Whitespaces.replaceWhitespace(
1654 RootToken, Newlines, Indent, Indent,
1655 InPPDirective && !RootToken.HasUnescapedNewline);
Manuel Klimek0b689fd2013-01-10 18:45:26 +00001656 }
1657
Daniel Jasperf7935112012-12-03 18:12:45 +00001658 FormatStyle Style;
1659 Lexer &Lex;
1660 SourceManager &SourceMgr;
Daniel Jasperaa701fa2013-01-18 08:44:07 +00001661 WhitespaceManager Whitespaces;
Daniel Jasperf7935112012-12-03 18:12:45 +00001662 std::vector<CharSourceRange> Ranges;
Daniel Jasperf1e4b7d2013-01-14 13:08:07 +00001663 std::vector<AnnotatedLine> AnnotatedLines;
Alexander Kornienkoffcc0102013-06-05 14:09:10 +00001664
1665 encoding::Encoding Encoding;
Daniel Jasperf7935112012-12-03 18:12:45 +00001666};
1667
Craig Topperaf35e852013-06-30 22:29:28 +00001668} // end anonymous namespace
1669
Alexander Kornienkocb45bc12013-04-15 14:28:00 +00001670tooling::Replacements reformat(const FormatStyle &Style, Lexer &Lex,
1671 SourceManager &SourceMgr,
Daniel Jasperd2ae41a2013-05-15 08:14:19 +00001672 std::vector<CharSourceRange> Ranges) {
1673 Formatter formatter(Style, Lex, SourceMgr, Ranges);
Daniel Jasperf7935112012-12-03 18:12:45 +00001674 return formatter.format();
1675}
1676
Daniel Jasperec04c0d2013-05-16 10:40:07 +00001677tooling::Replacements reformat(const FormatStyle &Style, StringRef Code,
1678 std::vector<tooling::Range> Ranges,
1679 StringRef FileName) {
1680 FileManager Files((FileSystemOptions()));
1681 DiagnosticsEngine Diagnostics(
1682 IntrusiveRefCntPtr<DiagnosticIDs>(new DiagnosticIDs),
1683 new DiagnosticOptions);
1684 SourceManager SourceMgr(Diagnostics, Files);
1685 llvm::MemoryBuffer *Buf = llvm::MemoryBuffer::getMemBuffer(Code, FileName);
1686 const clang::FileEntry *Entry =
1687 Files.getVirtualFile(FileName, Buf->getBufferSize(), 0);
1688 SourceMgr.overrideFileContents(Entry, Buf);
1689 FileID ID =
1690 SourceMgr.createFileID(Entry, SourceLocation(), clang::SrcMgr::C_User);
Alexander Kornienko1e808872013-06-28 12:51:24 +00001691 Lexer Lex(ID, SourceMgr.getBuffer(ID), SourceMgr,
1692 getFormattingLangOpts(Style.Standard));
Daniel Jasperec04c0d2013-05-16 10:40:07 +00001693 SourceLocation StartOfFile = SourceMgr.getLocForStartOfFile(ID);
1694 std::vector<CharSourceRange> CharRanges;
1695 for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
1696 SourceLocation Start = StartOfFile.getLocWithOffset(Ranges[i].getOffset());
1697 SourceLocation End = Start.getLocWithOffset(Ranges[i].getLength());
1698 CharRanges.push_back(CharSourceRange::getCharRange(Start, End));
1699 }
1700 return reformat(Style, Lex, SourceMgr, CharRanges);
1701}
1702
Alexander Kornienko1e808872013-06-28 12:51:24 +00001703LangOptions getFormattingLangOpts(FormatStyle::LanguageStandard Standard) {
Daniel Jasperc1fa2812013-01-10 13:08:12 +00001704 LangOptions LangOpts;
1705 LangOpts.CPlusPlus = 1;
Alexander Kornienko1e808872013-06-28 12:51:24 +00001706 LangOpts.CPlusPlus11 = Standard == FormatStyle::LS_Cpp03 ? 0 : 1;
Daniel Jasper55213652013-03-22 10:01:29 +00001707 LangOpts.LineComment = 1;
Daniel Jasperc1fa2812013-01-10 13:08:12 +00001708 LangOpts.Bool = 1;
1709 LangOpts.ObjC1 = 1;
1710 LangOpts.ObjC2 = 1;
1711 return LangOpts;
1712}
1713
Daniel Jasper8d1832e2013-01-07 13:26:07 +00001714} // namespace format
1715} // namespace clang