blob: 7d6bc14241ec1ccc791af9d9cfdd0a8d9bc27b1d [file] [log] [blame]
Daniel Jasperbac016b2012-12-03 18:12:45 +00001//===--- Format.cpp - Format C++ code -------------------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements functions declared in Format.h. This will be
12/// split into separate files as we go.
13///
Daniel Jasperbac016b2012-12-03 18:12:45 +000014//===----------------------------------------------------------------------===//
15
Manuel Klimekca547db2013-01-16 14:55:28 +000016#define DEBUG_TYPE "format-formatter"
17
Alexander Kornienko70ce7882013-04-15 14:28:00 +000018#include "BreakableToken.h"
Daniel Jasper32d28ee2013-01-29 21:01:14 +000019#include "TokenAnnotator.h"
Chandler Carruth55fc8732012-12-04 09:13:33 +000020#include "UnwrappedLineParser.h"
Alexander Kornienko70ce7882013-04-15 14:28:00 +000021#include "WhitespaceManager.h"
Daniel Jasper8a999452013-05-16 10:40:07 +000022#include "clang/Basic/Diagnostic.h"
Daniel Jasper675d2e32012-12-21 10:20:02 +000023#include "clang/Basic/OperatorPrecedence.h"
Chandler Carruthb99083e2013-01-02 10:28:36 +000024#include "clang/Basic/SourceManager.h"
Manuel Klimekca547db2013-01-16 14:55:28 +000025#include "clang/Format/Format.h"
Daniel Jasperbac016b2012-12-03 18:12:45 +000026#include "clang/Lex/Lexer.h"
Alexander Kornienko5262dd92013-03-27 11:52:18 +000027#include "llvm/ADT/STLExtras.h"
Manuel Klimek32a2fd72013-02-13 10:46:36 +000028#include "llvm/Support/Allocator.h"
Manuel Klimekca547db2013-01-16 14:55:28 +000029#include "llvm/Support/Debug.h"
Alexander Kornienkod71ec162013-05-07 15:32:14 +000030#include "llvm/Support/YAMLTraits.h"
Manuel Klimek32a2fd72013-02-13 10:46:36 +000031#include <queue>
Daniel Jasper8822d3a2012-12-04 13:02:32 +000032#include <string>
33
Alexander Kornienkod71ec162013-05-07 15:32:14 +000034namespace llvm {
35namespace yaml {
36template <>
37struct ScalarEnumerationTraits<clang::format::FormatStyle::LanguageStandard> {
Manuel Klimek44135b82013-05-13 12:51:40 +000038 static void enumeration(IO &IO,
39 clang::format::FormatStyle::LanguageStandard &Value) {
40 IO.enumCase(Value, "C++03", clang::format::FormatStyle::LS_Cpp03);
41 IO.enumCase(Value, "C++11", clang::format::FormatStyle::LS_Cpp11);
42 IO.enumCase(Value, "Auto", clang::format::FormatStyle::LS_Auto);
43 }
44};
45
Daniel Jasper1fb8d882013-05-14 09:30:02 +000046template <>
Manuel Klimek44135b82013-05-13 12:51:40 +000047struct ScalarEnumerationTraits<clang::format::FormatStyle::BraceBreakingStyle> {
48 static void
49 enumeration(IO &IO, clang::format::FormatStyle::BraceBreakingStyle &Value) {
50 IO.enumCase(Value, "Attach", clang::format::FormatStyle::BS_Attach);
51 IO.enumCase(Value, "Linux", clang::format::FormatStyle::BS_Linux);
52 IO.enumCase(Value, "Stroustrup", clang::format::FormatStyle::BS_Stroustrup);
Alexander Kornienkod71ec162013-05-07 15:32:14 +000053 }
54};
55
56template <> struct MappingTraits<clang::format::FormatStyle> {
57 static void mapping(llvm::yaml::IO &IO, clang::format::FormatStyle &Style) {
Alexander Kornienkodd256312013-05-10 11:56:10 +000058 if (IO.outputting()) {
59 StringRef StylesArray[] = { "LLVM", "Google", "Chromium", "Mozilla" };
60 ArrayRef<StringRef> Styles(StylesArray);
61 for (size_t i = 0, e = Styles.size(); i < e; ++i) {
62 StringRef StyleName(Styles[i]);
Alexander Kornienko885f87b2013-05-19 00:53:30 +000063 clang::format::FormatStyle PredefinedStyle;
64 if (clang::format::getPredefinedStyle(StyleName, &PredefinedStyle) &&
65 Style == PredefinedStyle) {
Alexander Kornienkodd256312013-05-10 11:56:10 +000066 IO.mapOptional("# BasedOnStyle", StyleName);
67 break;
68 }
69 }
70 } else {
Alexander Kornienkod71ec162013-05-07 15:32:14 +000071 StringRef BasedOnStyle;
72 IO.mapOptional("BasedOnStyle", BasedOnStyle);
Alexander Kornienkod71ec162013-05-07 15:32:14 +000073 if (!BasedOnStyle.empty())
Alexander Kornienko885f87b2013-05-19 00:53:30 +000074 if (!clang::format::getPredefinedStyle(BasedOnStyle, &Style)) {
75 IO.setError(Twine("Unknown value for BasedOnStyle: ", BasedOnStyle));
76 return;
77 }
Alexander Kornienkod71ec162013-05-07 15:32:14 +000078 }
79
80 IO.mapOptional("AccessModifierOffset", Style.AccessModifierOffset);
81 IO.mapOptional("AlignEscapedNewlinesLeft", Style.AlignEscapedNewlinesLeft);
82 IO.mapOptional("AllowAllParametersOfDeclarationOnNextLine",
83 Style.AllowAllParametersOfDeclarationOnNextLine);
84 IO.mapOptional("AllowShortIfStatementsOnASingleLine",
85 Style.AllowShortIfStatementsOnASingleLine);
Daniel Jasperf11bbb92013-05-16 12:12:21 +000086 IO.mapOptional("AllowShortLoopsOnASingleLine",
87 Style.AllowShortLoopsOnASingleLine);
Daniel Jasperbbc87762013-05-29 12:07:31 +000088 IO.mapOptional("AlwaysBreakTemplateDeclarations",
89 Style.AlwaysBreakTemplateDeclarations);
Alexander Kornienkod71ec162013-05-07 15:32:14 +000090 IO.mapOptional("BinPackParameters", Style.BinPackParameters);
91 IO.mapOptional("ColumnLimit", Style.ColumnLimit);
92 IO.mapOptional("ConstructorInitializerAllOnOneLineOrOnePerLine",
93 Style.ConstructorInitializerAllOnOneLineOrOnePerLine);
94 IO.mapOptional("DerivePointerBinding", Style.DerivePointerBinding);
95 IO.mapOptional("IndentCaseLabels", Style.IndentCaseLabels);
96 IO.mapOptional("MaxEmptyLinesToKeep", Style.MaxEmptyLinesToKeep);
97 IO.mapOptional("ObjCSpaceBeforeProtocolList",
98 Style.ObjCSpaceBeforeProtocolList);
Alexander Kornienko2785b9a2013-06-07 16:02:52 +000099 IO.mapOptional("PenaltyBreakComment", Style.PenaltyBreakComment);
100 IO.mapOptional("PenaltyBreakString", Style.PenaltyBreakString);
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000101 IO.mapOptional("PenaltyExcessCharacter", Style.PenaltyExcessCharacter);
102 IO.mapOptional("PenaltyReturnTypeOnItsOwnLine",
103 Style.PenaltyReturnTypeOnItsOwnLine);
104 IO.mapOptional("PointerBindsToType", Style.PointerBindsToType);
105 IO.mapOptional("SpacesBeforeTrailingComments",
106 Style.SpacesBeforeTrailingComments);
Daniel Jasper1bee0732013-05-23 18:05:18 +0000107 IO.mapOptional("SpacesInBracedLists", Style.SpacesInBracedLists);
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000108 IO.mapOptional("Standard", Style.Standard);
Manuel Klimek07a64ec2013-05-13 08:42:42 +0000109 IO.mapOptional("IndentWidth", Style.IndentWidth);
Manuel Klimek7c9a93e2013-05-13 09:22:11 +0000110 IO.mapOptional("UseTab", Style.UseTab);
Manuel Klimek44135b82013-05-13 12:51:40 +0000111 IO.mapOptional("BreakBeforeBraces", Style.BreakBeforeBraces);
Manuel Klimeka9a7f102013-06-21 17:25:42 +0000112 IO.mapOptional("IndentFunctionDeclarationAfterType",
113 Style.IndentFunctionDeclarationAfterType);
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000114 }
115};
116}
117}
118
Daniel Jasperbac016b2012-12-03 18:12:45 +0000119namespace clang {
120namespace format {
121
Daniel Jasperbac016b2012-12-03 18:12:45 +0000122FormatStyle getLLVMStyle() {
123 FormatStyle LLVMStyle;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000124 LLVMStyle.AccessModifierOffset = -2;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000125 LLVMStyle.AlignEscapedNewlinesLeft = false;
Daniel Jasperf1579602013-01-29 16:03:49 +0000126 LLVMStyle.AllowAllParametersOfDeclarationOnNextLine = true;
Daniel Jasper6f5bb2c2013-01-14 16:24:39 +0000127 LLVMStyle.AllowShortIfStatementsOnASingleLine = false;
Daniel Jasperf11bbb92013-05-16 12:12:21 +0000128 LLVMStyle.AllowShortLoopsOnASingleLine = false;
Daniel Jasperbbc87762013-05-29 12:07:31 +0000129 LLVMStyle.AlwaysBreakTemplateDeclarations = false;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000130 LLVMStyle.BinPackParameters = true;
131 LLVMStyle.ColumnLimit = 80;
132 LLVMStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = false;
133 LLVMStyle.DerivePointerBinding = false;
134 LLVMStyle.IndentCaseLabels = false;
135 LLVMStyle.MaxEmptyLinesToKeep = 1;
Nico Weber5f500df2013-01-10 20:12:55 +0000136 LLVMStyle.ObjCSpaceBeforeProtocolList = true;
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000137 LLVMStyle.PenaltyBreakComment = 45;
138 LLVMStyle.PenaltyBreakString = 1000;
Daniel Jasper01786732013-02-04 07:21:18 +0000139 LLVMStyle.PenaltyExcessCharacter = 1000000;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000140 LLVMStyle.PenaltyReturnTypeOnItsOwnLine = 75;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000141 LLVMStyle.PointerBindsToType = false;
142 LLVMStyle.SpacesBeforeTrailingComments = 1;
Daniel Jasper2424eef2013-05-23 10:15:45 +0000143 LLVMStyle.SpacesInBracedLists = true;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000144 LLVMStyle.Standard = FormatStyle::LS_Cpp03;
Manuel Klimek07a64ec2013-05-13 08:42:42 +0000145 LLVMStyle.IndentWidth = 2;
Manuel Klimek7c9a93e2013-05-13 09:22:11 +0000146 LLVMStyle.UseTab = false;
Manuel Klimek44135b82013-05-13 12:51:40 +0000147 LLVMStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
Manuel Klimeka9a7f102013-06-21 17:25:42 +0000148 LLVMStyle.IndentFunctionDeclarationAfterType = false;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000149 return LLVMStyle;
150}
151
152FormatStyle getGoogleStyle() {
153 FormatStyle GoogleStyle;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000154 GoogleStyle.AccessModifierOffset = -1;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000155 GoogleStyle.AlignEscapedNewlinesLeft = true;
Daniel Jasperf1579602013-01-29 16:03:49 +0000156 GoogleStyle.AllowAllParametersOfDeclarationOnNextLine = true;
Daniel Jasper94d6ad72013-04-24 13:46:00 +0000157 GoogleStyle.AllowShortIfStatementsOnASingleLine = true;
Daniel Jasper1bee0732013-05-23 18:05:18 +0000158 GoogleStyle.AllowShortLoopsOnASingleLine = true;
Daniel Jasperbbc87762013-05-29 12:07:31 +0000159 GoogleStyle.AlwaysBreakTemplateDeclarations = true;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000160 GoogleStyle.BinPackParameters = true;
161 GoogleStyle.ColumnLimit = 80;
162 GoogleStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
163 GoogleStyle.DerivePointerBinding = true;
164 GoogleStyle.IndentCaseLabels = true;
165 GoogleStyle.MaxEmptyLinesToKeep = 1;
Nico Weber5f500df2013-01-10 20:12:55 +0000166 GoogleStyle.ObjCSpaceBeforeProtocolList = false;
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000167 GoogleStyle.PenaltyBreakComment = 45;
168 GoogleStyle.PenaltyBreakString = 1000;
Daniel Jasper01786732013-02-04 07:21:18 +0000169 GoogleStyle.PenaltyExcessCharacter = 1000000;
Daniel Jasper1407bee2013-04-11 14:29:13 +0000170 GoogleStyle.PenaltyReturnTypeOnItsOwnLine = 200;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000171 GoogleStyle.PointerBindsToType = true;
172 GoogleStyle.SpacesBeforeTrailingComments = 2;
Daniel Jasper2424eef2013-05-23 10:15:45 +0000173 GoogleStyle.SpacesInBracedLists = false;
Alexander Kornienkofb594862013-05-06 14:11:27 +0000174 GoogleStyle.Standard = FormatStyle::LS_Auto;
Manuel Klimek07a64ec2013-05-13 08:42:42 +0000175 GoogleStyle.IndentWidth = 2;
Manuel Klimek7c9a93e2013-05-13 09:22:11 +0000176 GoogleStyle.UseTab = false;
Manuel Klimek44135b82013-05-13 12:51:40 +0000177 GoogleStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
Manuel Klimeka9a7f102013-06-21 17:25:42 +0000178 GoogleStyle.IndentFunctionDeclarationAfterType = true;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000179 return GoogleStyle;
180}
181
Daniel Jasper6f5bb2c2013-01-14 16:24:39 +0000182FormatStyle getChromiumStyle() {
183 FormatStyle ChromiumStyle = getGoogleStyle();
Daniel Jasperf1579602013-01-29 16:03:49 +0000184 ChromiumStyle.AllowAllParametersOfDeclarationOnNextLine = false;
Daniel Jasper94d6ad72013-04-24 13:46:00 +0000185 ChromiumStyle.AllowShortIfStatementsOnASingleLine = false;
Daniel Jasperf11bbb92013-05-16 12:12:21 +0000186 ChromiumStyle.AllowShortLoopsOnASingleLine = false;
Daniel Jasperfaab0d32013-02-27 09:47:53 +0000187 ChromiumStyle.BinPackParameters = false;
Daniel Jasper8ff690a2013-02-06 14:22:40 +0000188 ChromiumStyle.Standard = FormatStyle::LS_Cpp03;
189 ChromiumStyle.DerivePointerBinding = false;
Daniel Jasper6f5bb2c2013-01-14 16:24:39 +0000190 return ChromiumStyle;
191}
192
Alexander Kornienkofb594862013-05-06 14:11:27 +0000193FormatStyle getMozillaStyle() {
194 FormatStyle MozillaStyle = getLLVMStyle();
195 MozillaStyle.AllowAllParametersOfDeclarationOnNextLine = false;
196 MozillaStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
197 MozillaStyle.DerivePointerBinding = true;
198 MozillaStyle.IndentCaseLabels = true;
199 MozillaStyle.ObjCSpaceBeforeProtocolList = false;
200 MozillaStyle.PenaltyReturnTypeOnItsOwnLine = 200;
201 MozillaStyle.PointerBindsToType = true;
202 return MozillaStyle;
203}
204
Alexander Kornienko885f87b2013-05-19 00:53:30 +0000205bool getPredefinedStyle(StringRef Name, FormatStyle *Style) {
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000206 if (Name.equals_lower("llvm"))
Alexander Kornienko885f87b2013-05-19 00:53:30 +0000207 *Style = getLLVMStyle();
208 else if (Name.equals_lower("chromium"))
209 *Style = getChromiumStyle();
210 else if (Name.equals_lower("mozilla"))
211 *Style = getMozillaStyle();
212 else if (Name.equals_lower("google"))
213 *Style = getGoogleStyle();
214 else
215 return false;
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000216
Alexander Kornienko885f87b2013-05-19 00:53:30 +0000217 return true;
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000218}
219
220llvm::error_code parseConfiguration(StringRef Text, FormatStyle *Style) {
Alexander Kornienko107db3c2013-05-20 15:18:01 +0000221 if (Text.trim().empty())
222 return llvm::make_error_code(llvm::errc::invalid_argument);
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000223 llvm::yaml::Input Input(Text);
224 Input >> *Style;
225 return Input.error();
226}
227
228std::string configurationAsText(const FormatStyle &Style) {
229 std::string Text;
230 llvm::raw_string_ostream Stream(Text);
231 llvm::yaml::Output Output(Stream);
232 // We use the same mapping method for input and output, so we need a non-const
233 // reference here.
234 FormatStyle NonConstStyle = Style;
235 Output << NonConstStyle;
Alexander Kornienko2b6acb62013-05-13 12:56:35 +0000236 return Stream.str();
Alexander Kornienkod71ec162013-05-07 15:32:14 +0000237}
238
Daniel Jasperce3d1a62013-02-08 08:22:00 +0000239// Returns the length of everything up to the first possible line break after
240// the ), ], } or > matching \c Tok.
Manuel Klimekb3987012013-05-29 14:47:47 +0000241static unsigned getLengthToMatchingParen(const FormatToken &Tok) {
Daniel Jasperce3d1a62013-02-08 08:22:00 +0000242 if (Tok.MatchingParen == NULL)
243 return 0;
Manuel Klimekb3987012013-05-29 14:47:47 +0000244 FormatToken *End = Tok.MatchingParen;
245 while (End->Next && !End->Next->CanBreakBefore) {
246 End = End->Next;
Daniel Jasperce3d1a62013-02-08 08:22:00 +0000247 }
248 return End->TotalLength - Tok.TotalLength + 1;
249}
250
Daniel Jasperbac016b2012-12-03 18:12:45 +0000251class UnwrappedLineFormatter {
252public:
Manuel Klimek94fc6f12013-01-10 19:17:33 +0000253 UnwrappedLineFormatter(const FormatStyle &Style, SourceManager &SourceMgr,
Daniel Jasper995e8202013-01-14 13:08:07 +0000254 const AnnotatedLine &Line, unsigned FirstIndent,
Manuel Klimekb3987012013-05-29 14:47:47 +0000255 const FormatToken *RootToken,
Alexander Kornienko00895102013-06-05 14:09:10 +0000256 WhitespaceManager &Whitespaces,
257 encoding::Encoding Encoding)
Daniel Jasper1321eb52012-12-18 21:05:13 +0000258 : Style(Style), SourceMgr(SourceMgr), Line(Line),
Daniel Jasperdcc2a622013-01-18 08:44:07 +0000259 FirstIndent(FirstIndent), RootToken(RootToken),
Alexander Kornienko00895102013-06-05 14:09:10 +0000260 Whitespaces(Whitespaces), Count(0), Encoding(Encoding) {}
Daniel Jasperbac016b2012-12-03 18:12:45 +0000261
Manuel Klimekd4397b92013-01-04 23:34:14 +0000262 /// \brief Formats an \c UnwrappedLine.
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000263 void format(const AnnotatedLine *NextLine) {
Daniel Jasper3b5943f2012-12-06 09:56:08 +0000264 // Initialize state dependent on indent.
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000265 LineState State;
Manuel Klimek3f8c7f32013-01-10 18:45:26 +0000266 State.Column = FirstIndent;
Manuel Klimekb3987012013-05-29 14:47:47 +0000267 State.NextToken = RootToken;
Daniel Jasper6f21a982013-03-13 07:49:51 +0000268 State.Stack.push_back(
Nico Weber27268772013-06-26 00:30:14 +0000269 ParenState(FirstIndent, FirstIndent, /*AvoidBinPacking=*/false,
270 /*NoLineBreak=*/false));
Daniel Jaspera324a0e2012-12-21 14:37:20 +0000271 State.LineContainsContinuedForLoopSection = false;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000272 State.ParenLevel = 0;
Manuel Klimekb56b6d12013-02-20 15:25:48 +0000273 State.StartOfStringLiteral = 0;
Daniel Jaspercf5767d2013-02-18 11:05:07 +0000274 State.StartOfLineLevel = State.ParenLevel;
Daniel Jasperce912f42013-06-03 09:54:46 +0000275 State.LowestCallLevel = State.ParenLevel;
Daniel Jasper54b4e442013-05-22 05:27:42 +0000276 State.IgnoreStackForComparison = false;
Daniel Jasper3b5943f2012-12-06 09:56:08 +0000277
278 // The first token has already been indented and thus consumed.
Nico Weber27268772013-06-26 00:30:14 +0000279 moveStateToNextToken(State, /*DryRun=*/false);
Daniel Jasperbac016b2012-12-03 18:12:45 +0000280
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000281 // If everything fits on a single line, just put it there.
Daniel Jaspera4d46212013-02-28 11:05:57 +0000282 unsigned ColumnLimit = Style.ColumnLimit;
283 if (NextLine && NextLine->InPPDirective &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000284 !NextLine->First->HasUnescapedNewline)
Daniel Jaspera4d46212013-02-28 11:05:57 +0000285 ColumnLimit = getColumnLimit();
286 if (Line.Last->TotalLength <= ColumnLimit - FirstIndent) {
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000287 while (State.NextToken != NULL) {
Daniel Jasper1321eb52012-12-18 21:05:13 +0000288 addTokenToState(false, false, State);
Daniel Jasper1321eb52012-12-18 21:05:13 +0000289 }
Daniel Jasperbac016b2012-12-03 18:12:45 +0000290 }
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000291
Daniel Jasperce3d1a62013-02-08 08:22:00 +0000292 // If the ObjC method declaration does not fit on a line, we should format
293 // it with one arg per line.
294 if (Line.Type == LT_ObjCMethodDecl)
295 State.Stack.back().BreakBeforeParameter = true;
296
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000297 // Find best solution in solution space.
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000298 analyzeSolutionSpace(State);
Daniel Jasperbac016b2012-12-03 18:12:45 +0000299 }
300
301private:
Manuel Klimekb3987012013-05-29 14:47:47 +0000302 void DebugTokenState(const FormatToken &FormatTok) {
303 const Token &Tok = FormatTok.Tok;
Alexander Kornienkodd256312013-05-10 11:56:10 +0000304 llvm::dbgs() << StringRef(SourceMgr.getCharacterData(Tok.getLocation()),
Daniel Jasper1a1ce832013-01-29 11:27:30 +0000305 Tok.getLength());
Alexander Kornienkodd256312013-05-10 11:56:10 +0000306 llvm::dbgs();
Manuel Klimekca547db2013-01-16 14:55:28 +0000307 }
308
/// \brief Formatting properties tracked for one nesting level of a line.
///
/// Instances are ordered by \c operator< so that states can be compared; every
/// member except \c ForFakeParenthesis takes part in that ordering.
struct ParenState {
  /// \brief Creates the state for a new level.
  ///
  /// \param Indent          Column to which this level is indented.
  /// \param LastSpace       Column of the last space on this level.
  /// \param AvoidBinPacking Whether bin packing is avoided on this level.
  /// \param NoLineBreak     Whether line breaks are forbidden on this level.
  ///
  /// All remaining members start out as 0 / \c false.
  ParenState(unsigned Indent, unsigned LastSpace, bool AvoidBinPacking,
             bool NoLineBreak)
      : Indent(Indent), LastSpace(LastSpace), FirstLessLess(0),
        BreakBeforeClosingBrace(false), QuestionColumn(0),
        AvoidBinPacking(AvoidBinPacking), BreakBeforeParameter(false),
        NoLineBreak(NoLineBreak), ColonPos(0), StartOfFunctionCall(0),
        NestedNameSpecifierContinuation(0), CallContinuation(0),
        VariablePos(0), ForFakeParenthesis(false) {}

  /// \brief The position to which a specific parenthesis level needs to be
  /// indented.
  unsigned Indent;

  /// \brief The position of the last space on each level.
  ///
  /// Used e.g. to break like:
  /// functionCall(Parameter, otherCall(
  ///                             OtherParameter));
  unsigned LastSpace;

  /// \brief The position of the first "<<" operator encountered on each level.
  ///
  /// Used to align "<<" operators. 0 if no such operator has been encountered
  /// on a level.
  unsigned FirstLessLess;

  /// \brief Whether a newline needs to be inserted before the block's closing
  /// brace.
  ///
  /// We only want to insert a newline before the closing brace if there also
  /// was a newline after the beginning left brace.
  bool BreakBeforeClosingBrace;

  /// \brief The column of a \c ? in a conditional expression.
  unsigned QuestionColumn;

  /// \brief Avoid bin packing, i.e. multiple parameters/elements on multiple
  /// lines, in this context.
  bool AvoidBinPacking;

  /// \brief Break after the next comma (or all the commas in this context if
  /// \c AvoidBinPacking is \c true).
  bool BreakBeforeParameter;

  /// \brief Line breaking in this context would break a formatting rule.
  bool NoLineBreak;

  /// \brief The position of the colon in an ObjC method declaration/call.
  unsigned ColonPos;

  /// \brief The start of the most recent function in a builder-type call.
  unsigned StartOfFunctionCall;

  /// \brief If a nested name specifier was broken over multiple lines, this
  /// contains the start column of the second line. Otherwise 0.
  unsigned NestedNameSpecifierContinuation;

  /// \brief If a call expression was broken over multiple lines, this
  /// contains the start column of the second line. Otherwise 0.
  unsigned CallContinuation;

  /// \brief The column of the first variable name in a variable declaration.
  ///
  /// Used to align further variables if necessary.
  unsigned VariablePos;

  /// \brief \c true if this \c ParenState was created for a fake parenthesis.
  ///
  /// Does not need to be considered for memoization / the comparison function
  /// as otherwise identical states will have the same fake/non-fake
  /// \c ParenStates.
  bool ForFakeParenthesis;

  /// \brief Lexicographic ordering over all members that influence
  /// formatting.
  ///
  /// Members are compared in declaration order; for \c bool members the
  /// state holding \c true orders first. \c ForFakeParenthesis is skipped on
  /// purpose (see its documentation). \c NestedNameSpecifierContinuation is
  /// included so that two states differing only in that column are not
  /// treated as equivalent.
  bool operator<(const ParenState &Other) const {
    if (Indent != Other.Indent)
      return Indent < Other.Indent;
    if (LastSpace != Other.LastSpace)
      return LastSpace < Other.LastSpace;
    if (FirstLessLess != Other.FirstLessLess)
      return FirstLessLess < Other.FirstLessLess;
    if (BreakBeforeClosingBrace != Other.BreakBeforeClosingBrace)
      return BreakBeforeClosingBrace;
    if (QuestionColumn != Other.QuestionColumn)
      return QuestionColumn < Other.QuestionColumn;
    if (AvoidBinPacking != Other.AvoidBinPacking)
      return AvoidBinPacking;
    if (BreakBeforeParameter != Other.BreakBeforeParameter)
      return BreakBeforeParameter;
    if (NoLineBreak != Other.NoLineBreak)
      return NoLineBreak;
    if (ColonPos != Other.ColonPos)
      return ColonPos < Other.ColonPos;
    if (StartOfFunctionCall != Other.StartOfFunctionCall)
      return StartOfFunctionCall < Other.StartOfFunctionCall;
    if (NestedNameSpecifierContinuation !=
        Other.NestedNameSpecifierContinuation)
      return NestedNameSpecifierContinuation <
             Other.NestedNameSpecifierContinuation;
    if (CallContinuation != Other.CallContinuation)
      return CallContinuation < Other.CallContinuation;
    if (VariablePos != Other.VariablePos)
      return VariablePos < Other.VariablePos;
    return false;
  }
};
411
412 /// \brief The current state when indenting a unwrapped line.
413 ///
414 /// As the indenting tries different combinations this is copied by value.
415 struct LineState {
416 /// \brief The number of used columns in the current line.
417 unsigned Column;
418
419 /// \brief The token that needs to be next formatted.
Manuel Klimekb3987012013-05-29 14:47:47 +0000420 const FormatToken *NextToken;
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000421
Daniel Jaspera324a0e2012-12-21 14:37:20 +0000422 /// \brief \c true if this line contains a continued for-loop section.
423 bool LineContainsContinuedForLoopSection;
424
Daniel Jasper29f123b2013-02-08 15:28:42 +0000425 /// \brief The level of nesting inside (), [], <> and {}.
426 unsigned ParenLevel;
427
Daniel Jaspercf5767d2013-02-18 11:05:07 +0000428 /// \brief The \c ParenLevel at the start of this line.
429 unsigned StartOfLineLevel;
430
Daniel Jasperce912f42013-06-03 09:54:46 +0000431 /// \brief The lowest \c ParenLevel of "." or "->" on the current line.
432 unsigned LowestCallLevel;
Daniel Jasper259a0382013-05-27 11:50:16 +0000433
Manuel Klimekb56b6d12013-02-20 15:25:48 +0000434 /// \brief The start column of the string literal, if we're in a string
435 /// literal sequence, 0 otherwise.
436 unsigned StartOfStringLiteral;
437
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000438 /// \brief A stack keeping track of properties applying to parenthesis
439 /// levels.
440 std::vector<ParenState> Stack;
441
Daniel Jasper54b4e442013-05-22 05:27:42 +0000442 /// \brief Ignore the stack of \c ParenStates for state comparison.
443 ///
444 /// In long and deeply nested unwrapped lines, the current algorithm can
445 /// be insufficient for finding the best formatting with a reasonable amount
446 /// of time and memory. Setting this flag will effectively lead to the
447 /// algorithm not analyzing some combinations. However, these combinations
448 /// rarely contain the optimal solution: In short, accepting a higher
449 /// penalty early would need to lead to different values in the \c
450 /// ParenState stack (in an otherwise identical state) and these different
451 /// values would need to lead to a significant amount of avoided penalty
452 /// later.
453 ///
454 /// FIXME: Come up with a better algorithm instead.
455 bool IgnoreStackForComparison;
456
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000457 /// \brief Comparison operator to be able to used \c LineState in \c map.
458 bool operator<(const LineState &Other) const {
Daniel Jasperd7896702013-02-19 09:28:55 +0000459 if (NextToken != Other.NextToken)
460 return NextToken < Other.NextToken;
461 if (Column != Other.Column)
462 return Column < Other.Column;
Daniel Jasperd7896702013-02-19 09:28:55 +0000463 if (LineContainsContinuedForLoopSection !=
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000464 Other.LineContainsContinuedForLoopSection)
Daniel Jaspera324a0e2012-12-21 14:37:20 +0000465 return LineContainsContinuedForLoopSection;
Daniel Jasperd7896702013-02-19 09:28:55 +0000466 if (ParenLevel != Other.ParenLevel)
467 return ParenLevel < Other.ParenLevel;
468 if (StartOfLineLevel != Other.StartOfLineLevel)
469 return StartOfLineLevel < Other.StartOfLineLevel;
Daniel Jasperce912f42013-06-03 09:54:46 +0000470 if (LowestCallLevel != Other.LowestCallLevel)
471 return LowestCallLevel < Other.LowestCallLevel;
Manuel Klimekb56b6d12013-02-20 15:25:48 +0000472 if (StartOfStringLiteral != Other.StartOfStringLiteral)
473 return StartOfStringLiteral < Other.StartOfStringLiteral;
Daniel Jasper54b4e442013-05-22 05:27:42 +0000474 if (IgnoreStackForComparison || Other.IgnoreStackForComparison)
475 return false;
Daniel Jasperd7896702013-02-19 09:28:55 +0000476 return Stack < Other.Stack;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000477 }
478 };
479
Daniel Jasper20409152012-12-04 14:54:30 +0000480 /// \brief Appends the next token to \p State and updates information
481 /// necessary for indentation.
482 ///
Nico Weber1907c572013-06-26 02:42:46 +0000483 /// Puts the token on the current line if \p Newline is \c false and adds a
Daniel Jasper20409152012-12-04 14:54:30 +0000484 /// line break and necessary indentation otherwise.
485 ///
486 /// If \p DryRun is \c false, also creates and stores the required
487 /// \c Replacement.
Manuel Klimek8092a942013-02-20 10:15:13 +0000488 unsigned addTokenToState(bool Newline, bool DryRun, LineState &State) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000489 const FormatToken &Current = *State.NextToken;
490 const FormatToken &Previous = *State.NextToken->Previous;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000491
Daniel Jasper92f9faf2013-03-20 15:58:10 +0000492 if (State.Stack.size() == 0 || Current.Type == TT_ImplicitStringLiteral) {
Manuel Klimekad3094b2013-05-23 10:56:37 +0000493 // FIXME: Is this correct?
Manuel Klimekb3987012013-05-29 14:47:47 +0000494 int WhitespaceLength = SourceMgr.getSpellingColumnNumber(
495 State.NextToken->WhitespaceRange.getEnd()) -
496 SourceMgr.getSpellingColumnNumber(
497 State.NextToken->WhitespaceRange.getBegin());
Alexander Kornienko00895102013-06-05 14:09:10 +0000498 State.Column += WhitespaceLength + State.NextToken->CodePointCount;
Manuel Klimekb3987012013-05-29 14:47:47 +0000499 State.NextToken = State.NextToken->Next;
Manuel Klimek8092a942013-02-20 10:15:13 +0000500 return 0;
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000501 }
502
Daniel Jasper3776ef32013-04-03 07:21:51 +0000503 // If we are continuing an expression, we want to indent an extra 4 spaces.
504 unsigned ContinuationIndent =
Daniel Jasper37911302013-04-02 14:33:13 +0000505 std::max(State.Stack.back().LastSpace, State.Stack.back().Indent) + 4;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000506 if (Newline) {
Manuel Klimekbb42bf12013-01-10 11:52:21 +0000507 if (Current.is(tok::r_brace)) {
Manuel Klimek07a64ec2013-05-13 08:42:42 +0000508 State.Column = Line.Level * Style.IndentWidth;
Daniel Jasper9c837d02013-01-09 07:06:56 +0000509 } else if (Current.is(tok::string_literal) &&
Manuel Klimekb56b6d12013-02-20 15:25:48 +0000510 State.StartOfStringLiteral != 0) {
511 State.Column = State.StartOfStringLiteral;
Daniel Jasper66d19bd2013-02-18 11:59:17 +0000512 State.Stack.back().BreakBeforeParameter = true;
Daniel Jasper9c837d02013-01-09 07:06:56 +0000513 } else if (Current.is(tok::lessless) &&
Daniel Jasper29f123b2013-02-08 15:28:42 +0000514 State.Stack.back().FirstLessLess != 0) {
515 State.Column = State.Stack.back().FirstLessLess;
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000516 } else if (Current.isOneOf(tok::period, tok::arrow) &&
517 Current.Type != TT_DesignatedInitializerPeriod) {
Daniel Jasper3776ef32013-04-03 07:21:51 +0000518 if (State.Stack.back().CallContinuation == 0) {
519 State.Column = ContinuationIndent;
Daniel Jasper37911302013-04-02 14:33:13 +0000520 State.Stack.back().CallContinuation = State.Column;
Daniel Jasper3776ef32013-04-03 07:21:51 +0000521 } else {
522 State.Column = State.Stack.back().CallContinuation;
523 }
Daniel Jasperbfe6fd42013-01-28 12:45:14 +0000524 } else if (Current.Type == TT_ConditionalExpr) {
525 State.Column = State.Stack.back().QuestionColumn;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000526 } else if (Previous.is(tok::comma) &&
527 State.Stack.back().VariablePos != 0) {
528 State.Column = State.Stack.back().VariablePos;
Daniel Jasper3c08a812013-02-24 18:54:32 +0000529 } else if (Previous.ClosesTemplateDeclaration ||
Daniel Jasper53e72cd2013-05-06 08:27:33 +0000530 (Current.Type == TT_StartOfName && State.ParenLevel == 0 &&
Manuel Klimeka9a7f102013-06-21 17:25:42 +0000531 (!Style.IndentFunctionDeclarationAfterType ||
532 Line.StartsDefinition))) {
Daniel Jasper37911302013-04-02 14:33:13 +0000533 State.Column = State.Stack.back().Indent;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000534 } else if (Current.Type == TT_ObjCSelectorName) {
Alexander Kornienko00895102013-06-05 14:09:10 +0000535 if (State.Stack.back().ColonPos > Current.CodePointCount) {
536 State.Column = State.Stack.back().ColonPos - Current.CodePointCount;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000537 } else {
538 State.Column = State.Stack.back().Indent;
Alexander Kornienko00895102013-06-05 14:09:10 +0000539 State.Stack.back().ColonPos = State.Column + Current.CodePointCount;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000540 }
Daniel Jasperb2f063a2013-05-08 10:00:18 +0000541 } else if (Current.Type == TT_StartOfName ||
542 Previous.isOneOf(tok::coloncolon, tok::equal) ||
Daniel Jasper37911302013-04-02 14:33:13 +0000543 Previous.Type == TT_ObjCMethodExpr) {
Daniel Jasper3776ef32013-04-03 07:21:51 +0000544 State.Column = ContinuationIndent;
Daniel Jaspera324a0e2012-12-21 14:37:20 +0000545 } else {
Daniel Jasper29f123b2013-02-08 15:28:42 +0000546 State.Column = State.Stack.back().Indent;
Daniel Jasper3776ef32013-04-03 07:21:51 +0000547 // Ensure that we fall back to indenting 4 spaces instead of just
548 // flushing continuations left.
Daniel Jasper37911302013-04-02 14:33:13 +0000549 if (State.Column == FirstIndent)
550 State.Column += 4;
Daniel Jaspera324a0e2012-12-21 14:37:20 +0000551 }
552
Daniel Jasper7878a7b2013-02-15 11:07:25 +0000553 if (Current.is(tok::question))
Daniel Jasper237d4c12013-02-23 21:01:55 +0000554 State.Stack.back().BreakBeforeParameter = true;
Daniel Jasper11e13802013-05-08 14:12:04 +0000555 if ((Previous.isOneOf(tok::comma, tok::semi) &&
556 !State.Stack.back().AvoidBinPacking) ||
557 Previous.Type == TT_BinaryOperator)
Daniel Jasperce3d1a62013-02-08 08:22:00 +0000558 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasper33f4b902013-05-15 09:35:08 +0000559 if (Previous.Type == TT_TemplateCloser && State.ParenLevel == 0)
560 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasperf343cab2013-01-31 14:59:26 +0000561
Manuel Klimek060143e2013-01-02 18:33:23 +0000562 if (!DryRun) {
Daniel Jasper1ef81d52013-02-26 13:10:34 +0000563 unsigned NewLines = 1;
Alexander Kornienkoe3f11972013-06-12 19:04:12 +0000564 if (Current.is(tok::comment))
Manuel Klimekb3987012013-05-29 14:47:47 +0000565 NewLines = std::max(
566 NewLines,
567 std::min(Current.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1));
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000568 Whitespaces.replaceWhitespace(Current, NewLines, State.Column,
569 State.Column, Line.InPPDirective);
Manuel Klimek060143e2013-01-02 18:33:23 +0000570 }
Daniel Jasperbac016b2012-12-03 18:12:45 +0000571
Daniel Jasper29f123b2013-02-08 15:28:42 +0000572 State.Stack.back().LastSpace = State.Column;
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000573 if (Current.isOneOf(tok::arrow, tok::period) &&
574 Current.Type != TT_DesignatedInitializerPeriod)
Alexander Kornienko00895102013-06-05 14:09:10 +0000575 State.Stack.back().LastSpace += Current.CodePointCount;
Daniel Jaspercf5767d2013-02-18 11:05:07 +0000576 State.StartOfLineLevel = State.ParenLevel;
Daniel Jasperce912f42013-06-03 09:54:46 +0000577 State.LowestCallLevel = State.ParenLevel;
Daniel Jasper237d4c12013-02-23 21:01:55 +0000578
579 // Any break on this level means that the parent level has been broken
580 // and we need to avoid bin packing there.
581 for (unsigned i = 0, e = State.Stack.size() - 1; i != e; ++i) {
582 State.Stack[i].BreakBeforeParameter = true;
583 }
Manuel Klimekb3987012013-05-29 14:47:47 +0000584 const FormatToken *TokenBefore = Current.getPreviousNoneComment();
Daniel Jasper01218ff2013-04-15 22:36:37 +0000585 if (TokenBefore && !TokenBefore->isOneOf(tok::comma, tok::semi) &&
Daniel Jasper33f4b902013-05-15 09:35:08 +0000586 TokenBefore->Type != TT_TemplateCloser &&
Daniel Jasper11e13802013-05-08 14:12:04 +0000587 TokenBefore->Type != TT_BinaryOperator && !TokenBefore->opensScope())
Daniel Jasperfaab0d32013-02-27 09:47:53 +0000588 State.Stack.back().BreakBeforeParameter = true;
589
Daniel Jasper237d4c12013-02-23 21:01:55 +0000590 // If we break after {, we should also break before the corresponding }.
591 if (Previous.is(tok::l_brace))
592 State.Stack.back().BreakBeforeClosingBrace = true;
593
594 if (State.Stack.back().AvoidBinPacking) {
595 // If we are breaking after '(', '{', '<', this is not bin packing
596 // unless AllowAllParametersOfDeclarationOnNextLine is false.
Daniel Jasperd741f022013-05-14 20:39:56 +0000597 if (!(Previous.isOneOf(tok::l_paren, tok::l_brace) ||
598 Previous.Type == TT_BinaryOperator) ||
Daniel Jasper237d4c12013-02-23 21:01:55 +0000599 (!Style.AllowAllParametersOfDeclarationOnNextLine &&
600 Line.MustBeDeclaration))
601 State.Stack.back().BreakBeforeParameter = true;
602 }
Daniel Jasperbac016b2012-12-03 18:12:45 +0000603 } else {
Daniel Jasper9c3e71a2013-02-25 15:59:54 +0000604 if (Current.is(tok::equal) &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000605 (RootToken->is(tok::kw_for) || State.ParenLevel == 0) &&
Daniel Jasperadc0f092013-04-05 09:38:50 +0000606 State.Stack.back().VariablePos == 0) {
607 State.Stack.back().VariablePos = State.Column;
608 // Move over * and & if they are bound to the variable name.
Manuel Klimekb3987012013-05-29 14:47:47 +0000609 const FormatToken *Tok = &Previous;
Alexander Kornienko00895102013-06-05 14:09:10 +0000610 while (Tok && State.Stack.back().VariablePos >= Tok->CodePointCount) {
611 State.Stack.back().VariablePos -= Tok->CodePointCount;
Daniel Jasperadc0f092013-04-05 09:38:50 +0000612 if (Tok->SpacesRequiredBefore != 0)
613 break;
Manuel Klimekb3987012013-05-29 14:47:47 +0000614 Tok = Tok->Previous;
Daniel Jasperadc0f092013-04-05 09:38:50 +0000615 }
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000616 if (Previous.PartOfMultiVariableDeclStmt)
617 State.Stack.back().LastSpace = State.Stack.back().VariablePos;
618 }
Daniel Jaspera324a0e2012-12-21 14:37:20 +0000619
Daniel Jasper729a7432013-02-11 12:36:37 +0000620 unsigned Spaces = State.NextToken->SpacesRequiredBefore;
Daniel Jasper20409152012-12-04 14:54:30 +0000621
Daniel Jasperbac016b2012-12-03 18:12:45 +0000622 if (!DryRun)
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000623 Whitespaces.replaceWhitespace(Current, 0, Spaces,
624 State.Column + Spaces);
Daniel Jasper20409152012-12-04 14:54:30 +0000625
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000626 if (Current.Type == TT_ObjCSelectorName &&
627 State.Stack.back().ColonPos == 0) {
628 if (State.Stack.back().Indent + Current.LongestObjCSelectorName >
Alexander Kornienko00895102013-06-05 14:09:10 +0000629 State.Column + Spaces + Current.CodePointCount)
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000630 State.Stack.back().ColonPos =
631 State.Stack.back().Indent + Current.LongestObjCSelectorName;
632 else
633 State.Stack.back().ColonPos =
Alexander Kornienko00895102013-06-05 14:09:10 +0000634 State.Column + Spaces + Current.CodePointCount;
Daniel Jasper63d7ced2013-02-05 10:07:47 +0000635 }
636
Daniel Jasperac3223e2013-04-10 09:49:49 +0000637 if (Previous.opensScope() && Previous.Type != TT_ObjCMethodExpr &&
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000638 Current.Type != TT_LineComment)
Daniel Jasper29f123b2013-02-08 15:28:42 +0000639 State.Stack.back().Indent = State.Column + Spaces;
Daniel Jasper001bf4e2013-04-22 07:59:53 +0000640 if (Previous.is(tok::comma) && !Current.isTrailingComment() &&
641 State.Stack.back().AvoidBinPacking)
642 State.Stack.back().NoLineBreak = true;
Daniel Jasper0df6acd2013-01-16 14:59:02 +0000643
Daniel Jasper3b5943f2012-12-06 09:56:08 +0000644 State.Column += Spaces;
Daniel Jasper8ed9f2b2013-04-03 13:36:17 +0000645 if (Current.is(tok::l_paren) && Previous.isOneOf(tok::kw_if, tok::kw_for))
Daniel Jaspere438bac2013-01-23 20:41:06 +0000646 // Treat the condition inside an if as if it was a second function
647 // parameter, i.e. let nested calls have an indent of 4.
648 State.Stack.back().LastSpace = State.Column + 1; // 1 is length of "(".
Daniel Jasperf9955d32013-03-20 12:37:50 +0000649 else if (Previous.is(tok::comma))
Daniel Jaspere438bac2013-01-23 20:41:06 +0000650 State.Stack.back().LastSpace = State.Column;
Daniel Jasperbfe6fd42013-01-28 12:45:14 +0000651 else if ((Previous.Type == TT_BinaryOperator ||
Daniel Jasper02b771e2013-01-28 13:31:35 +0000652 Previous.Type == TT_ConditionalExpr ||
653 Previous.Type == TT_CtorInitializerColon) &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000654 !(Previous.getPrecedence() == prec::Assignment &&
Daniel Jasper512843a2013-05-27 12:45:09 +0000655 Current.FakeLParens.empty()))
656 // Always indent relative to the RHS of the expression unless this is a
657 // simple assignment without binary expression on the RHS.
Daniel Jasperae8699b2013-01-28 09:35:24 +0000658 State.Stack.back().LastSpace = State.Column;
Daniel Jasper6cabab42013-02-14 08:42:54 +0000659 else if (Previous.Type == TT_InheritanceColon)
660 State.Stack.back().Indent = State.Column;
Daniel Jasper11e13802013-05-08 14:12:04 +0000661 else if (Previous.opensScope() && !Current.FakeLParens.empty())
662 // If this function has multiple parameters or a binary expression
663 // parameter, indent nested calls from the start of the first parameter.
Daniel Jasper986e17f2013-01-28 07:35:34 +0000664 State.Stack.back().LastSpace = State.Column;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000665 }
Daniel Jasper0df6acd2013-01-16 14:59:02 +0000666
Manuel Klimek8092a942013-02-20 10:15:13 +0000667 return moveStateToNextToken(State, DryRun);
Daniel Jasper20409152012-12-04 14:54:30 +0000668 }
Daniel Jasperbac016b2012-12-03 18:12:45 +0000669
Daniel Jasper20409152012-12-04 14:54:30 +0000670 /// \brief Mark the next token as consumed in \p State and modify its stacks
671 /// accordingly.
///
/// Updates the innermost \c ParenState for the consumed token, pushes one
/// level per fake left parenthesis and one per opened scope, pops levels for
/// closed scopes and fake right parentheses, and finally advances
/// \c State.Column and \c State.NextToken past the token.
///
/// \param State The line state to advance. \c State.NextToken is dereferenced
/// unconditionally, so it must not be null.
/// \param DryRun Forwarded unchanged to \c breakProtrudingToken.
///
/// \returns The value returned by \c breakProtrudingToken for the consumed
/// token.
Manuel Klimek8092a942013-02-20 10:15:13 +0000672 unsigned moveStateToNextToken(LineState &State, bool DryRun) {
Manuel Klimekb3987012013-05-29 14:47:47 +0000673 const FormatToken &Current = *State.NextToken;
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000674 assert(State.Stack.size());
Daniel Jasper3b5943f2012-12-06 09:56:08 +0000675
Daniel Jasper6cabab42013-02-14 08:42:54 +0000676 if (Current.Type == TT_InheritanceColon)
677 State.Stack.back().AvoidBinPacking = true;
// Only the first "<<" on this level is recorded; 0 means "not seen yet".
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000678 if (Current.is(tok::lessless) && State.Stack.back().FirstLessLess == 0)
679 State.Stack.back().FirstLessLess = State.Column;
// Remember where the "?" of a conditional sits on this level.
Daniel Jasperbfe6fd42013-01-28 12:45:14 +0000680 if (Current.is(tok::question))
681 State.Stack.back().QuestionColumn = State.Column;
// Track the lowest paren level at which a "." or "->" has been seen.
Daniel Jasperce912f42013-06-03 09:54:46 +0000682 if (Current.isOneOf(tok::period, tok::arrow)) {
683 State.LowestCallLevel = std::min(State.LowestCallLevel, State.ParenLevel);
684 if (Line.Type == LT_BuilderTypeCall && State.ParenLevel == 0)
685 State.Stack.back().StartOfFunctionCall =
Alexander Kornienko00895102013-06-05 14:09:10 +0000686 Current.LastInChainOfCalls ? 0
687 : State.Column + Current.CodePointCount;
Daniel Jasperce912f42013-06-03 09:54:46 +0000688 }
Daniel Jasper7d812812013-02-21 15:00:29 +0000689 if (Current.Type == TT_CtorInitializerColon) {
Manuel Klimek07a64ec2013-05-13 08:42:42 +0000690 // Indent 2 from the column, so:
691 // SomeClass::SomeClass()
692 // : First(...), ...
693 // Next(...)
694 // ^ line up here.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000695 State.Stack.back().Indent = State.Column + 2;
Daniel Jasper7d812812013-02-21 15:00:29 +0000696 if (Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
697 State.Stack.back().AvoidBinPacking = true;
698 State.Stack.back().BreakBeforeParameter = false;
Daniel Jasperf343cab2013-01-31 14:59:26 +0000699 }
Daniel Jasper3776ef32013-04-03 07:21:51 +0000700
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000701 // If return returns a binary expression, align after it.
// NOTE(review): 7 is presumably the length of "return " -- confirm.
702 if (Current.is(tok::kw_return) && !Current.FakeLParens.empty())
703 State.Stack.back().LastSpace = State.Column + 7;
704
Daniel Jasper3776ef32013-04-03 07:21:51 +0000705 // In ObjC method declaration we align on the ":" of parameters, but we need
706 // to ensure that we indent parameters on subsequent lines by at least 4.
Daniel Jasper37911302013-04-02 14:33:13 +0000707 if (Current.Type == TT_ObjCMethodSpecifier)
708 State.Stack.back().Indent += 4;
Daniel Jasper3b5943f2012-12-06 09:56:08 +0000709
Daniel Jasper29f123b2013-02-08 15:28:42 +0000710 // Insert scopes created by fake parenthesis.
Manuel Klimekb3987012013-05-29 14:47:47 +0000711 const FormatToken *Previous = Current.getPreviousNoneComment();
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000712 // Don't add extra indentation for the first fake parenthesis after
713 // 'return', assignments or opening <({[. The indentation for these cases
714 // is special cased.
715 bool SkipFirstExtraIndent =
716 Current.is(tok::kw_return) ||
Daniel Jasperac3223e2013-04-10 09:49:49 +0000717 (Previous && (Previous->opensScope() ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000718 Previous->getPrecedence() == prec::Assignment));
// FakeLParens is walked back to front; one stack level is pushed per entry.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000719 for (SmallVector<prec::Level, 4>::const_reverse_iterator
720 I = Current.FakeLParens.rbegin(),
721 E = Current.FakeLParens.rend();
722 I != E; ++I) {
// Each new level starts out as a copy of the current innermost level.
Daniel Jasper29f123b2013-02-08 15:28:42 +0000723 ParenState NewParenState = State.Stack.back();
Daniel Jasperc3df5ff2013-05-13 09:19:24 +0000724 NewParenState.ForFakeParenthesis = true;
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000725 NewParenState.Indent =
726 std::max(std::max(State.Column, NewParenState.Indent),
727 State.Stack.back().LastSpace);
728
729 // Always indent conditional expressions. Never indent expression where
730 // the 'operator' is ',', ';' or an assignment (i.e. *I <=
731 // prec::Assignment) as those have different indentation rules. Indent
732 // other expression, unless the indentation needs to be skipped.
733 if (*I == prec::Conditional ||
734 (!SkipFirstExtraIndent && *I > prec::Assignment))
735 NewParenState.Indent += 4;
Daniel Jasperac3223e2013-04-10 09:49:49 +0000736 if (Previous && !Previous->opensScope())
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000737 NewParenState.BreakBeforeParameter = false;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000738 State.Stack.push_back(NewParenState);
// The skip applies to the first pushed level only.
Daniel Jasperbf71ba22013-04-08 20:33:42 +0000739 SkipFirstExtraIndent = false;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000740 }
741
Daniel Jaspercf225b62012-12-24 13:43:52 +0000742 // If we encounter an opening (, [, { or <, we add a level to our stacks to
Daniel Jasper20409152012-12-04 14:54:30 +0000743 // prepare for the following tokens.
Daniel Jasperac3223e2013-04-10 09:49:49 +0000744 if (Current.opensScope()) {
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000745 unsigned NewIndent;
Daniel Jasperc3df5ff2013-05-13 09:19:24 +0000746 unsigned LastSpace = State.Stack.back().LastSpace;
Daniel Jasperf343cab2013-01-31 14:59:26 +0000747 bool AvoidBinPacking;
Manuel Klimek2851c162013-01-10 14:36:46 +0000748 if (Current.is(tok::l_brace)) {
// Braces indent by the configured width; bin packing is avoided only when
// the next non-comment token is a designated initializer period.
Daniel Jasperc3df5ff2013-05-13 09:19:24 +0000749 NewIndent = Style.IndentWidth + LastSpace;
Manuel Klimekb3987012013-05-29 14:47:47 +0000750 const FormatToken *NextNoComment = Current.getNextNoneComment();
Daniel Jasper5ad390d2013-05-28 11:30:49 +0000751 AvoidBinPacking = NextNoComment &&
752 NextNoComment->Type == TT_DesignatedInitializerPeriod;
Manuel Klimek2851c162013-01-10 14:36:46 +0000753 } else {
// Every other opener indents 4 past the larger of LastSpace and the
// recorded start of the function call.
Daniel Jasperc3df5ff2013-05-13 09:19:24 +0000754 NewIndent =
755 4 + std::max(LastSpace, State.Stack.back().StartOfFunctionCall);
Daniel Jasper001bf4e2013-04-22 07:59:53 +0000756 AvoidBinPacking = !Style.BinPackParameters;
Manuel Klimek2851c162013-01-10 14:36:46 +0000757 }
Daniel Jasperfca24bc2013-04-25 13:31:51 +0000758
// The new level receives the enclosing level's NoLineBreak value.
Daniel Jasperc3df5ff2013-05-13 09:19:24 +0000759 State.Stack.push_back(ParenState(NewIndent, LastSpace, AvoidBinPacking,
760 State.Stack.back().NoLineBreak));
Daniel Jasper29f123b2013-02-08 15:28:42 +0000761 ++State.ParenLevel;
Daniel Jasper20409152012-12-04 14:54:30 +0000762 }
763
Daniel Jasperce3d1a62013-02-08 08:22:00 +0000764 // If this '[' opens an ObjC call, determine whether all parameters fit into
765 // one line and put one per line if they don't.
766 if (Current.is(tok::l_square) && Current.Type == TT_ObjCMethodExpr &&
767 Current.MatchingParen != NULL) {
768 if (getLengthToMatchingParen(Current) + State.Column > getColumnLimit())
769 State.Stack.back().BreakBeforeParameter = true;
770 }
771
Daniel Jaspercf225b62012-12-24 13:43:52 +0000772 // If we encounter a closing ), ], } or >, we can remove a level from our
Daniel Jasper20409152012-12-04 14:54:30 +0000773 // stacks.
// A '}' that is the line's root token does not pop a level.
Alexander Kornienkoe74de282013-03-13 14:41:29 +0000774 if (Current.isOneOf(tok::r_paren, tok::r_square) ||
Manuel Klimekb3987012013-05-29 14:47:47 +0000775 (Current.is(tok::r_brace) && State.NextToken != RootToken) ||
Daniel Jasper26f7e782013-01-08 14:56:18 +0000776 State.NextToken->Type == TT_TemplateCloser) {
Daniel Jasper604eb4c2013-01-11 10:22:12 +0000777 State.Stack.pop_back();
Daniel Jasper29f123b2013-02-08 15:28:42 +0000778 --State.ParenLevel;
779 }
780
781 // Remove scopes created by fake parenthesis.
// The popped level's VariablePos is carried over to the level below it.
782 for (unsigned i = 0, e = Current.FakeRParens; i != e; ++i) {
Daniel Jasperabfc9c12013-04-04 19:31:00 +0000783 unsigned VariablePos = State.Stack.back().VariablePos;
Daniel Jasper29f123b2013-02-08 15:28:42 +0000784 State.Stack.pop_back();
Daniel Jasperabfc9c12013-04-04 19:31:00 +0000785 State.Stack.back().VariablePos = VariablePos;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000786 }
Manuel Klimek2851c162013-01-10 14:36:46 +0000787
// Record the column of the first string literal of a run. The record is
// cleared by any token other than a comment, identifier, hash or string
// literal.
Daniel Jasper27c7f542013-05-13 20:50:15 +0000788 if (Current.is(tok::string_literal) && State.StartOfStringLiteral == 0) {
Manuel Klimekb56b6d12013-02-20 15:25:48 +0000789 State.StartOfStringLiteral = State.Column;
Daniel Jasper27c7f542013-05-13 20:50:15 +0000790 } else if (!Current.isOneOf(tok::comment, tok::identifier, tok::hash,
791 tok::string_literal)) {
Daniel Jasper9a2f8d02013-05-16 04:26:02 +0000792 State.StartOfStringLiteral = 0;
Manuel Klimekb56b6d12013-02-20 15:25:48 +0000793 }
794
// Step over the token: advance the column by its width and move on to the
// following token.
Alexander Kornienko00895102013-06-05 14:09:10 +0000795 State.Column += Current.CodePointCount;
Manuel Klimek8092a942013-02-20 10:15:13 +0000796
Manuel Klimekb3987012013-05-29 14:47:47 +0000797 State.NextToken = State.NextToken->Next;
Manuel Klimek2851c162013-01-10 14:36:46 +0000798
Manuel Klimek8092a942013-02-20 10:15:13 +0000799 return breakProtrudingToken(Current, State, DryRun);
800 }
801
802 /// \brief If the current token sticks out over the end of the line, break
803 /// it if possible.
Manuel Klimek2a9805d2013-05-14 09:04:24 +0000804 ///
805 /// \returns An extra penalty if a token was broken, otherwise 0.
806 ///
807 /// Note that the penalty of the token protruding the allowed line length is
808 /// already handled in \c addNextStateToQueue; the returned penalty will only
809 /// cover the cost of the additional line breaks.
///
/// \param Current The token that was just consumed; \c State.Column is
/// expected to already include its width.
/// \param State Receives the column after the (possibly re-broken) token
/// and, if a break was inserted, updated break flags and \c LastSpace.
/// \param DryRun If \c true, no changes are recorded in \c Whitespaces.
Manuel Klimekb3987012013-05-29 14:47:47 +0000810 unsigned breakProtrudingToken(const FormatToken &Current, LineState &State,
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000811 bool DryRun) {
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000812 llvm::OwningPtr<BreakableToken> Token;
// Column at which the token starts, given the current state.
Alexander Kornienko00895102013-06-05 14:09:10 +0000813 unsigned StartColumn = State.Column - Current.CodePointCount;
// Spelling column of the token's first non-whitespace character, minus one.
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +0000814 unsigned OriginalStartColumn =
Manuel Klimekb3987012013-05-29 14:47:47 +0000815 SourceMgr.getSpellingColumnNumber(Current.getStartOfNonWhitespace()) -
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +0000816 1;
Manuel Klimekde008c02013-05-27 15:23:34 +0000817
// Pick the breakable wrapper for the token kind. Tokens that are neither
// string literals nor comments are never broken.
Daniel Jasper5d5b4242013-05-16 12:59:13 +0000818 if (Current.is(tok::string_literal) &&
819 Current.Type != TT_ImplicitStringLiteral) {
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000820 // Only break up default narrow strings.
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000821 if (!Current.TokenText.startswith("\""))
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000822 return 0;
823
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000824 Token.reset(new BreakableStringLiteral(Current, StartColumn,
825 Line.InPPDirective, Encoding));
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000826 } else if (Current.Type == TT_BlockComment) {
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000827 Token.reset(new BreakableBlockComment(
Alexander Kornienko00895102013-06-05 14:09:10 +0000828 Style, Current, StartColumn, OriginalStartColumn, !Current.Previous,
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000829 Line.InPPDirective, Encoding));
Daniel Jasper7ff96ed2013-05-06 10:24:51 +0000830 } else if (Current.Type == TT_LineComment &&
Manuel Klimekb3987012013-05-29 14:47:47 +0000831 (Current.Previous == NULL ||
832 Current.Previous->Type != TT_ImplicitStringLiteral)) {
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000833 Token.reset(new BreakableLineComment(Current, StartColumn,
834 Line.InPPDirective, Encoding));
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000835 } else {
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000836 return 0;
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000837 }
// Give up if the unbreakable tail alone already reaches the column limit;
// this also keeps the subtraction below from wrapping around.
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000838 if (Current.UnbreakableTailLength >= getColumnLimit())
Manuel Klimek2a9805d2013-05-14 09:04:24 +0000839 return 0;
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000840
// Columns left for the token once the unbreakable tail is accounted for.
Alexander Kornienkoc36c5c22013-06-19 19:50:11 +0000841 unsigned RemainingSpace = getColumnLimit() - Current.UnbreakableTailLength;
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000842 bool BreakInserted = false;
843 unsigned Penalty = 0;
Alexander Kornienkoc36c5c22013-06-19 19:50:11 +0000844 unsigned RemainingTokenColumns = 0;
Manuel Klimekde008c02013-05-27 15:23:34 +0000845 for (unsigned LineIndex = 0, EndIndex = Token->getLineCount();
846 LineIndex != EndIndex; ++LineIndex) {
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000847 if (!DryRun)
848 Token->replaceWhitespaceBefore(LineIndex, Whitespaces);
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000849 unsigned TailOffset = 0;
Alexander Kornienkoc36c5c22013-06-19 19:50:11 +0000850 RemainingTokenColumns = Token->getLineLengthAfterSplit(
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000851 LineIndex, TailOffset, StringRef::npos);
// Keep splitting this line while what is left of it is too wide.
Alexander Kornienko00895102013-06-05 14:09:10 +0000852 while (RemainingTokenColumns > RemainingSpace) {
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000853 BreakableToken::Split Split =
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000854 Token->getSplit(LineIndex, TailOffset, getColumnLimit());
// No split point was found; leave the rest of this line as it is.
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000855 if (Split.first == StringRef::npos)
856 break;
857 assert(Split.first != 0);
Alexander Kornienko00895102013-06-05 14:09:10 +0000858 unsigned NewRemainingTokenColumns = Token->getLineLengthAfterSplit(
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000859 LineIndex, TailOffset + Split.first + Split.second,
860 StringRef::npos);
// Every split must shrink the remainder, which guarantees termination.
Alexander Kornienko00895102013-06-05 14:09:10 +0000861 assert(NewRemainingTokenColumns < RemainingTokenColumns);
Alexander Kornienko16a0ec62013-06-14 11:46:10 +0000862 if (!DryRun)
863 Token->insertBreak(LineIndex, TailOffset, Split, Whitespaces);
// Each inserted break costs a fixed, token-kind dependent penalty.
Alexander Kornienko2785b9a2013-06-07 16:02:52 +0000864 Penalty += Current.is(tok::string_literal) ? Style.PenaltyBreakString
865 : Style.PenaltyBreakComment;
// The part before the split may still exceed the limit; charge for every
// excess column.
866 unsigned ColumnsUsed =
867 Token->getLineLengthAfterSplit(LineIndex, TailOffset, Split.first);
868 if (ColumnsUsed > getColumnLimit()) {
869 Penalty +=
870 Style.PenaltyExcessCharacter * (ColumnsUsed - getColumnLimit());
871 }
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000872 TailOffset += Split.first + Split.second;
Alexander Kornienko00895102013-06-05 14:09:10 +0000873 RemainingTokenColumns = NewRemainingTokenColumns;
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000874 BreakInserted = true;
Manuel Klimek8092a942013-02-20 10:15:13 +0000875 }
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000876 }
877
// The column now reflects the remainder of the last line processed above
// (0 if the token reported no lines).
Alexander Kornienkoc36c5c22013-06-19 19:50:11 +0000878 State.Column = RemainingTokenColumns;
879
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000880 if (BreakInserted) {
Alexander Kornienko22d0e292013-06-17 12:59:44 +0000881 // If we break the token inside a parameter list, we need to break before
882 // the next parameter on all levels, so that the next parameter is clearly
883 // visible. Line comments already introduce a break.
884 if (Current.Type != TT_LineComment) {
885 for (unsigned i = 0, e = State.Stack.size(); i != e; ++i)
886 State.Stack[i].BreakBeforeParameter = true;
887 }
888
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000889 State.Stack.back().LastSpace = StartColumn;
Manuel Klimek8092a942013-02-20 10:15:13 +0000890 }
Manuel Klimek8092a942013-02-20 10:15:13 +0000891 return Penalty;
892 }
893
Daniel Jasperceb99ab2013-01-09 10:16:05 +0000894 unsigned getColumnLimit() {
Alexander Kornienko70ce7882013-04-15 14:28:00 +0000895 // In preprocessor directives reserve two chars for trailing " \"
896 return Style.ColumnLimit - (Line.InPPDirective ? 2 : 0);
Daniel Jasperceb99ab2013-01-09 10:16:05 +0000897 }
898
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000899 /// \brief An edge in the solution space from \c Previous->State to \c State,
900 /// inserting a newline dependent on the \c NewLine.
901 struct StateNode {
902 StateNode(const LineState &State, bool NewLine, StateNode *Previous)
Daniel Jasperf11a7052013-02-21 21:33:55 +0000903 : State(State), NewLine(NewLine), Previous(Previous) {}
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000904 LineState State;
905 bool NewLine;
906 StateNode *Previous;
907 };
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000908
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000909 /// \brief A pair of <penalty, count> that is used to prioritize the BFS on.
910 ///
911 /// In case of equal penalties, we want to prefer states that were inserted
912 /// first. During state generation we make sure that we insert states first
913 /// that break the line as late as possible.
///
/// The second element is the value of the running \c Count at the moment the
/// state was pushed, so a smaller value means an earlier insertion.
914 typedef std::pair<unsigned, unsigned> OrderedPenalty;
915
916 /// \brief An item in the prioritized BFS search queue. The \c StateNode's
917 /// \c State has the given \c OrderedPenalty.
918 typedef std::pair<OrderedPenalty, StateNode *> QueueItem;
919
920 /// \brief The BFS queue type.
///
/// \c std::greater turns the priority queue into a min-heap: \c top() is the
/// item with the smallest penalty and, among equal penalties, the smallest
/// insertion count.
921 typedef std::priority_queue<QueueItem, std::vector<QueueItem>,
922 std::greater<QueueItem> > QueueType;
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000923
924 /// \brief Analyze the entire solution space starting from \p InitialState.
Daniel Jasperbac016b2012-12-03 18:12:45 +0000925 ///
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000926 /// This implements a variant of Dijkstra's algorithm on the graph that spans
927 /// the solution space (\c LineStates are the nodes). The algorithm tries to
928 /// find the shortest path (the one with lowest penalty) from \p InitialState
929 /// to a state where all tokens are placed.
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000930 void analyzeSolutionSpace(LineState &InitialState) {
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000931 std::set<LineState> Seen;
932
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000933 // Insert start element into queue.
Daniel Jasperfc759082013-02-14 14:26:07 +0000934 StateNode *Node =
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000935 new (Allocator.Allocate()) StateNode(InitialState, false, NULL);
936 Queue.push(QueueItem(OrderedPenalty(0, Count), Node));
937 ++Count;
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000938
939 // While not empty, take first element and follow edges.
940 while (!Queue.empty()) {
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000941 unsigned Penalty = Queue.top().first.first;
Daniel Jasperfc759082013-02-14 14:26:07 +0000942 StateNode *Node = Queue.top().second;
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000943 if (Node->State.NextToken == NULL) {
Alexander Kornienkodd256312013-05-10 11:56:10 +0000944 DEBUG(llvm::dbgs() << "\n---\nPenalty for line: " << Penalty << "\n");
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000945 break;
Daniel Jasper01786732013-02-04 07:21:18 +0000946 }
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000947 Queue.pop();
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000948
Daniel Jasper54b4e442013-05-22 05:27:42 +0000949 // Cut off the analysis of certain solutions if the analysis gets too
950 // complex. See description of IgnoreStackForComparison.
951 if (Count > 10000)
952 Node->State.IgnoreStackForComparison = true;
953
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000954 if (!Seen.insert(Node->State).second)
955 // State already examined with lower penalty.
956 continue;
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000957
Nico Weber27268772013-06-26 00:30:14 +0000958 addNextStateToQueue(Penalty, Node, /*NewLine=*/false);
959 addNextStateToQueue(Penalty, Node, /*NewLine=*/true);
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000960 }
961
962 if (Queue.empty())
963 // We were unable to find a solution, do nothing.
964 // FIXME: Add diagnostic?
Manuel Klimeke573c3f2013-05-22 12:51:29 +0000965 return;
Daniel Jasperbac016b2012-12-03 18:12:45 +0000966
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000967 // Reconstruct the solution.
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000968 reconstructPath(InitialState, Queue.top().second);
Alexander Kornienkodd256312013-05-10 11:56:10 +0000969 DEBUG(llvm::dbgs() << "Total number of analyzed states: " << Count << "\n");
970 DEBUG(llvm::dbgs() << "---\n");
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000971 }
972
973 void reconstructPath(LineState &State, StateNode *Current) {
Manuel Klimek9c333b92013-05-29 15:10:11 +0000974 std::deque<StateNode *> Path;
975 // We do not need a break before the initial token.
976 while (Current->Previous) {
977 Path.push_front(Current);
978 Current = Current->Previous;
979 }
980 for (std::deque<StateNode *>::iterator I = Path.begin(), E = Path.end();
981 I != E; ++I) {
982 DEBUG({
983 if ((*I)->NewLine) {
984 llvm::dbgs() << "Penalty for splitting before "
985 << (*I)->Previous->State.NextToken->Tok.getName() << ": "
986 << (*I)->Previous->State.NextToken->SplitPenalty << "\n";
987 }
988 });
989 addTokenToState((*I)->NewLine, false, State);
990 }
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000991 }
992
Manuel Klimek62a48fb2013-02-13 10:54:19 +0000993 /// \brief Add the following state to the analysis queue \c Queue.
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000994 ///
Manuel Klimek62a48fb2013-02-13 10:54:19 +0000995 /// Assume the current state is \p PreviousNode and has been reached with a
Daniel Jasper68ef0df2013-02-01 11:00:45 +0000996 /// penalty of \p Penalty. Insert a line break if \p NewLine is \c true.
Manuel Klimek62a48fb2013-02-13 10:54:19 +0000997 void addNextStateToQueue(unsigned Penalty, StateNode *PreviousNode,
998 bool NewLine) {
Manuel Klimek32a2fd72013-02-13 10:46:36 +0000999 if (NewLine && !canBreak(PreviousNode->State))
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001000 return;
Manuel Klimek32a2fd72013-02-13 10:46:36 +00001001 if (!NewLine && mustBreak(PreviousNode->State))
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001002 return;
Daniel Jasperae8699b2013-01-28 09:35:24 +00001003 if (NewLine)
Manuel Klimek32a2fd72013-02-13 10:46:36 +00001004 Penalty += PreviousNode->State.NextToken->SplitPenalty;
1005
1006 StateNode *Node = new (Allocator.Allocate())
1007 StateNode(PreviousNode->State, NewLine, PreviousNode);
Manuel Klimek8092a942013-02-20 10:15:13 +00001008 Penalty += addTokenToState(NewLine, true, Node->State);
Manuel Klimek32a2fd72013-02-13 10:46:36 +00001009 if (Node->State.Column > getColumnLimit()) {
1010 unsigned ExcessCharacters = Node->State.Column - getColumnLimit();
Daniel Jasper01786732013-02-04 07:21:18 +00001011 Penalty += Style.PenaltyExcessCharacter * ExcessCharacters;
Daniel Jasperceb99ab2013-01-09 10:16:05 +00001012 }
Manuel Klimek32a2fd72013-02-13 10:46:36 +00001013
1014 Queue.push(QueueItem(OrderedPenalty(Penalty, Count), Node));
1015 ++Count;
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001016 }
Daniel Jasperbac016b2012-12-03 18:12:45 +00001017
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001018 /// \brief Returns \c true, if a line break after \p State is allowed.
1019 bool canBreak(const LineState &State) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001020 const FormatToken &Current = *State.NextToken;
1021 const FormatToken &Previous = *Current.Previous;
1022 assert(&Previous == Current.Previous);
Daniel Jasper399914b2013-05-17 09:35:01 +00001023 if (!Current.CanBreakBefore &&
1024 !(Current.is(tok::r_brace) &&
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001025 State.Stack.back().BreakBeforeClosingBrace))
1026 return false;
Daniel Jasper399914b2013-05-17 09:35:01 +00001027 // The opening "{" of a braced list has to be on the same line as the first
1028 // element if it is nested in another braced init list or function call.
1029 if (!Current.MustBreakBefore && Previous.is(tok::l_brace) &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001030 Previous.Previous &&
1031 Previous.Previous->isOneOf(tok::l_brace, tok::l_paren, tok::comma))
Daniel Jasper399914b2013-05-17 09:35:01 +00001032 return false;
Daniel Jasper259a0382013-05-27 11:50:16 +00001033 // This prevents breaks like:
1034 // ...
1035 // SomeParameter, OtherParameter).DoSomething(
1036 // ...
1037 // As they hide "DoSomething" and are generally bad for readability.
Daniel Jasperce912f42013-06-03 09:54:46 +00001038 if (Previous.opensScope() && State.LowestCallLevel < State.StartOfLineLevel)
Daniel Jasper259a0382013-05-27 11:50:16 +00001039 return false;
Daniel Jasper001bf4e2013-04-22 07:59:53 +00001040 return !State.Stack.back().NoLineBreak;
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001041 }
Daniel Jasperbac016b2012-12-03 18:12:45 +00001042
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001043 /// \brief Returns \c true, if a line break after \p State is mandatory.
1044 bool mustBreak(const LineState &State) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001045 const FormatToken &Current = *State.NextToken;
1046 const FormatToken &Previous = *Current.Previous;
Daniel Jasper11e13802013-05-08 14:12:04 +00001047 if (Current.MustBreakBefore || Current.Type == TT_InlineASMColon)
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001048 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001049 if (Current.is(tok::r_brace) && State.Stack.back().BreakBeforeClosingBrace)
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001050 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001051 if (Previous.is(tok::semi) && State.LineContainsContinuedForLoopSection)
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001052 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001053 if ((Previous.isOneOf(tok::comma, tok::semi) || Current.is(tok::question) ||
1054 Current.Type == TT_ConditionalExpr) &&
Daniel Jasperce3d1a62013-02-08 08:22:00 +00001055 State.Stack.back().BreakBeforeParameter &&
Daniel Jasper11e13802013-05-08 14:12:04 +00001056 !Current.isTrailingComment() &&
1057 !Current.isOneOf(tok::r_paren, tok::r_brace))
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001058 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001059
1060 // If we need to break somewhere inside the LHS of a binary expression, we
1061 // should also break after the operator.
1062 if (Previous.Type == TT_BinaryOperator &&
Daniel Jasper69c43712013-05-28 07:42:44 +00001063 Current.Type != TT_BinaryOperator && // Special case for ">>".
Daniel Jasper5ef8aac2013-06-03 08:42:05 +00001064 !Current.isTrailingComment() &&
Daniel Jasper11e13802013-05-08 14:12:04 +00001065 !Previous.isOneOf(tok::lessless, tok::question) &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001066 Previous.getPrecedence() != prec::Assignment &&
Daniel Jasperce3d1a62013-02-08 08:22:00 +00001067 State.Stack.back().BreakBeforeParameter)
Daniel Jasper63d7ced2013-02-05 10:07:47 +00001068 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001069
1070 // FIXME: Comparing LongestObjCSelectorName to 0 is a hacky way of finding
1071 // out whether it is the first parameter. Clean this up.
1072 if (Current.Type == TT_ObjCSelectorName &&
1073 Current.LongestObjCSelectorName == 0 &&
1074 State.Stack.back().BreakBeforeParameter)
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001075 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001076 if ((Current.Type == TT_CtorInitializerColon ||
1077 (Previous.ClosesTemplateDeclaration && State.ParenLevel == 0)))
Daniel Jasper923ebef2013-03-14 13:45:21 +00001078 return true;
Daniel Jasper11e13802013-05-08 14:12:04 +00001079
Daniel Jasper33f4b902013-05-15 09:35:08 +00001080 if (Current.Type == TT_StartOfName && Line.MightBeFunctionDecl &&
1081 State.Stack.back().BreakBeforeParameter && State.ParenLevel == 0)
1082 return true;
Daniel Jasper68ef0df2013-02-01 11:00:45 +00001083 return false;
Daniel Jasperbac016b2012-12-03 18:12:45 +00001084 }
1085
Daniel Jasper3af59ce2013-03-15 14:57:30 +00001086 // Returns the total number of columns required for the remaining tokens.
1087 unsigned getRemainingLength(const LineState &State) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001088 if (State.NextToken && State.NextToken->Previous)
1089 return Line.Last->TotalLength - State.NextToken->Previous->TotalLength;
Daniel Jasper3af59ce2013-03-15 14:57:30 +00001090 return 0;
1091 }
1092
Daniel Jasperbac016b2012-12-03 18:12:45 +00001093 FormatStyle Style;
1094 SourceManager &SourceMgr;
Daniel Jasper995e8202013-01-14 13:08:07 +00001095 const AnnotatedLine &Line;
Manuel Klimek3f8c7f32013-01-10 18:45:26 +00001096 const unsigned FirstIndent;
Manuel Klimekb3987012013-05-29 14:47:47 +00001097 const FormatToken *RootToken;
Daniel Jasperdcc2a622013-01-18 08:44:07 +00001098 WhitespaceManager &Whitespaces;
Manuel Klimek62a48fb2013-02-13 10:54:19 +00001099
1100 llvm::SpecificBumpPtrAllocator<StateNode> Allocator;
1101 QueueType Queue;
1102 // Increasing count of \c StateNode items we have created. This is used
1103 // to create a deterministic order independent of the container.
1104 unsigned Count;
Alexander Kornienko00895102013-06-05 14:09:10 +00001105 encoding::Encoding Encoding;
Daniel Jasperbac016b2012-12-03 18:12:45 +00001106};
1107
Manuel Klimek96e888b2013-05-28 11:55:06 +00001108class FormatTokenLexer {
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001109public:
Alexander Kornienko00895102013-06-05 14:09:10 +00001110 FormatTokenLexer(Lexer &Lex, SourceManager &SourceMgr,
1111 encoding::Encoding Encoding)
Manuel Klimek96e888b2013-05-28 11:55:06 +00001112 : FormatTok(NULL), GreaterStashed(false), TrailingWhitespace(0), Lex(Lex),
Alexander Kornienko00895102013-06-05 14:09:10 +00001113 SourceMgr(SourceMgr), IdentTable(Lex.getLangOpts()),
1114 Encoding(Encoding) {
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001115 Lex.SetKeepWhitespaceMode(true);
1116 }
1117
Manuel Klimek96e888b2013-05-28 11:55:06 +00001118 ArrayRef<FormatToken *> lex() {
1119 assert(Tokens.empty());
1120 do {
1121 Tokens.push_back(getNextToken());
1122 } while (Tokens.back()->Tok.isNot(tok::eof));
1123 return Tokens;
1124 }
1125
1126 IdentifierTable &getIdentTable() { return IdentTable; }
1127
1128private:
1129 FormatToken *getNextToken() {
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001130 if (GreaterStashed) {
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001131 // Create a synthesized second '>' token.
1132 Token Greater = FormatTok->Tok;
1133 FormatTok = new (Allocator.Allocate()) FormatToken;
1134 FormatTok->Tok = Greater;
Manuel Klimekad3094b2013-05-23 10:56:37 +00001135 SourceLocation GreaterLocation =
Manuel Klimek96e888b2013-05-28 11:55:06 +00001136 FormatTok->Tok.getLocation().getLocWithOffset(1);
1137 FormatTok->WhitespaceRange =
1138 SourceRange(GreaterLocation, GreaterLocation);
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001139 FormatTok->TokenText = ">";
Alexander Kornienko00895102013-06-05 14:09:10 +00001140 FormatTok->CodePointCount = 1;
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001141 GreaterStashed = false;
1142 return FormatTok;
1143 }
1144
Manuel Klimek96e888b2013-05-28 11:55:06 +00001145 FormatTok = new (Allocator.Allocate()) FormatToken;
1146 Lex.LexFromRawLexer(FormatTok->Tok);
1147 StringRef Text = rawTokenText(FormatTok->Tok);
Manuel Klimekde008c02013-05-27 15:23:34 +00001148 SourceLocation WhitespaceStart =
Manuel Klimek96e888b2013-05-28 11:55:06 +00001149 FormatTok->Tok.getLocation().getLocWithOffset(-TrailingWhitespace);
Manuel Klimekad3094b2013-05-23 10:56:37 +00001150 if (SourceMgr.getFileOffset(WhitespaceStart) == 0)
Manuel Klimek96e888b2013-05-28 11:55:06 +00001151 FormatTok->IsFirst = true;
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001152
1153 // Consume and record whitespace until we find a significant token.
Manuel Klimekde008c02013-05-27 15:23:34 +00001154 unsigned WhitespaceLength = TrailingWhitespace;
Manuel Klimek96e888b2013-05-28 11:55:06 +00001155 while (FormatTok->Tok.is(tok::unknown)) {
Manuel Klimeka28fc062013-02-11 12:33:24 +00001156 unsigned Newlines = Text.count('\n');
Daniel Jasper1eee6c42013-03-04 13:43:19 +00001157 if (Newlines > 0)
Manuel Klimek96e888b2013-05-28 11:55:06 +00001158 FormatTok->LastNewlineOffset = WhitespaceLength + Text.rfind('\n') + 1;
Manuel Klimek96e888b2013-05-28 11:55:06 +00001159 FormatTok->NewlinesBefore += Newlines;
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001160 unsigned EscapedNewlines = Text.count("\\\n");
Manuel Klimek96e888b2013-05-28 11:55:06 +00001161 FormatTok->HasUnescapedNewline |= EscapedNewlines != Newlines;
1162 WhitespaceLength += FormatTok->Tok.getLength();
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001163
Manuel Klimek96e888b2013-05-28 11:55:06 +00001164 Lex.LexFromRawLexer(FormatTok->Tok);
1165 Text = rawTokenText(FormatTok->Tok);
Manuel Klimekd4397b92013-01-04 23:34:14 +00001166 }
Manuel Klimek95419382013-01-07 07:56:50 +00001167
Manuel Klimekd4397b92013-01-04 23:34:14 +00001168 // In case the token starts with escaped newlines, we want to
1169 // take them into account as whitespace - this pattern is quite frequent
1170 // in macro definitions.
1171 // FIXME: What do we want to do with other escaped spaces, and escaped
1172 // spaces or newlines in the middle of tokens?
1173 // FIXME: Add a more explicit test.
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001174 while (Text.size() > 1 && Text[0] == '\\' && Text[1] == '\n') {
Manuel Klimek96e888b2013-05-28 11:55:06 +00001175 // FIXME: ++FormatTok->NewlinesBefore is missing...
Manuel Klimekad3094b2013-05-23 10:56:37 +00001176 WhitespaceLength += 2;
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001177 Text = Text.substr(2);
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001178 }
1179
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001180 TrailingWhitespace = 0;
1181 if (FormatTok->Tok.is(tok::comment)) {
1182 StringRef UntrimmedText = Text;
1183 Text = Text.rtrim();
1184 TrailingWhitespace = UntrimmedText.size() - Text.size();
1185 } else if (FormatTok->Tok.is(tok::raw_identifier)) {
Manuel Klimekd4397b92013-01-04 23:34:14 +00001186 IdentifierInfo &Info = IdentTable.get(Text);
Manuel Klimek96e888b2013-05-28 11:55:06 +00001187 FormatTok->Tok.setIdentifierInfo(&Info);
1188 FormatTok->Tok.setKind(Info.getTokenID());
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001189 } else if (FormatTok->Tok.is(tok::greatergreater)) {
Manuel Klimek96e888b2013-05-28 11:55:06 +00001190 FormatTok->Tok.setKind(tok::greater);
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001191 Text = Text.substr(0, 1);
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001192 GreaterStashed = true;
1193 }
1194
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001195 // Now FormatTok is the next non-whitespace token.
1196 FormatTok->TokenText = Text;
1197 FormatTok->CodePointCount = encoding::getCodePointCount(Text, Encoding);
Alexander Kornienko00895102013-06-05 14:09:10 +00001198
Manuel Klimek96e888b2013-05-28 11:55:06 +00001199 FormatTok->WhitespaceRange = SourceRange(
Manuel Klimekad3094b2013-05-23 10:56:37 +00001200 WhitespaceStart, WhitespaceStart.getLocWithOffset(WhitespaceLength));
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001201 return FormatTok;
1202 }
1203
Manuel Klimek96e888b2013-05-28 11:55:06 +00001204 FormatToken *FormatTok;
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001205 bool GreaterStashed;
Manuel Klimekde008c02013-05-27 15:23:34 +00001206 unsigned TrailingWhitespace;
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001207 Lexer &Lex;
1208 SourceManager &SourceMgr;
1209 IdentifierTable IdentTable;
Alexander Kornienko00895102013-06-05 14:09:10 +00001210 encoding::Encoding Encoding;
Manuel Klimek96e888b2013-05-28 11:55:06 +00001211 llvm::SpecificBumpPtrAllocator<FormatToken> Allocator;
1212 SmallVector<FormatToken *, 16> Tokens;
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001213
1214 /// Returns the text of \c FormatTok.
Manuel Klimek95419382013-01-07 07:56:50 +00001215 StringRef rawTokenText(Token &Tok) {
Alexander Kornienko469a21b2012-12-07 16:15:44 +00001216 return StringRef(SourceMgr.getCharacterData(Tok.getLocation()),
1217 Tok.getLength());
1218 }
1219};
1220
Daniel Jasperbac016b2012-12-03 18:12:45 +00001221class Formatter : public UnwrappedLineConsumer {
1222public:
Daniel Jaspercaf42a32013-05-15 08:14:19 +00001223 Formatter(const FormatStyle &Style, Lexer &Lex, SourceManager &SourceMgr,
Daniel Jasperbac016b2012-12-03 18:12:45 +00001224 const std::vector<CharSourceRange> &Ranges)
Daniel Jaspercaf42a32013-05-15 08:14:19 +00001225 : Style(Style), Lex(Lex), SourceMgr(SourceMgr),
Alexander Kornienko00895102013-06-05 14:09:10 +00001226 Whitespaces(SourceMgr, Style), Ranges(Ranges),
1227 Encoding(encoding::detectEncoding(Lex.getBuffer())) {
1228 DEBUG(llvm::dbgs()
1229 << "File encoding: "
1230 << (Encoding == encoding::Encoding_UTF8 ? "UTF8" : "unknown")
1231 << "\n");
1232 }
Daniel Jasperbac016b2012-12-03 18:12:45 +00001233
Daniel Jasper7d19bc22013-01-11 14:23:32 +00001234 virtual ~Formatter() {}
Daniel Jasperaccb0b02012-12-04 21:05:31 +00001235
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001236 tooling::Replacements format() {
Alexander Kornienko00895102013-06-05 14:09:10 +00001237 FormatTokenLexer Tokens(Lex, SourceMgr, Encoding);
Manuel Klimek96e888b2013-05-28 11:55:06 +00001238
1239 UnwrappedLineParser Parser(Style, Tokens.lex(), *this);
Manuel Klimek67d080d2013-04-12 14:13:36 +00001240 bool StructuralError = Parser.parse();
Alexander Kornienko00895102013-06-05 14:09:10 +00001241 TokenAnnotator Annotator(Style, Tokens.getIdentTable().get("in"));
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001242 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1243 Annotator.annotate(AnnotatedLines[i]);
1244 }
1245 deriveLocalStyle();
1246 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1247 Annotator.calculateFormattingInformation(AnnotatedLines[i]);
1248 }
Daniel Jasper5999f762013-04-09 17:46:55 +00001249
1250 // Adapt level to the next line if this is a comment.
1251 // FIXME: Can/should this be done in the UnwrappedLineParser?
Daniel Jasper1407bee2013-04-11 14:29:13 +00001252 const AnnotatedLine *NextNoneCommentLine = NULL;
Daniel Jasper5999f762013-04-09 17:46:55 +00001253 for (unsigned i = AnnotatedLines.size() - 1; i > 0; --i) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001254 if (NextNoneCommentLine && AnnotatedLines[i].First->is(tok::comment) &&
1255 !AnnotatedLines[i].First->Next)
Daniel Jasper5999f762013-04-09 17:46:55 +00001256 AnnotatedLines[i].Level = NextNoneCommentLine->Level;
1257 else
Alexander Kornienko70ce7882013-04-15 14:28:00 +00001258 NextNoneCommentLine =
Manuel Klimekb3987012013-05-29 14:47:47 +00001259 AnnotatedLines[i].First->isNot(tok::r_brace) ? &AnnotatedLines[i]
1260 : NULL;
Daniel Jasper5999f762013-04-09 17:46:55 +00001261 }
1262
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001263 std::vector<int> IndentForLevel;
1264 bool PreviousLineWasTouched = false;
Manuel Klimekb3987012013-05-29 14:47:47 +00001265 const FormatToken *PreviousLineLastToken = 0;
Daniel Jasper89b3a7f2013-05-10 13:00:49 +00001266 bool FormatPPDirective = false;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001267 for (std::vector<AnnotatedLine>::iterator I = AnnotatedLines.begin(),
1268 E = AnnotatedLines.end();
1269 I != E; ++I) {
1270 const AnnotatedLine &TheLine = *I;
Manuel Klimekb3987012013-05-29 14:47:47 +00001271 const FormatToken *FirstTok = TheLine.First;
1272 int Offset = getIndentOffset(*TheLine.First);
Daniel Jasper89b3a7f2013-05-10 13:00:49 +00001273
1274 // Check whether this line is part of a formatted preprocessor directive.
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001275 if (FirstTok->HasUnescapedNewline)
Daniel Jasper89b3a7f2013-05-10 13:00:49 +00001276 FormatPPDirective = false;
1277 if (!FormatPPDirective && TheLine.InPPDirective &&
1278 (touchesLine(TheLine) || touchesPPDirective(I + 1, E)))
1279 FormatPPDirective = true;
1280
Daniel Jasper1fb8d882013-05-14 09:30:02 +00001281 // Determine indent and try to merge multiple unwrapped lines.
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001282 while (IndentForLevel.size() <= TheLine.Level)
1283 IndentForLevel.push_back(-1);
1284 IndentForLevel.resize(TheLine.Level + 1);
Daniel Jasper1fb8d882013-05-14 09:30:02 +00001285 unsigned Indent = getIndent(IndentForLevel, TheLine.Level);
1286 if (static_cast<int>(Indent) + Offset >= 0)
1287 Indent += Offset;
1288 tryFitMultipleLinesInOne(Indent, I, E);
1289
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001290 bool WasMoved = PreviousLineWasTouched && FirstTok->NewlinesBefore == 0;
Manuel Klimekb3987012013-05-29 14:47:47 +00001291 if (TheLine.First->is(tok::eof)) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001292 if (PreviousLineWasTouched) {
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001293 unsigned NewLines = std::min(FirstTok->NewlinesBefore, 1u);
Manuel Klimekb3987012013-05-29 14:47:47 +00001294 Whitespaces.replaceWhitespace(*TheLine.First, NewLines, /*Indent*/ 0,
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001295 /*TargetColumn*/ 0);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001296 }
1297 } else if (TheLine.Type != LT_Invalid &&
Daniel Jasper89b3a7f2013-05-10 13:00:49 +00001298 (WasMoved || FormatPPDirective || touchesLine(TheLine))) {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001299 unsigned LevelIndent = getIndent(IndentForLevel, TheLine.Level);
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001300 if (FirstTok->WhitespaceRange.isValid() &&
Manuel Klimek67d080d2013-04-12 14:13:36 +00001301 // Insert a break even if there is a structural error in case where
1302 // we break apart a line consisting of multiple unwrapped lines.
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001303 (FirstTok->NewlinesBefore == 0 || !StructuralError)) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001304 formatFirstToken(*TheLine.First, PreviousLineLastToken, Indent,
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001305 TheLine.InPPDirective);
Manuel Klimek67d080d2013-04-12 14:13:36 +00001306 } else {
1307 Indent = LevelIndent =
Manuel Klimekdcb3f2a2013-05-28 13:42:28 +00001308 SourceMgr.getSpellingColumnNumber(FirstTok->Tok.getLocation()) -
1309 1;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001310 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001311 UnwrappedLineFormatter Formatter(Style, SourceMgr, TheLine, Indent,
Alexander Kornienko00895102013-06-05 14:09:10 +00001312 TheLine.First, Whitespaces, Encoding);
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001313 Formatter.format(I + 1 != E ? &*(I + 1) : NULL);
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001314 IndentForLevel[TheLine.Level] = LevelIndent;
1315 PreviousLineWasTouched = true;
1316 } else {
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001317 // Format the first token if necessary, and notify the WhitespaceManager
1318 // about the unchanged whitespace.
Manuel Klimekb3987012013-05-29 14:47:47 +00001319 for (const FormatToken *Tok = TheLine.First; Tok != NULL;
1320 Tok = Tok->Next) {
1321 if (Tok == TheLine.First &&
1322 (Tok->NewlinesBefore > 0 || Tok->IsFirst)) {
1323 unsigned LevelIndent =
1324 SourceMgr.getSpellingColumnNumber(Tok->Tok.getLocation()) - 1;
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001325 // Remove trailing whitespace of the previous line if it was
1326 // touched.
1327 if (PreviousLineWasTouched || touchesEmptyLineBefore(TheLine)) {
1328 formatFirstToken(*Tok, PreviousLineLastToken, LevelIndent,
1329 TheLine.InPPDirective);
1330 } else {
Manuel Klimekb3987012013-05-29 14:47:47 +00001331 Whitespaces.addUntouchableToken(*Tok, TheLine.InPPDirective);
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001332 }
Daniel Jasper1fb8d882013-05-14 09:30:02 +00001333
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001334 if (static_cast<int>(LevelIndent) - Offset >= 0)
1335 LevelIndent -= Offset;
1336 if (Tok->isNot(tok::comment))
1337 IndentForLevel[TheLine.Level] = LevelIndent;
1338 } else {
Manuel Klimekb3987012013-05-29 14:47:47 +00001339 Whitespaces.addUntouchableToken(*Tok, TheLine.InPPDirective);
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001340 }
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001341 }
1342 // If we did not reformat this unwrapped line, the column at the end of
1343 // the last token is unchanged - thus, we can calculate the end of the
1344 // last token.
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001345 PreviousLineWasTouched = false;
1346 }
Alexander Kornienko94b748f2013-03-27 17:08:02 +00001347 PreviousLineLastToken = I->Last;
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001348 }
1349 return Whitespaces.generateReplacements();
1350 }
1351
1352private:
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001353 void deriveLocalStyle() {
1354 unsigned CountBoundToVariable = 0;
1355 unsigned CountBoundToType = 0;
1356 bool HasCpp03IncompatibleFormat = false;
1357 for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001358 if (!AnnotatedLines[i].First->Next)
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001359 continue;
Manuel Klimekb3987012013-05-29 14:47:47 +00001360 FormatToken *Tok = AnnotatedLines[i].First->Next;
1361 while (Tok->Next) {
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001362 if (Tok->Type == TT_PointerOrReference) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001363 bool SpacesBefore =
1364 Tok->WhitespaceRange.getBegin() != Tok->WhitespaceRange.getEnd();
1365 bool SpacesAfter = Tok->Next->WhitespaceRange.getBegin() !=
1366 Tok->Next->WhitespaceRange.getEnd();
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001367 if (SpacesBefore && !SpacesAfter)
1368 ++CountBoundToVariable;
1369 else if (!SpacesBefore && SpacesAfter)
1370 ++CountBoundToType;
1371 }
1372
Daniel Jasper29f123b2013-02-08 15:28:42 +00001373 if (Tok->Type == TT_TemplateCloser &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001374 Tok->Previous->Type == TT_TemplateCloser &&
1375 Tok->WhitespaceRange.getBegin() == Tok->WhitespaceRange.getEnd())
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001376 HasCpp03IncompatibleFormat = true;
Manuel Klimekb3987012013-05-29 14:47:47 +00001377 Tok = Tok->Next;
Daniel Jasper8ff690a2013-02-06 14:22:40 +00001378 }
1379 }
1380 if (Style.DerivePointerBinding) {
1381 if (CountBoundToType > CountBoundToVariable)
1382 Style.PointerBindsToType = true;
1383 else if (CountBoundToType < CountBoundToVariable)
1384 Style.PointerBindsToType = false;
1385 }
1386 if (Style.Standard == FormatStyle::LS_Auto) {
1387 Style.Standard = HasCpp03IncompatibleFormat ? FormatStyle::LS_Cpp11
1388 : FormatStyle::LS_Cpp03;
1389 }
1390 }
1391
Manuel Klimek547d5db2013-02-08 17:38:27 +00001392 /// \brief Get the indent of \p Level from \p IndentForLevel.
1393 ///
1394 /// \p IndentForLevel must contain the indent for the level \c l
1395 /// at \p IndentForLevel[l], or a value < 0 if the indent for
1396 /// that level is unknown.
Daniel Jasperfc759082013-02-14 14:26:07 +00001397 unsigned getIndent(const std::vector<int> IndentForLevel, unsigned Level) {
Manuel Klimek547d5db2013-02-08 17:38:27 +00001398 if (IndentForLevel[Level] != -1)
1399 return IndentForLevel[Level];
Manuel Klimek52635ff2013-02-08 19:53:32 +00001400 if (Level == 0)
1401 return 0;
Manuel Klimek07a64ec2013-05-13 08:42:42 +00001402 return getIndent(IndentForLevel, Level - 1) + Style.IndentWidth;
Manuel Klimek547d5db2013-02-08 17:38:27 +00001403 }
1404
1405 /// \brief Get the offset of the line relatively to the level.
1406 ///
1407 /// For example, 'public:' labels in classes are offset by 1 or 2
1408 /// characters to the left from their level.
Manuel Klimekb3987012013-05-29 14:47:47 +00001409 int getIndentOffset(const FormatToken &RootToken) {
Alexander Kornienko94b748f2013-03-27 17:08:02 +00001410 if (RootToken.isAccessSpecifier(false) || RootToken.isObjCAccessSpecifier())
Manuel Klimek547d5db2013-02-08 17:38:27 +00001411 return Style.AccessModifierOffset;
1412 return 0;
1413 }
1414
Manuel Klimek517e8942013-01-11 17:54:10 +00001415 /// \brief Tries to merge lines into one.
1416 ///
1417 /// This will change \c Line and \c AnnotatedLine to contain the merged line,
1418 /// if possible; note that \c I will be incremented when lines are merged.
Daniel Jasper3f8cdbf2013-01-16 10:41:46 +00001419 void tryFitMultipleLinesInOne(unsigned Indent,
Daniel Jasper995e8202013-01-14 13:08:07 +00001420 std::vector<AnnotatedLine>::iterator &I,
1421 std::vector<AnnotatedLine>::iterator E) {
Daniel Jasper3f8cdbf2013-01-16 10:41:46 +00001422 // We can never merge stuff if there are trailing line comments.
1423 if (I->Last->Type == TT_LineComment)
1424 return;
1425
Daniel Jaspera4d46212013-02-28 11:05:57 +00001426 unsigned Limit = Style.ColumnLimit - Indent;
Daniel Jasperf11a7052013-02-21 21:33:55 +00001427 // If we already exceed the column limit, we set 'Limit' to 0. The different
1428 // tryMerge..() functions can then decide whether to still do merging.
1429 Limit = I->Last->TotalLength > Limit ? 0 : Limit - I->Last->TotalLength;
Daniel Jasper55b08e72013-01-16 07:02:34 +00001430
Daniel Jasper9c8c40e2013-01-21 14:18:28 +00001431 if (I + 1 == E || (I + 1)->Type == LT_Invalid)
Daniel Jasper3f8cdbf2013-01-16 10:41:46 +00001432 return;
Manuel Klimek517e8942013-01-11 17:54:10 +00001433
Daniel Jasper5be59ba2013-05-15 14:09:55 +00001434 if (I->Last->is(tok::l_brace)) {
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001435 tryMergeSimpleBlock(I, E, Limit);
Daniel Jasperf11bbb92013-05-16 12:12:21 +00001436 } else if (Style.AllowShortIfStatementsOnASingleLine &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001437 I->First->is(tok::kw_if)) {
Daniel Jasperf11bbb92013-05-16 12:12:21 +00001438 tryMergeSimpleControlStatement(I, E, Limit);
1439 } else if (Style.AllowShortLoopsOnASingleLine &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001440 I->First->isOneOf(tok::kw_for, tok::kw_while)) {
Daniel Jasperf11bbb92013-05-16 12:12:21 +00001441 tryMergeSimpleControlStatement(I, E, Limit);
Manuel Klimekb3987012013-05-29 14:47:47 +00001442 } else if (I->InPPDirective &&
1443 (I->First->HasUnescapedNewline || I->First->IsFirst)) {
Daniel Jaspere0b15ea2013-01-14 15:40:57 +00001444 tryMergeSimplePPDirective(I, E, Limit);
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001445 }
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001446 }
1447
Daniel Jaspere0b15ea2013-01-14 15:40:57 +00001448 void tryMergeSimplePPDirective(std::vector<AnnotatedLine>::iterator &I,
1449 std::vector<AnnotatedLine>::iterator E,
1450 unsigned Limit) {
Daniel Jasperf11a7052013-02-21 21:33:55 +00001451 if (Limit == 0)
1452 return;
Daniel Jaspere0b15ea2013-01-14 15:40:57 +00001453 AnnotatedLine &Line = *I;
Manuel Klimekb3987012013-05-29 14:47:47 +00001454 if (!(I + 1)->InPPDirective || (I + 1)->First->HasUnescapedNewline)
Daniel Jasper2b9c10b2013-01-14 15:52:06 +00001455 return;
Daniel Jaspere0b15ea2013-01-14 15:40:57 +00001456 if (I + 2 != E && (I + 2)->InPPDirective &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001457 !(I + 2)->First->HasUnescapedNewline)
Daniel Jaspere0b15ea2013-01-14 15:40:57 +00001458 return;
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001459 if (1 + (I + 1)->Last->TotalLength > Limit)
Daniel Jasper3f8cdbf2013-01-16 10:41:46 +00001460 return;
Daniel Jaspere0b15ea2013-01-14 15:40:57 +00001461 join(Line, *(++I));
1462 }
1463
Daniel Jasperf11bbb92013-05-16 12:12:21 +00001464 void tryMergeSimpleControlStatement(std::vector<AnnotatedLine>::iterator &I,
1465 std::vector<AnnotatedLine>::iterator E,
1466 unsigned Limit) {
Daniel Jasperf11a7052013-02-21 21:33:55 +00001467 if (Limit == 0)
1468 return;
Manuel Klimek4c128122013-01-18 14:46:43 +00001469 if ((I + 1)->InPPDirective != I->InPPDirective ||
Manuel Klimekb3987012013-05-29 14:47:47 +00001470 ((I + 1)->InPPDirective && (I + 1)->First->HasUnescapedNewline))
Manuel Klimek4c128122013-01-18 14:46:43 +00001471 return;
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001472 AnnotatedLine &Line = *I;
Daniel Jasper55b08e72013-01-16 07:02:34 +00001473 if (Line.Last->isNot(tok::r_paren))
1474 return;
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001475 if (1 + (I + 1)->Last->TotalLength > Limit)
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001476 return;
Manuel Klimekb3987012013-05-29 14:47:47 +00001477 if ((I + 1)->First->isOneOf(tok::semi, tok::kw_if, tok::kw_for,
1478 tok::kw_while) ||
1479 (I + 1)->First->Type == TT_LineComment)
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001480 return;
1481 // Only inline simple if's (no nested if or else).
Manuel Klimekb3987012013-05-29 14:47:47 +00001482 if (I + 2 != E && Line.First->is(tok::kw_if) &&
1483 (I + 2)->First->is(tok::kw_else))
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001484 return;
1485 join(Line, *(++I));
1486 }
1487
1488 void tryMergeSimpleBlock(std::vector<AnnotatedLine>::iterator &I,
Daniel Jasper1a1ce832013-01-29 11:27:30 +00001489 std::vector<AnnotatedLine>::iterator E,
1490 unsigned Limit) {
Daniel Jasper5be59ba2013-05-15 14:09:55 +00001491 // No merging if the brace already is on the next line.
1492 if (Style.BreakBeforeBraces != FormatStyle::BS_Attach)
1493 return;
1494
Manuel Klimek517e8942013-01-11 17:54:10 +00001495 // First, check that the current line allows merging. This is the case if
1496 // we're not in a control flow statement and the last token is an opening
1497 // brace.
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001498 AnnotatedLine &Line = *I;
Manuel Klimekb3987012013-05-29 14:47:47 +00001499 if (Line.First->isOneOf(tok::kw_if, tok::kw_while, tok::kw_do, tok::r_brace,
1500 tok::kw_else, tok::kw_try, tok::kw_catch,
Daniel Jasper8893b8a2013-05-31 14:56:20 +00001501 tok::kw_for,
Manuel Klimekb3987012013-05-29 14:47:47 +00001502 // This gets rid of all ObjC @ keywords and methods.
1503 tok::at, tok::minus, tok::plus))
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001504 return;
Manuel Klimek517e8942013-01-11 17:54:10 +00001505
Manuel Klimekb3987012013-05-29 14:47:47 +00001506 FormatToken *Tok = (I + 1)->First;
Daniel Jasper8893b8a2013-05-31 14:56:20 +00001507 if (Tok->is(tok::r_brace) && !Tok->MustBreakBefore &&
1508 (Tok->getNextNoneComment() == NULL ||
1509 Tok->getNextNoneComment()->is(tok::semi))) {
Daniel Jasperf11a7052013-02-21 21:33:55 +00001510 // We merge empty blocks even if the line exceeds the column limit.
Daniel Jasper729a7432013-02-11 12:36:37 +00001511 Tok->SpacesRequiredBefore = 0;
Daniel Jasperf11a7052013-02-21 21:33:55 +00001512 Tok->CanBreakBefore = true;
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001513 join(Line, *(I + 1));
1514 I += 1;
Daniel Jasper8893b8a2013-05-31 14:56:20 +00001515 } else if (Limit != 0 && Line.First->isNot(tok::kw_namespace)) {
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001516 // Check that we still have three lines and they fit into the limit.
1517 if (I + 2 == E || (I + 2)->Type == LT_Invalid ||
1518 !nextTwoLinesFitInto(I, Limit))
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001519 return;
Manuel Klimek517e8942013-01-11 17:54:10 +00001520
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001521 // Second, check that the next line does not contain any braces - if it
1522 // does, readability declines when putting it into a single line.
1523 if ((I + 1)->Last->Type == TT_LineComment || Tok->MustBreakBefore)
1524 return;
1525 do {
Alexander Kornienkoe74de282013-03-13 14:41:29 +00001526 if (Tok->isOneOf(tok::l_brace, tok::r_brace))
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001527 return;
Manuel Klimekb3987012013-05-29 14:47:47 +00001528 Tok = Tok->Next;
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001529 } while (Tok != NULL);
Manuel Klimek517e8942013-01-11 17:54:10 +00001530
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001531 // Last, check that the third line contains a single closing brace.
Manuel Klimekb3987012013-05-29 14:47:47 +00001532 Tok = (I + 2)->First;
Daniel Jasper058f6f82013-05-16 10:17:39 +00001533 if (Tok->getNextNoneComment() != NULL || Tok->isNot(tok::r_brace) ||
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001534 Tok->MustBreakBefore)
1535 return;
1536
1537 join(Line, *(I + 1));
1538 join(Line, *(I + 2));
1539 I += 2;
Manuel Klimek517e8942013-01-11 17:54:10 +00001540 }
Daniel Jasperfeb18f52013-01-14 14:14:23 +00001541 }
1542
1543 bool nextTwoLinesFitInto(std::vector<AnnotatedLine>::iterator I,
1544 unsigned Limit) {
Manuel Klimek2f1ac412013-01-21 16:42:44 +00001545 return 1 + (I + 1)->Last->TotalLength + 1 + (I + 2)->Last->TotalLength <=
1546 Limit;
Manuel Klimek517e8942013-01-11 17:54:10 +00001547 }
1548
Daniel Jasper995e8202013-01-14 13:08:07 +00001549 void join(AnnotatedLine &A, const AnnotatedLine &B) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001550 assert(!A.Last->Next);
1551 assert(!B.First->Previous);
1552 A.Last->Next = B.First;
1553 B.First->Previous = A.Last;
1554 unsigned LengthA = A.Last->TotalLength + B.First->SpacesRequiredBefore;
1555 for (FormatToken *Tok = B.First; Tok; Tok = Tok->Next) {
1556 Tok->TotalLength += LengthA;
1557 A.Last = Tok;
Daniel Jasper995e8202013-01-14 13:08:07 +00001558 }
Manuel Klimekf9ea2ed2013-01-10 19:49:59 +00001559 }
1560
Daniel Jasper6f21a982013-03-13 07:49:51 +00001561 bool touchesRanges(const CharSourceRange &Range) {
Daniel Jasperf3023542013-03-07 20:50:00 +00001562 for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
1563 if (!SourceMgr.isBeforeInTranslationUnit(Range.getEnd(),
1564 Ranges[i].getBegin()) &&
1565 !SourceMgr.isBeforeInTranslationUnit(Ranges[i].getEnd(),
1566 Range.getBegin()))
1567 return true;
1568 }
1569 return false;
1570 }
1571
1572 bool touchesLine(const AnnotatedLine &TheLine) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001573 const FormatToken *First = TheLine.First;
1574 const FormatToken *Last = TheLine.Last;
Daniel Jasper84f5ddf2013-05-14 10:31:09 +00001575 CharSourceRange LineRange = CharSourceRange::getCharRange(
Manuel Klimekad3094b2013-05-23 10:56:37 +00001576 First->WhitespaceRange.getBegin().getLocWithOffset(
1577 First->LastNewlineOffset),
Alexander Kornienko54e6c9d2013-06-07 17:45:07 +00001578 Last->Tok.getLocation().getLocWithOffset(Last->TokenText.size() - 1));
Daniel Jasperf3023542013-03-07 20:50:00 +00001579 return touchesRanges(LineRange);
1580 }
1581
Daniel Jasper89b3a7f2013-05-10 13:00:49 +00001582 bool touchesPPDirective(std::vector<AnnotatedLine>::iterator I,
1583 std::vector<AnnotatedLine>::iterator E) {
1584 for (; I != E; ++I) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001585 if (I->First->HasUnescapedNewline)
Daniel Jasper89b3a7f2013-05-10 13:00:49 +00001586 return false;
1587 if (touchesLine(*I))
1588 return true;
1589 }
1590 return false;
1591 }
1592
Daniel Jasperf3023542013-03-07 20:50:00 +00001593 bool touchesEmptyLineBefore(const AnnotatedLine &TheLine) {
Manuel Klimekb3987012013-05-29 14:47:47 +00001594 const FormatToken *First = TheLine.First;
Daniel Jasperf3023542013-03-07 20:50:00 +00001595 CharSourceRange LineRange = CharSourceRange::getCharRange(
Manuel Klimekad3094b2013-05-23 10:56:37 +00001596 First->WhitespaceRange.getBegin(),
1597 First->WhitespaceRange.getBegin().getLocWithOffset(
1598 First->LastNewlineOffset));
Daniel Jasperf3023542013-03-07 20:50:00 +00001599 return touchesRanges(LineRange);
Manuel Klimekf9ea2ed2013-01-10 19:49:59 +00001600 }
1601
1602 virtual void consumeUnwrappedLine(const UnwrappedLine &TheLine) {
Daniel Jaspercbb6c412013-01-16 09:10:19 +00001603 AnnotatedLines.push_back(AnnotatedLine(TheLine));
Daniel Jasperbac016b2012-12-03 18:12:45 +00001604 }
1605
Manuel Klimek3f8c7f32013-01-10 18:45:26 +00001606 /// \brief Add a new line and the required indent before the first Token
1607 /// of the \c UnwrappedLine if there was no structural parsing error.
1608 /// Returns the indent level of the \c UnwrappedLine.
Manuel Klimekb3987012013-05-29 14:47:47 +00001609 void formatFirstToken(const FormatToken &RootToken,
1610 const FormatToken *PreviousToken, unsigned Indent,
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001611 bool InPPDirective) {
Daniel Jasper1a1ce832013-01-29 11:27:30 +00001612 unsigned Newlines =
Manuel Klimekb3987012013-05-29 14:47:47 +00001613 std::min(RootToken.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1);
Daniel Jasper15f33f02013-06-03 16:16:41 +00001614 // Remove empty lines before "}" where applicable.
1615 if (RootToken.is(tok::r_brace) &&
1616 (!RootToken.Next ||
1617 (RootToken.Next->is(tok::semi) && !RootToken.Next->Next)))
1618 Newlines = std::min(Newlines, 1u);
Manuel Klimekb3987012013-05-29 14:47:47 +00001619 if (Newlines == 0 && !RootToken.IsFirst)
Manuel Klimek3f8c7f32013-01-10 18:45:26 +00001620 Newlines = 1;
Manuel Klimek3f8c7f32013-01-10 18:45:26 +00001621
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001622 // Insert extra new line before access specifiers.
1623 if (PreviousToken && PreviousToken->isOneOf(tok::semi, tok::r_brace) &&
Manuel Klimekb3987012013-05-29 14:47:47 +00001624 RootToken.isAccessSpecifier() && RootToken.NewlinesBefore == 1)
Manuel Klimeke573c3f2013-05-22 12:51:29 +00001625 ++Newlines;
Alexander Kornienko94b748f2013-03-27 17:08:02 +00001626
Manuel Klimekb3987012013-05-29 14:47:47 +00001627 Whitespaces.replaceWhitespace(
1628 RootToken, Newlines, Indent, Indent,
1629 InPPDirective && !RootToken.HasUnescapedNewline);
Manuel Klimek3f8c7f32013-01-10 18:45:26 +00001630 }
1631
Daniel Jasperbac016b2012-12-03 18:12:45 +00001632 FormatStyle Style;
1633 Lexer &Lex;
1634 SourceManager &SourceMgr;
Daniel Jasperdcc2a622013-01-18 08:44:07 +00001635 WhitespaceManager Whitespaces;
Daniel Jasperbac016b2012-12-03 18:12:45 +00001636 std::vector<CharSourceRange> Ranges;
Daniel Jasper995e8202013-01-14 13:08:07 +00001637 std::vector<AnnotatedLine> AnnotatedLines;
Alexander Kornienko00895102013-06-05 14:09:10 +00001638
1639 encoding::Encoding Encoding;
Daniel Jasperbac016b2012-12-03 18:12:45 +00001640};
1641
Alexander Kornienko70ce7882013-04-15 14:28:00 +00001642tooling::Replacements reformat(const FormatStyle &Style, Lexer &Lex,
1643 SourceManager &SourceMgr,
Daniel Jaspercaf42a32013-05-15 08:14:19 +00001644 std::vector<CharSourceRange> Ranges) {
1645 Formatter formatter(Style, Lex, SourceMgr, Ranges);
Daniel Jasperbac016b2012-12-03 18:12:45 +00001646 return formatter.format();
1647}
1648
Daniel Jasper8a999452013-05-16 10:40:07 +00001649tooling::Replacements reformat(const FormatStyle &Style, StringRef Code,
1650 std::vector<tooling::Range> Ranges,
1651 StringRef FileName) {
1652 FileManager Files((FileSystemOptions()));
1653 DiagnosticsEngine Diagnostics(
1654 IntrusiveRefCntPtr<DiagnosticIDs>(new DiagnosticIDs),
1655 new DiagnosticOptions);
1656 SourceManager SourceMgr(Diagnostics, Files);
1657 llvm::MemoryBuffer *Buf = llvm::MemoryBuffer::getMemBuffer(Code, FileName);
1658 const clang::FileEntry *Entry =
1659 Files.getVirtualFile(FileName, Buf->getBufferSize(), 0);
1660 SourceMgr.overrideFileContents(Entry, Buf);
1661 FileID ID =
1662 SourceMgr.createFileID(Entry, SourceLocation(), clang::SrcMgr::C_User);
Alexander Kornienkoa1753f42013-06-28 12:51:24 +00001663 Lexer Lex(ID, SourceMgr.getBuffer(ID), SourceMgr,
1664 getFormattingLangOpts(Style.Standard));
Daniel Jasper8a999452013-05-16 10:40:07 +00001665 SourceLocation StartOfFile = SourceMgr.getLocForStartOfFile(ID);
1666 std::vector<CharSourceRange> CharRanges;
1667 for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
1668 SourceLocation Start = StartOfFile.getLocWithOffset(Ranges[i].getOffset());
1669 SourceLocation End = Start.getLocWithOffset(Ranges[i].getLength());
1670 CharRanges.push_back(CharSourceRange::getCharRange(Start, End));
1671 }
1672 return reformat(Style, Lex, SourceMgr, CharRanges);
1673}
1674
Alexander Kornienkoa1753f42013-06-28 12:51:24 +00001675LangOptions getFormattingLangOpts(FormatStyle::LanguageStandard Standard) {
Daniel Jasper46ef8522013-01-10 13:08:12 +00001676 LangOptions LangOpts;
1677 LangOpts.CPlusPlus = 1;
Alexander Kornienkoa1753f42013-06-28 12:51:24 +00001678 LangOpts.CPlusPlus11 = Standard == FormatStyle::LS_Cpp03 ? 0 : 1;
Daniel Jasperb64eca02013-03-22 10:01:29 +00001679 LangOpts.LineComment = 1;
Daniel Jasper46ef8522013-01-10 13:08:12 +00001680 LangOpts.Bool = 1;
1681 LangOpts.ObjC1 = 1;
1682 LangOpts.ObjC2 = 1;
1683 return LangOpts;
1684}
1685
Daniel Jaspercd162382013-01-07 13:26:07 +00001686} // namespace format
1687} // namespace clang