blob: a5477a996327b6de01a2335a659dae08572c5a77 [file] [log] [blame]
Alexander Kornienkocb45bc12013-04-15 14:28:00 +00001//===--- WhitespaceManager.cpp - Format C++ code --------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9///
10/// \file
11/// \brief This file implements WhitespaceManager class.
12///
13//===----------------------------------------------------------------------===//
14
15#include "WhitespaceManager.h"
16#include "llvm/ADT/STLExtras.h"
17
18namespace clang {
19namespace format {
20
Daniel Jasperb05a81d2014-05-09 13:11:16 +000021bool WhitespaceManager::Change::IsBeforeInFile::
22operator()(const Change &C1, const Change &C2) const {
Manuel Klimek4fe43002013-05-22 12:51:29 +000023 return SourceMgr.isBeforeInTranslationUnit(
24 C1.OriginalWhitespaceRange.getBegin(),
25 C2.OriginalWhitespaceRange.getBegin());
26}
Daniel Jasper6fe2f002013-04-25 08:56:26 +000027
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000028WhitespaceManager::Change::Change(const FormatToken &Tok,
29 bool CreateReplacement,
30 SourceRange OriginalWhitespaceRange,
31 int Spaces, unsigned StartOfTokenColumn,
32 unsigned NewlinesBefore,
33 StringRef PreviousLinePostfix,
34 StringRef CurrentLinePrefix,
35 bool ContinuesPPDirective, bool IsInsideToken)
36 : Tok(&Tok), CreateReplacement(CreateReplacement),
Manuel Klimek4fe43002013-05-22 12:51:29 +000037 OriginalWhitespaceRange(OriginalWhitespaceRange),
38 StartOfTokenColumn(StartOfTokenColumn), NewlinesBefore(NewlinesBefore),
39 PreviousLinePostfix(PreviousLinePostfix),
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000040 CurrentLinePrefix(CurrentLinePrefix),
41 ContinuesPPDirective(ContinuesPPDirective), Spaces(Spaces),
42 IsInsideToken(IsInsideToken), IsTrailingComment(false), TokenLength(0),
43 PreviousEndOfTokenColumn(0), EscapedNewlineColumn(0),
Manuel Klimek2d293402015-03-03 14:21:48 +000044 StartOfBlockComment(nullptr), IndentationOffset(0) {}
Manuel Klimek4fe43002013-05-22 12:51:29 +000045
Manuel Klimek71814b42013-10-11 21:25:45 +000046void WhitespaceManager::replaceWhitespace(FormatToken &Tok, unsigned Newlines,
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000047 unsigned Spaces,
Manuel Klimek4fe43002013-05-22 12:51:29 +000048 unsigned StartOfTokenColumn,
49 bool InPPDirective) {
Manuel Klimek71814b42013-10-11 21:25:45 +000050 if (Tok.Finalized)
51 return;
52 Tok.Decision = (Newlines > 0) ? FD_Break : FD_Continue;
Nikola Smiljanic92b397f2017-03-23 02:51:25 +000053 Changes.push_back(Change(Tok, /*CreateReplacement=*/true, Tok.WhitespaceRange,
54 Spaces, StartOfTokenColumn, Newlines, "", "",
55 InPPDirective && !Tok.IsFirst,
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000056 /*IsInsideToken=*/false));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000057}
58
Manuel Klimek4fe43002013-05-22 12:51:29 +000059void WhitespaceManager::addUntouchableToken(const FormatToken &Tok,
60 bool InPPDirective) {
Manuel Klimek71814b42013-10-11 21:25:45 +000061 if (Tok.Finalized)
62 return;
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000063 Changes.push_back(Change(Tok, /*CreateReplacement=*/false,
64 Tok.WhitespaceRange, /*Spaces=*/0,
65 Tok.OriginalColumn, Tok.NewlinesBefore, "", "",
66 InPPDirective && !Tok.IsFirst,
67 /*IsInsideToken=*/false));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000068}
69
Krasimir Georgiev9ad83fe2017-10-30 14:01:50 +000070llvm::Error
71WhitespaceManager::addReplacement(const tooling::Replacement &Replacement) {
72 return Replaces.add(Replacement);
73}
74
Alexander Kornienko555efc32013-06-11 16:01:49 +000075void WhitespaceManager::replaceWhitespaceInToken(
76 const FormatToken &Tok, unsigned Offset, unsigned ReplaceChars,
77 StringRef PreviousPostfix, StringRef CurrentPrefix, bool InPPDirective,
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000078 unsigned Newlines, int Spaces) {
Manuel Klimek71814b42013-10-11 21:25:45 +000079 if (Tok.Finalized)
80 return;
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +000081 SourceLocation Start = Tok.getStartOfNonWhitespace().getLocWithOffset(Offset);
Daniel Jasper7d42f3f2017-01-31 11:25:01 +000082 Changes.push_back(
83 Change(Tok, /*CreateReplacement=*/true,
84 SourceRange(Start, Start.getLocWithOffset(ReplaceChars)), Spaces,
85 std::max(0, Spaces), Newlines, PreviousPostfix, CurrentPrefix,
86 InPPDirective && !Tok.IsFirst, /*IsInsideToken=*/true));
Alexander Kornienkocb45bc12013-04-15 14:28:00 +000087}
88
Manuel Klimek4fe43002013-05-22 12:51:29 +000089const tooling::Replacements &WhitespaceManager::generateReplacements() {
90 if (Changes.empty())
91 return Replaces;
92
93 std::sort(Changes.begin(), Changes.end(), Change::IsBeforeInFile(SourceMgr));
94 calculateLineBreakInformation();
Daniel Jaspere12597c2015-10-01 10:06:54 +000095 alignConsecutiveDeclarations();
Daniel Jaspera44991332015-04-29 13:06:49 +000096 alignConsecutiveAssignments();
Manuel Klimek4fe43002013-05-22 12:51:29 +000097 alignTrailingComments();
98 alignEscapedNewlines();
99 generateChanges();
100
101 return Replaces;
102}
103
104void WhitespaceManager::calculateLineBreakInformation() {
105 Changes[0].PreviousEndOfTokenColumn = 0;
Benjamin Kramerdab50462016-01-11 16:27:16 +0000106 Change *LastOutsideTokenChange = &Changes[0];
Manuel Klimek4fe43002013-05-22 12:51:29 +0000107 for (unsigned i = 1, e = Changes.size(); i != e; ++i) {
Krasimir Georgieve1518822017-06-07 14:05:06 +0000108 SourceLocation OriginalWhitespaceStart =
109 Changes[i].OriginalWhitespaceRange.getBegin();
110 SourceLocation PreviousOriginalWhitespaceEnd =
111 Changes[i - 1].OriginalWhitespaceRange.getEnd();
112 unsigned OriginalWhitespaceStartOffset =
113 SourceMgr.getFileOffset(OriginalWhitespaceStart);
114 unsigned PreviousOriginalWhitespaceEndOffset =
115 SourceMgr.getFileOffset(PreviousOriginalWhitespaceEnd);
116 assert(PreviousOriginalWhitespaceEndOffset <=
117 OriginalWhitespaceStartOffset);
118 const char *const PreviousOriginalWhitespaceEndData =
119 SourceMgr.getCharacterData(PreviousOriginalWhitespaceEnd);
120 StringRef Text(PreviousOriginalWhitespaceEndData,
121 SourceMgr.getCharacterData(OriginalWhitespaceStart) -
122 PreviousOriginalWhitespaceEndData);
123 // Usually consecutive changes would occur in consecutive tokens. This is
124 // not the case however when analyzing some preprocessor runs of the
125 // annotated lines. For example, in this code:
126 //
127 // #if A // line 1
128 // int i = 1;
129 // #else B // line 2
130 // int i = 2;
131 // #endif // line 3
132 //
133 // one of the runs will produce the sequence of lines marked with line 1, 2
134 // and 3. So the two consecutive whitespace changes just before '// line 2'
135 // and before '#endif // line 3' span multiple lines and tokens:
136 //
137 // #else B{change X}[// line 2
138 // int i = 2;
139 // ]{change Y}#endif // line 3
140 //
141 // For this reason, if the text between consecutive changes spans multiple
142 // newlines, the token length must be adjusted to the end of the original
143 // line of the token.
144 auto NewlinePos = Text.find_first_of('\n');
145 if (NewlinePos == StringRef::npos) {
146 Changes[i - 1].TokenLength = OriginalWhitespaceStartOffset -
147 PreviousOriginalWhitespaceEndOffset +
148 Changes[i].PreviousLinePostfix.size() +
149 Changes[i - 1].CurrentLinePrefix.size();
150 } else {
151 Changes[i - 1].TokenLength =
152 NewlinePos + Changes[i - 1].CurrentLinePrefix.size();
153 }
Manuel Klimek4fe43002013-05-22 12:51:29 +0000154
Benjamin Kramerdab50462016-01-11 16:27:16 +0000155 // If there are multiple changes in this token, sum up all the changes until
156 // the end of the line.
Krasimir Georgiev59ed77b2017-06-04 19:27:02 +0000157 if (Changes[i - 1].IsInsideToken && Changes[i - 1].NewlinesBefore == 0)
Benjamin Kramerdab50462016-01-11 16:27:16 +0000158 LastOutsideTokenChange->TokenLength +=
159 Changes[i - 1].TokenLength + Changes[i - 1].Spaces;
160 else
161 LastOutsideTokenChange = &Changes[i - 1];
162
Manuel Klimek4fe43002013-05-22 12:51:29 +0000163 Changes[i].PreviousEndOfTokenColumn =
164 Changes[i - 1].StartOfTokenColumn + Changes[i - 1].TokenLength;
165
166 Changes[i - 1].IsTrailingComment =
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000167 (Changes[i].NewlinesBefore > 0 || Changes[i].Tok->is(tok::eof) ||
168 (Changes[i].IsInsideToken && Changes[i].Tok->is(tok::comment))) &&
169 Changes[i - 1].Tok->is(tok::comment) &&
Krasimir Georgiev91834222017-01-25 13:58:58 +0000170 // FIXME: This is a dirty hack. The problem is that
171 // BreakableLineCommentSection does comment reflow changes and here is
172 // the aligning of trailing comments. Consider the case where we reflow
173 // the second line up in this example:
Manuel Klimek89628f62017-09-20 09:51:03 +0000174 //
Krasimir Georgiev91834222017-01-25 13:58:58 +0000175 // // line 1
176 // // line 2
Manuel Klimek89628f62017-09-20 09:51:03 +0000177 //
Krasimir Georgiev91834222017-01-25 13:58:58 +0000178 // That amounts to 2 changes by BreakableLineCommentSection:
179 // - the first, delimited by (), for the whitespace between the tokens,
180 // - and second, delimited by [], for the whitespace at the beginning
181 // of the second token:
Manuel Klimek89628f62017-09-20 09:51:03 +0000182 //
Krasimir Georgiev91834222017-01-25 13:58:58 +0000183 // // line 1(
184 // )[// ]line 2
185 //
186 // So in the end we have two changes like this:
187 //
188 // // line1()[ ]line 2
189 //
190 // Note that the OriginalWhitespaceStart of the second change is the
191 // same as the PreviousOriginalWhitespaceEnd of the first change.
192 // In this case, the below check ensures that the second change doesn't
193 // get treated as a trailing comment change here, since this might
194 // trigger additional whitespace to be wrongly inserted before "line 2"
195 // by the comment aligner here.
196 //
197 // For a proper solution we need a mechanism to say to WhitespaceManager
198 // that a particular change breaks the current sequence of trailing
199 // comments.
200 OriginalWhitespaceStart != PreviousOriginalWhitespaceEnd;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000201 }
Manuel Klimek05c67892013-05-22 14:01:08 +0000202 // FIXME: The last token is currently not always an eof token; in those
203 // cases, setting TokenLength of the last token to 0 is wrong.
204 Changes.back().TokenLength = 0;
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000205 Changes.back().IsTrailingComment = Changes.back().Tok->is(tok::comment);
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000206
207 const WhitespaceManager::Change *LastBlockComment = nullptr;
208 for (auto &Change : Changes) {
Benjamin Kramerdab50462016-01-11 16:27:16 +0000209 // Reset the IsTrailingComment flag for changes inside of trailing comments
Krasimir Georgievd105b722017-02-03 10:18:25 +0000210 // so they don't get realigned later. Comment line breaks however still need
211 // to be aligned.
212 if (Change.IsInsideToken && Change.NewlinesBefore == 0)
Benjamin Kramerdab50462016-01-11 16:27:16 +0000213 Change.IsTrailingComment = false;
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000214 Change.StartOfBlockComment = nullptr;
215 Change.IndentationOffset = 0;
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000216 if (Change.Tok->is(tok::comment)) {
217 if (Change.Tok->is(TT_LineComment) || !Change.IsInsideToken)
218 LastBlockComment = &Change;
219 else {
220 if ((Change.StartOfBlockComment = LastBlockComment))
221 Change.IndentationOffset =
222 Change.StartOfTokenColumn -
223 Change.StartOfBlockComment->StartOfTokenColumn;
224 }
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000225 } else {
226 LastBlockComment = nullptr;
227 }
228 }
Manuel Klimek4fe43002013-05-22 12:51:29 +0000229}
230
Daniel Jasperec90e512015-12-01 12:00:43 +0000231// Align a single sequence of tokens, see AlignTokens below.
232template <typename F>
233static void
234AlignTokenSequence(unsigned Start, unsigned End, unsigned Column, F &&Matches,
235 SmallVector<WhitespaceManager::Change, 16> &Changes) {
236 bool FoundMatchOnLine = false;
237 int Shift = 0;
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000238
239 // ScopeStack keeps track of the current scope depth. It contains indices of
240 // the first token on each scope.
241 // We only run the "Matches" function on tokens from the outer-most scope.
242 // However, we do need to pay special attention to one class of tokens
243 // that are not in the outer-most scope, and that is function parameters
244 // which are split across multiple lines, as illustrated by this example:
245 // double a(int x);
246 // int b(int y,
247 // double z);
248 // In the above example, we need to take special care to ensure that
249 // 'double z' is indented along with it's owning function 'b'.
250 SmallVector<unsigned, 16> ScopeStack;
251
Daniel Jasperec90e512015-12-01 12:00:43 +0000252 for (unsigned i = Start; i != End; ++i) {
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000253 if (ScopeStack.size() != 0 &&
Daniel Jasper4917af62017-08-25 19:14:53 +0000254 Changes[i].indentAndNestingLevel() <
255 Changes[ScopeStack.back()].indentAndNestingLevel())
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000256 ScopeStack.pop_back();
257
Daniel Jasper4917af62017-08-25 19:14:53 +0000258 if (i != Start && Changes[i].indentAndNestingLevel() >
259 Changes[i - 1].indentAndNestingLevel())
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000260 ScopeStack.push_back(i);
261
262 bool InsideNestedScope = ScopeStack.size() != 0;
263
264 if (Changes[i].NewlinesBefore > 0 && !InsideNestedScope) {
Daniel Jasperec90e512015-12-01 12:00:43 +0000265 Shift = 0;
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000266 FoundMatchOnLine = false;
Daniel Jasperec90e512015-12-01 12:00:43 +0000267 }
268
269 // If this is the first matching token to be aligned, remember by how many
270 // spaces it has to be shifted, so the rest of the changes on the line are
271 // shifted by the same amount
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000272 if (!FoundMatchOnLine && !InsideNestedScope && Matches(Changes[i])) {
Daniel Jasperec90e512015-12-01 12:00:43 +0000273 FoundMatchOnLine = true;
274 Shift = Column - Changes[i].StartOfTokenColumn;
275 Changes[i].Spaces += Shift;
276 }
277
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000278 // This is for function parameters that are split across multiple lines,
279 // as mentioned in the ScopeStack comment.
280 if (InsideNestedScope && Changes[i].NewlinesBefore > 0) {
281 unsigned ScopeStart = ScopeStack.back();
282 if (Changes[ScopeStart - 1].Tok->is(TT_FunctionDeclarationName) ||
283 (ScopeStart > Start + 1 &&
284 Changes[ScopeStart - 2].Tok->is(TT_FunctionDeclarationName)))
285 Changes[i].Spaces += Shift;
286 }
287
Daniel Jasperec90e512015-12-01 12:00:43 +0000288 assert(Shift >= 0);
289 Changes[i].StartOfTokenColumn += Shift;
290 if (i + 1 != Changes.size())
291 Changes[i + 1].PreviousEndOfTokenColumn += Shift;
292 }
293}
294
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000295// Walk through a subset of the changes, starting at StartAt, and find
296// sequences of matching tokens to align. To do so, keep track of the lines and
297// whether or not a matching token was found on a line. If a matching token is
298// found, extend the current sequence. If the current line cannot be part of a
299// sequence, e.g. because there is an empty line before it or it contains only
300// non-matching tokens, finalize the previous sequence.
301// The value returned is the token on which we stopped, either because we
302// exhausted all items inside Changes, or because we hit a scope level higher
303// than our initial scope.
304// This function is recursive. Each invocation processes only the scope level
305// equal to the initial level, which is the level of Changes[StartAt].
306// If we encounter a scope level greater than the initial level, then we call
307// ourselves recursively, thereby avoiding the pollution of the current state
308// with the alignment requirements of the nested sub-level. This recursive
309// behavior is necessary for aligning function prototypes that have one or more
310// arguments.
311// If this function encounters a scope level less than the initial level,
312// it returns the current position.
313// There is a non-obvious subtlety in the recursive behavior: Even though we
314// defer processing of nested levels to recursive invocations of this
315// function, when it comes time to align a sequence of tokens, we run the
316// alignment on the entire sequence, including the nested levels.
317// When doing so, most of the nested tokens are skipped, because their
318// alignment was already handled by the recursive invocations of this function.
319// However, the special exception is that we do NOT skip function parameters
320// that are split across multiple lines. See the test case in FormatTest.cpp
321// that mentions "split function parameter alignment" for an example of this.
Daniel Jasperec90e512015-12-01 12:00:43 +0000322template <typename F>
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000323static unsigned AlignTokens(const FormatStyle &Style, F &&Matches,
324 SmallVector<WhitespaceManager::Change, 16> &Changes,
325 unsigned StartAt) {
Daniel Jasperec90e512015-12-01 12:00:43 +0000326 unsigned MinColumn = 0;
327 unsigned MaxColumn = UINT_MAX;
328
329 // Line number of the start and the end of the current token sequence.
330 unsigned StartOfSequence = 0;
331 unsigned EndOfSequence = 0;
332
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000333 // Measure the scope level (i.e. depth of (), [], {}) of the first token, and
334 // abort when we hit any token in a higher scope than the starting one.
Daniel Jasper4917af62017-08-25 19:14:53 +0000335 auto IndentAndNestingLevel = StartAt < Changes.size()
336 ? Changes[StartAt].indentAndNestingLevel()
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000337 : std::pair<unsigned, unsigned>(0, 0);
Daniel Jasperec90e512015-12-01 12:00:43 +0000338
339 // Keep track of the number of commas before the matching tokens, we will only
340 // align a sequence of matching tokens if they are preceded by the same number
341 // of commas.
342 unsigned CommasBeforeLastMatch = 0;
343 unsigned CommasBeforeMatch = 0;
344
345 // Whether a matching token has been found on the current line.
346 bool FoundMatchOnLine = false;
347
348 // Aligns a sequence of matching tokens, on the MinColumn column.
349 //
350 // Sequences start from the first matching token to align, and end at the
351 // first token of the first line that doesn't need to be aligned.
352 //
353 // We need to adjust the StartOfTokenColumn of each Change that is on a line
354 // containing any matching token to be aligned and located after such token.
355 auto AlignCurrentSequence = [&] {
356 if (StartOfSequence > 0 && StartOfSequence < EndOfSequence)
357 AlignTokenSequence(StartOfSequence, EndOfSequence, MinColumn, Matches,
358 Changes);
359 MinColumn = 0;
360 MaxColumn = UINT_MAX;
361 StartOfSequence = 0;
362 EndOfSequence = 0;
363 };
364
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000365 unsigned i = StartAt;
366 for (unsigned e = Changes.size(); i != e; ++i) {
Daniel Jasper4917af62017-08-25 19:14:53 +0000367 if (Changes[i].indentAndNestingLevel() < IndentAndNestingLevel)
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000368 break;
369
Daniel Jasperec90e512015-12-01 12:00:43 +0000370 if (Changes[i].NewlinesBefore != 0) {
371 CommasBeforeMatch = 0;
372 EndOfSequence = i;
373 // If there is a blank line, or if the last line didn't contain any
374 // matching token, the sequence ends here.
375 if (Changes[i].NewlinesBefore > 1 || !FoundMatchOnLine)
376 AlignCurrentSequence();
377
378 FoundMatchOnLine = false;
379 }
380
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000381 if (Changes[i].Tok->is(tok::comma)) {
Daniel Jasperec90e512015-12-01 12:00:43 +0000382 ++CommasBeforeMatch;
Daniel Jasper4917af62017-08-25 19:14:53 +0000383 } else if (Changes[i].indentAndNestingLevel() > IndentAndNestingLevel) {
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000384 // Call AlignTokens recursively, skipping over this scope block.
385 unsigned StoppedAt = AlignTokens(Style, Matches, Changes, i);
386 i = StoppedAt - 1;
387 continue;
Daniel Jasperec90e512015-12-01 12:00:43 +0000388 }
389
390 if (!Matches(Changes[i]))
391 continue;
392
393 // If there is more than one matching token per line, or if the number of
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000394 // preceding commas, do not match anymore, end the sequence.
395 if (FoundMatchOnLine || CommasBeforeMatch != CommasBeforeLastMatch)
Daniel Jasperec90e512015-12-01 12:00:43 +0000396 AlignCurrentSequence();
397
398 CommasBeforeLastMatch = CommasBeforeMatch;
Daniel Jasperec90e512015-12-01 12:00:43 +0000399 FoundMatchOnLine = true;
400
401 if (StartOfSequence == 0)
402 StartOfSequence = i;
403
404 unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn;
405 int LineLengthAfter = -Changes[i].Spaces;
406 for (unsigned j = i; j != e && Changes[j].NewlinesBefore == 0; ++j)
407 LineLengthAfter += Changes[j].Spaces + Changes[j].TokenLength;
408 unsigned ChangeMaxColumn = Style.ColumnLimit - LineLengthAfter;
409
410 // If we are restricted by the maximum column width, end the sequence.
411 if (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn ||
412 CommasBeforeLastMatch != CommasBeforeMatch) {
413 AlignCurrentSequence();
414 StartOfSequence = i;
415 }
416
417 MinColumn = std::max(MinColumn, ChangeMinColumn);
418 MaxColumn = std::min(MaxColumn, ChangeMaxColumn);
419 }
420
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000421 EndOfSequence = i;
Daniel Jasperec90e512015-12-01 12:00:43 +0000422 AlignCurrentSequence();
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000423 return i;
Daniel Jasperec90e512015-12-01 12:00:43 +0000424}
425
Daniel Jaspera44991332015-04-29 13:06:49 +0000426void WhitespaceManager::alignConsecutiveAssignments() {
427 if (!Style.AlignConsecutiveAssignments)
428 return;
429
Daniel Jasperec90e512015-12-01 12:00:43 +0000430 AlignTokens(Style,
431 [&](const Change &C) {
432 // Do not align on equal signs that are first on a line.
433 if (C.NewlinesBefore > 0)
434 return false;
Daniel Jaspera44991332015-04-29 13:06:49 +0000435
Daniel Jasperec90e512015-12-01 12:00:43 +0000436 // Do not align on equal signs that are last on a line.
437 if (&C != &Changes.back() && (&C + 1)->NewlinesBefore > 0)
438 return false;
Daniel Jaspera44991332015-04-29 13:06:49 +0000439
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000440 return C.Tok->is(tok::equal);
Daniel Jasperec90e512015-12-01 12:00:43 +0000441 },
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000442 Changes, /*StartAt=*/0);
Daniel Jaspera44991332015-04-29 13:06:49 +0000443}
444
Daniel Jaspere12597c2015-10-01 10:06:54 +0000445void WhitespaceManager::alignConsecutiveDeclarations() {
446 if (!Style.AlignConsecutiveDeclarations)
447 return;
448
Daniel Jasperec90e512015-12-01 12:00:43 +0000449 // FIXME: Currently we don't handle properly the PointerAlignment: Right
450 // The * and & are not aligned and are left dangling. Something has to be done
451 // about it, but it raises the question of alignment of code like:
452 // const char* const* v1;
453 // float const* v2;
454 // SomeVeryLongType const& v3;
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000455 AlignTokens(Style,
456 [](Change const &C) {
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000457 // tok::kw_operator is necessary for aligning operator overload
458 // definitions.
459 return C.Tok->is(TT_StartOfName) ||
460 C.Tok->is(TT_FunctionDeclarationName) ||
461 C.Tok->is(tok::kw_operator);
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000462 },
Nikola Smiljanic92b397f2017-03-23 02:51:25 +0000463 Changes, /*StartAt=*/0);
Daniel Jaspere12597c2015-10-01 10:06:54 +0000464}
465
Manuel Klimek4fe43002013-05-22 12:51:29 +0000466void WhitespaceManager::alignTrailingComments() {
467 unsigned MinColumn = 0;
468 unsigned MaxColumn = UINT_MAX;
469 unsigned StartOfSequence = 0;
470 bool BreakBeforeNext = false;
471 unsigned Newlines = 0;
472 for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000473 if (Changes[i].StartOfBlockComment)
474 continue;
475 Newlines += Changes[i].NewlinesBefore;
476 if (!Changes[i].IsTrailingComment)
477 continue;
478
Manuel Klimek4fe43002013-05-22 12:51:29 +0000479 unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn;
Krasimir Georgiev4a9c2602017-08-23 07:18:36 +0000480 unsigned ChangeMaxColumn;
481
482 if (Style.ColumnLimit == 0)
483 ChangeMaxColumn = UINT_MAX;
484 else if (Style.ColumnLimit >= Changes[i].TokenLength)
485 ChangeMaxColumn = Style.ColumnLimit - Changes[i].TokenLength;
486 else
487 ChangeMaxColumn = ChangeMinColumn;
Daniel Jasper417fc812016-01-09 15:56:53 +0000488
489 // If we don't create a replacement for this change, we have to consider
490 // it to be immovable.
491 if (!Changes[i].CreateReplacement)
492 ChangeMaxColumn = ChangeMinColumn;
493
Daniel Jasper66935022014-04-27 10:03:19 +0000494 if (i + 1 != e && Changes[i + 1].ContinuesPPDirective)
495 ChangeMaxColumn -= 2;
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000496 // If this comment follows an } in column 0, it probably documents the
497 // closing of a namespace and we don't want to align it.
498 bool FollowsRBraceInColumn0 = i > 0 && Changes[i].NewlinesBefore == 0 &&
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000499 Changes[i - 1].Tok->is(tok::r_brace) &&
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000500 Changes[i - 1].StartOfTokenColumn == 0;
501 bool WasAlignedWithStartOfNextLine = false;
502 if (Changes[i].NewlinesBefore == 1) { // A comment on its own line.
Daniel Jasper49532102015-01-07 14:00:11 +0000503 unsigned CommentColumn = SourceMgr.getSpellingColumnNumber(
504 Changes[i].OriginalWhitespaceRange.getEnd());
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000505 for (unsigned j = i + 1; j != e; ++j) {
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000506 if (Changes[j].Tok->is(tok::comment))
Daniel Jasperbb37a2f2016-02-01 11:20:55 +0000507 continue;
508
509 unsigned NextColumn = SourceMgr.getSpellingColumnNumber(
510 Changes[j].OriginalWhitespaceRange.getEnd());
511 // The start of the next token was previously aligned with the
512 // start of this comment.
513 WasAlignedWithStartOfNextLine =
514 CommentColumn == NextColumn ||
515 CommentColumn == NextColumn + Style.IndentWidth;
516 break;
Daniel Jasper0e93cdb2013-11-08 23:31:14 +0000517 }
Manuel Klimek4fe43002013-05-22 12:51:29 +0000518 }
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000519 if (!Style.AlignTrailingComments || FollowsRBraceInColumn0) {
520 alignTrailingComments(StartOfSequence, i, MinColumn);
521 MinColumn = ChangeMinColumn;
522 MaxColumn = ChangeMinColumn;
523 StartOfSequence = i;
524 } else if (BreakBeforeNext || Newlines > 1 ||
525 (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn) ||
526 // Break the comment sequence if the previous line did not end
527 // in a trailing comment.
528 (Changes[i].NewlinesBefore == 1 && i > 0 &&
529 !Changes[i - 1].IsTrailingComment) ||
530 WasAlignedWithStartOfNextLine) {
531 alignTrailingComments(StartOfSequence, i, MinColumn);
532 MinColumn = ChangeMinColumn;
533 MaxColumn = ChangeMaxColumn;
534 StartOfSequence = i;
535 } else {
536 MinColumn = std::max(MinColumn, ChangeMinColumn);
537 MaxColumn = std::min(MaxColumn, ChangeMaxColumn);
538 }
539 BreakBeforeNext =
540 (i == 0) || (Changes[i].NewlinesBefore > 1) ||
541 // Never start a sequence with a comment at the beginning of
542 // the line.
543 (Changes[i].NewlinesBefore == 1 && StartOfSequence == i);
544 Newlines = 0;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000545 }
546 alignTrailingComments(StartOfSequence, Changes.size(), MinColumn);
547}
548
549void WhitespaceManager::alignTrailingComments(unsigned Start, unsigned End,
550 unsigned Column) {
551 for (unsigned i = Start; i != End; ++i) {
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000552 int Shift = 0;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000553 if (Changes[i].IsTrailingComment) {
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000554 Shift = Column - Changes[i].StartOfTokenColumn;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000555 }
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000556 if (Changes[i].StartOfBlockComment) {
557 Shift = Changes[i].IndentationOffset +
558 Changes[i].StartOfBlockComment->StartOfTokenColumn -
559 Changes[i].StartOfTokenColumn;
560 }
561 assert(Shift >= 0);
562 Changes[i].Spaces += Shift;
Andi-Bogdan Postelnicua9a8fde2016-10-26 07:44:51 +0000563 if (i + 1 != Changes.size())
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000564 Changes[i + 1].PreviousEndOfTokenColumn += Shift;
565 Changes[i].StartOfTokenColumn += Shift;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000566 }
567}
568
569void WhitespaceManager::alignEscapedNewlines() {
Daniel Jasper7fdbb3f2017-05-08 15:08:00 +0000570 if (Style.AlignEscapedNewlines == FormatStyle::ENAS_DontAlign)
571 return;
572
573 bool AlignLeft = Style.AlignEscapedNewlines == FormatStyle::ENAS_Left;
574 unsigned MaxEndOfLine = AlignLeft ? 0 : Style.ColumnLimit;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000575 unsigned StartOfMacro = 0;
576 for (unsigned i = 1, e = Changes.size(); i < e; ++i) {
577 Change &C = Changes[i];
578 if (C.NewlinesBefore > 0) {
579 if (C.ContinuesPPDirective) {
Daniel Jaspera49393f2013-08-28 09:07:32 +0000580 MaxEndOfLine = std::max(C.PreviousEndOfTokenColumn + 2, MaxEndOfLine);
Manuel Klimek4fe43002013-05-22 12:51:29 +0000581 } else {
582 alignEscapedNewlines(StartOfMacro + 1, i, MaxEndOfLine);
Daniel Jasper7fdbb3f2017-05-08 15:08:00 +0000583 MaxEndOfLine = AlignLeft ? 0 : Style.ColumnLimit;
Manuel Klimek4fe43002013-05-22 12:51:29 +0000584 StartOfMacro = i;
585 }
586 }
587 }
588 alignEscapedNewlines(StartOfMacro + 1, Changes.size(), MaxEndOfLine);
589}
590
591void WhitespaceManager::alignEscapedNewlines(unsigned Start, unsigned End,
592 unsigned Column) {
593 for (unsigned i = Start; i < End; ++i) {
594 Change &C = Changes[i];
595 if (C.NewlinesBefore > 0) {
596 assert(C.ContinuesPPDirective);
597 if (C.PreviousEndOfTokenColumn + 1 > Column)
598 C.EscapedNewlineColumn = 0;
599 else
600 C.EscapedNewlineColumn = Column;
601 }
602 }
603}
604
605void WhitespaceManager::generateChanges() {
606 for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
607 const Change &C = Changes[i];
Daniel Jasper47b35ae2015-01-29 10:47:14 +0000608 if (i > 0) {
609 assert(Changes[i - 1].OriginalWhitespaceRange.getBegin() !=
610 C.OriginalWhitespaceRange.getBegin() &&
611 "Generating two replacements for the same location");
612 }
Manuel Klimek4fe43002013-05-22 12:51:29 +0000613 if (C.CreateReplacement) {
Alexander Kornienko9e649af2013-09-11 12:25:57 +0000614 std::string ReplacementText = C.PreviousLinePostfix;
615 if (C.ContinuesPPDirective)
Jacob Bandes-Storchd6a7e982017-08-10 00:15:31 +0000616 appendEscapedNewlineText(ReplacementText, C.NewlinesBefore,
617 C.PreviousEndOfTokenColumn,
618 C.EscapedNewlineColumn);
Alexander Kornienko9e649af2013-09-11 12:25:57 +0000619 else
620 appendNewlineText(ReplacementText, C.NewlinesBefore);
Daniel Jasper7d42f3f2017-01-31 11:25:01 +0000621 appendIndentText(ReplacementText, C.Tok->IndentLevel,
622 std::max(0, C.Spaces),
Alexander Kornienko67d9c8c2014-04-17 16:12:46 +0000623 C.StartOfTokenColumn - std::max(0, C.Spaces));
Alexander Kornienko9e649af2013-09-11 12:25:57 +0000624 ReplacementText.append(C.CurrentLinePrefix);
Manuel Klimek4fe43002013-05-22 12:51:29 +0000625 storeReplacement(C.OriginalWhitespaceRange, ReplacementText);
626 }
627 }
628}
629
Manuel Klimek89628f62017-09-20 09:51:03 +0000630void WhitespaceManager::storeReplacement(SourceRange Range, StringRef Text) {
Manuel Klimek4fe43002013-05-22 12:51:29 +0000631 unsigned WhitespaceLength = SourceMgr.getFileOffset(Range.getEnd()) -
632 SourceMgr.getFileOffset(Range.getBegin());
633 // Don't create a replacement, if it does not change anything.
634 if (StringRef(SourceMgr.getCharacterData(Range.getBegin()),
Daniel Jasper3ac9b9e2013-07-08 14:34:09 +0000635 WhitespaceLength) == Text)
Manuel Klimek4fe43002013-05-22 12:51:29 +0000636 return;
Eric Liu40ef2fb2016-08-01 10:16:37 +0000637 auto Err = Replaces.add(tooling::Replacement(
Manuel Klimek4fe43002013-05-22 12:51:29 +0000638 SourceMgr, CharSourceRange::getCharRange(Range), Text));
Eric Liu40ef2fb2016-08-01 10:16:37 +0000639 // FIXME: better error handling. For now, just print an error message in the
640 // release version.
Piotr Padlewski1ec383c2016-12-23 11:40:44 +0000641 if (Err) {
Eric Liu40ef2fb2016-08-01 10:16:37 +0000642 llvm::errs() << llvm::toString(std::move(Err)) << "\n";
Piotr Padlewski1ec383c2016-12-23 11:40:44 +0000643 assert(false);
644 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000645}
646
Alexander Kornienko9e649af2013-09-11 12:25:57 +0000647void WhitespaceManager::appendNewlineText(std::string &Text,
648 unsigned Newlines) {
649 for (unsigned i = 0; i < Newlines; ++i)
650 Text.append(UseCRLF ? "\r\n" : "\n");
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000651}
652
Manuel Klimek89628f62017-09-20 09:51:03 +0000653void WhitespaceManager::appendEscapedNewlineText(
654 std::string &Text, unsigned Newlines, unsigned PreviousEndOfTokenColumn,
655 unsigned EscapedNewlineColumn) {
Alexander Kornienko555efc32013-06-11 16:01:49 +0000656 if (Newlines > 0) {
Jacob Bandes-Storchd6a7e982017-08-10 00:15:31 +0000657 unsigned Spaces =
658 std::max<int>(1, EscapedNewlineColumn - PreviousEndOfTokenColumn - 1);
Alexander Kornienko555efc32013-06-11 16:01:49 +0000659 for (unsigned i = 0; i < Newlines; ++i) {
Jacob Bandes-Storchd6a7e982017-08-10 00:15:31 +0000660 Text.append(Spaces, ' ');
Alexander Kornienko9e649af2013-09-11 12:25:57 +0000661 Text.append(UseCRLF ? "\\\r\n" : "\\\n");
Jacob Bandes-Storchd6a7e982017-08-10 00:15:31 +0000662 Spaces = std::max<int>(0, EscapedNewlineColumn - 1);
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000663 }
664 }
Manuel Klimekb9eae4c2013-05-13 09:22:11 +0000665}
666
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000667void WhitespaceManager::appendIndentText(std::string &Text,
668 unsigned IndentLevel, unsigned Spaces,
Alexander Kornienkodb4c21f2013-09-27 09:45:40 +0000669 unsigned WhitespaceStartColumn) {
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000670 switch (Style.UseTab) {
671 case FormatStyle::UT_Never:
Benjamin Kramerddf1cda2015-05-28 19:55:49 +0000672 Text.append(Spaces, ' ');
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000673 break;
674 case FormatStyle::UT_Always: {
Alexander Kornienkodb4c21f2013-09-27 09:45:40 +0000675 unsigned FirstTabWidth =
676 Style.TabWidth - WhitespaceStartColumn % Style.TabWidth;
677 // Indent with tabs only when there's at least one full tab.
678 if (FirstTabWidth + Style.TabWidth <= Spaces) {
679 Spaces -= FirstTabWidth;
680 Text.append("\t");
681 }
Benjamin Kramerddf1cda2015-05-28 19:55:49 +0000682 Text.append(Spaces / Style.TabWidth, '\t');
683 Text.append(Spaces % Style.TabWidth, ' ');
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000684 break;
685 }
686 case FormatStyle::UT_ForIndentation:
687 if (WhitespaceStartColumn == 0) {
688 unsigned Indentation = IndentLevel * Style.IndentWidth;
Alexander Kornienko45dc1b22013-09-27 16:40:11 +0000689 // This happens, e.g. when a line in a block comment is indented less than
690 // the first one.
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000691 if (Indentation > Spaces)
692 Indentation = Spaces;
693 unsigned Tabs = Indentation / Style.TabWidth;
Benjamin Kramerddf1cda2015-05-28 19:55:49 +0000694 Text.append(Tabs, '\t');
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000695 Spaces -= Tabs * Style.TabWidth;
696 }
Benjamin Kramerddf1cda2015-05-28 19:55:49 +0000697 Text.append(Spaces, ' ');
Alexander Kornienko3c3d09c2013-09-27 16:14:22 +0000698 break;
Marianne Mailhot-Sarrasin51fe2792016-04-14 14:52:26 +0000699 case FormatStyle::UT_ForContinuationAndIndentation:
700 if (WhitespaceStartColumn == 0) {
701 unsigned Tabs = Spaces / Style.TabWidth;
702 Text.append(Tabs, '\t');
703 Spaces -= Tabs * Style.TabWidth;
704 }
705 Text.append(Spaces, ' ');
706 break;
Alexander Kornienko9e649af2013-09-11 12:25:57 +0000707 }
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000708}
709
Alexander Kornienkocb45bc12013-04-15 14:28:00 +0000710} // namespace format
711} // namespace clang