Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 1 | //===--- WhitespaceManager.cpp - Format C++ code --------------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | /// |
| 10 | /// \file |
| 11 | /// \brief This file implements the WhitespaceManager class. |
| 12 | /// |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #include "WhitespaceManager.h" |
| 16 | #include "llvm/ADT/STLExtras.h" |
| 17 | |
| 18 | namespace clang { |
| 19 | namespace format { |
| 20 | |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 21 | bool |
| 22 | WhitespaceManager::Change::IsBeforeInFile::operator()(const Change &C1, |
| 23 | const Change &C2) const { |
| 24 | return SourceMgr.isBeforeInTranslationUnit( |
| 25 | C1.OriginalWhitespaceRange.getBegin(), |
| 26 | C2.OriginalWhitespaceRange.getBegin()); |
| 27 | } |
Daniel Jasper | 2972d04 | 2013-04-25 08:56:26 +0000 | [diff] [blame] | 28 | |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 29 | WhitespaceManager::Change::Change( |
| 30 | bool CreateReplacement, const SourceRange &OriginalWhitespaceRange, |
| 31 | unsigned Spaces, unsigned StartOfTokenColumn, unsigned NewlinesBefore, |
| 32 | StringRef PreviousLinePostfix, StringRef CurrentLinePrefix, |
| 33 | tok::TokenKind Kind, bool ContinuesPPDirective) |
| 34 | : CreateReplacement(CreateReplacement), |
| 35 | OriginalWhitespaceRange(OriginalWhitespaceRange), |
| 36 | StartOfTokenColumn(StartOfTokenColumn), NewlinesBefore(NewlinesBefore), |
| 37 | PreviousLinePostfix(PreviousLinePostfix), |
| 38 | CurrentLinePrefix(CurrentLinePrefix), Kind(Kind), |
| 39 | ContinuesPPDirective(ContinuesPPDirective), Spaces(Spaces) {} |
| 40 | |
Manuel Klimek | b398701 | 2013-05-29 14:47:47 +0000 | [diff] [blame] | 41 | void WhitespaceManager::replaceWhitespace(const FormatToken &Tok, |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 42 | unsigned Newlines, unsigned Spaces, |
| 43 | unsigned StartOfTokenColumn, |
| 44 | bool InPPDirective) { |
Manuel Klimek | dcb3f2a | 2013-05-28 13:42:28 +0000 | [diff] [blame] | 45 | Changes.push_back( |
Manuel Klimek | b398701 | 2013-05-29 14:47:47 +0000 | [diff] [blame] | 46 | Change(true, Tok.WhitespaceRange, Spaces, StartOfTokenColumn, Newlines, |
| 47 | "", "", Tok.Tok.getKind(), InPPDirective && !Tok.IsFirst)); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 48 | } |
| 49 | |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 50 | void WhitespaceManager::addUntouchableToken(const FormatToken &Tok, |
| 51 | bool InPPDirective) { |
Manuel Klimek | ad3094b | 2013-05-23 10:56:37 +0000 | [diff] [blame] | 52 | Changes.push_back( |
| 53 | Change(false, Tok.WhitespaceRange, /*Spaces=*/0, |
| 54 | SourceMgr.getSpellingColumnNumber(Tok.Tok.getLocation()) - 1, |
| 55 | Tok.NewlinesBefore, "", "", Tok.Tok.getKind(), |
| 56 | InPPDirective && !Tok.IsFirst)); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 57 | } |
| 58 | |
| 59 | void WhitespaceManager::breakToken(const FormatToken &Tok, unsigned Offset, |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 60 | unsigned ReplaceChars, |
| 61 | StringRef PreviousPostfix, |
| 62 | StringRef CurrentPrefix, bool InPPDirective, |
| 63 | unsigned Spaces) { |
| 64 | Changes.push_back(Change( |
| 65 | true, SourceRange(Tok.getStartOfNonWhitespace().getLocWithOffset(Offset), |
| 66 | Tok.getStartOfNonWhitespace().getLocWithOffset( |
| 67 | Offset + ReplaceChars)), |
| 68 | Spaces, Spaces, 1, PreviousPostfix, CurrentPrefix, |
| 69 | // FIXME: Unify token adjustment, so we don't split it between |
| 70 | // BreakableToken and the WhitespaceManager. That would also allow us to |
| 71 | // correctly store a tok::TokenKind instead of rolling our own enum. |
| 72 | tok::unknown, InPPDirective && !Tok.IsFirst)); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 73 | } |
| 74 | |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 75 | const tooling::Replacements &WhitespaceManager::generateReplacements() { |
| 76 | if (Changes.empty()) |
| 77 | return Replaces; |
| 78 | |
| 79 | std::sort(Changes.begin(), Changes.end(), Change::IsBeforeInFile(SourceMgr)); |
| 80 | calculateLineBreakInformation(); |
| 81 | alignTrailingComments(); |
| 82 | alignEscapedNewlines(); |
| 83 | generateChanges(); |
| 84 | |
| 85 | return Replaces; |
| 86 | } |
| 87 | |
| 88 | void WhitespaceManager::calculateLineBreakInformation() { |
| 89 | Changes[0].PreviousEndOfTokenColumn = 0; |
| 90 | for (unsigned i = 1, e = Changes.size(); i != e; ++i) { |
| 91 | unsigned OriginalWhitespaceStart = |
| 92 | SourceMgr.getFileOffset(Changes[i].OriginalWhitespaceRange.getBegin()); |
| 93 | unsigned PreviousOriginalWhitespaceEnd = SourceMgr.getFileOffset( |
| 94 | Changes[i - 1].OriginalWhitespaceRange.getEnd()); |
| 95 | Changes[i - 1].TokenLength = |
| 96 | OriginalWhitespaceStart - PreviousOriginalWhitespaceEnd + |
| 97 | Changes[i].PreviousLinePostfix.size() + |
| 98 | Changes[i - 1].CurrentLinePrefix.size(); |
| 99 | |
| 100 | Changes[i].PreviousEndOfTokenColumn = |
| 101 | Changes[i - 1].StartOfTokenColumn + Changes[i - 1].TokenLength; |
| 102 | |
| 103 | Changes[i - 1].IsTrailingComment = |
| 104 | (Changes[i].NewlinesBefore > 0 || Changes[i].Kind == tok::eof) && |
| 105 | Changes[i - 1].Kind == tok::comment; |
| 106 | } |
Manuel Klimek | 0cd57b5 | 2013-05-22 14:01:08 +0000 | [diff] [blame] | 107 | // FIXME: The last token is currently not always an eof token; in those |
| 108 | // cases, setting TokenLength of the last token to 0 is wrong. |
| 109 | Changes.back().TokenLength = 0; |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 110 | Changes.back().IsTrailingComment = Changes.back().Kind == tok::comment; |
| 111 | } |
| 112 | |
| 113 | void WhitespaceManager::alignTrailingComments() { |
| 114 | unsigned MinColumn = 0; |
| 115 | unsigned MaxColumn = UINT_MAX; |
| 116 | unsigned StartOfSequence = 0; |
| 117 | bool BreakBeforeNext = false; |
| 118 | unsigned Newlines = 0; |
| 119 | for (unsigned i = 0, e = Changes.size(); i != e; ++i) { |
| 120 | unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn; |
| 121 | // FIXME: Correctly handle ChangeMaxColumn in PP directives. |
| 122 | unsigned ChangeMaxColumn = Style.ColumnLimit - Changes[i].TokenLength; |
| 123 | Newlines += Changes[i].NewlinesBefore; |
| 124 | if (Changes[i].IsTrailingComment) { |
Manuel Klimek | ebfb88c | 2013-05-23 11:42:52 +0000 | [diff] [blame] | 125 | bool WasAlignedWithStartOfNextLine = |
| 126 | // A comment on its own line. |
| 127 | Changes[i].NewlinesBefore == 1 && |
| 128 | // Not the last line. |
| 129 | i + 1 != e && |
| 130 | // The start of the next token was previously aligned with |
| 131 | // the start of this comment. |
| 132 | (SourceMgr.getSpellingColumnNumber( |
| 133 | Changes[i].OriginalWhitespaceRange.getEnd()) == |
| 134 | SourceMgr.getSpellingColumnNumber( |
| 135 | Changes[i + 1].OriginalWhitespaceRange.getEnd())) && |
| 136 | // Which is not a comment itself. |
| 137 | Changes[i + 1].Kind != tok::comment; |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 138 | if (BreakBeforeNext || Newlines > 1 || |
| 139 | (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn) || |
| 140 | // Break the comment sequence if the previous line did not end |
| 141 | // in a trailing comment. |
| 142 | (Changes[i].NewlinesBefore == 1 && i > 0 && |
Manuel Klimek | ebfb88c | 2013-05-23 11:42:52 +0000 | [diff] [blame] | 143 | !Changes[i - 1].IsTrailingComment) || |
| 144 | WasAlignedWithStartOfNextLine) { |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 145 | alignTrailingComments(StartOfSequence, i, MinColumn); |
| 146 | MinColumn = ChangeMinColumn; |
| 147 | MaxColumn = ChangeMaxColumn; |
| 148 | StartOfSequence = i; |
| 149 | } else { |
| 150 | MinColumn = std::max(MinColumn, ChangeMinColumn); |
| 151 | MaxColumn = std::min(MaxColumn, ChangeMaxColumn); |
| 152 | } |
Manuel Klimek | 854ca79 | 2013-05-23 20:46:07 +0000 | [diff] [blame] | 153 | BreakBeforeNext = |
| 154 | (i == 0) || (Changes[i].NewlinesBefore > 1) || |
| 155 | // Never start a sequence with a comment at the beginning of |
| 156 | // the line. |
| 157 | (Changes[i].NewlinesBefore == 1 && StartOfSequence == i); |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 158 | Newlines = 0; |
| 159 | } |
| 160 | } |
| 161 | alignTrailingComments(StartOfSequence, Changes.size(), MinColumn); |
| 162 | } |
| 163 | |
| 164 | void WhitespaceManager::alignTrailingComments(unsigned Start, unsigned End, |
| 165 | unsigned Column) { |
| 166 | for (unsigned i = Start; i != End; ++i) { |
| 167 | if (Changes[i].IsTrailingComment) { |
| 168 | assert(Column >= Changes[i].StartOfTokenColumn); |
| 169 | Changes[i].Spaces += Column - Changes[i].StartOfTokenColumn; |
| 170 | Changes[i].StartOfTokenColumn = Column; |
| 171 | } |
| 172 | } |
| 173 | } |
| 174 | |
| 175 | void WhitespaceManager::alignEscapedNewlines() { |
| 176 | unsigned MaxEndOfLine = 0; |
| 177 | unsigned StartOfMacro = 0; |
| 178 | for (unsigned i = 1, e = Changes.size(); i < e; ++i) { |
| 179 | Change &C = Changes[i]; |
| 180 | if (C.NewlinesBefore > 0) { |
| 181 | if (C.ContinuesPPDirective) { |
| 182 | if (Style.AlignEscapedNewlinesLeft) |
| 183 | MaxEndOfLine = std::max(C.PreviousEndOfTokenColumn + 2, MaxEndOfLine); |
| 184 | else |
| 185 | MaxEndOfLine = Style.ColumnLimit; |
| 186 | } else { |
| 187 | alignEscapedNewlines(StartOfMacro + 1, i, MaxEndOfLine); |
| 188 | MaxEndOfLine = 0; |
| 189 | StartOfMacro = i; |
| 190 | } |
| 191 | } |
| 192 | } |
| 193 | alignEscapedNewlines(StartOfMacro + 1, Changes.size(), MaxEndOfLine); |
| 194 | } |
| 195 | |
| 196 | void WhitespaceManager::alignEscapedNewlines(unsigned Start, unsigned End, |
| 197 | unsigned Column) { |
| 198 | for (unsigned i = Start; i < End; ++i) { |
| 199 | Change &C = Changes[i]; |
| 200 | if (C.NewlinesBefore > 0) { |
| 201 | assert(C.ContinuesPPDirective); |
| 202 | if (C.PreviousEndOfTokenColumn + 1 > Column) |
| 203 | C.EscapedNewlineColumn = 0; |
| 204 | else |
| 205 | C.EscapedNewlineColumn = Column; |
| 206 | } |
| 207 | } |
| 208 | } |
| 209 | |
| 210 | void WhitespaceManager::generateChanges() { |
| 211 | for (unsigned i = 0, e = Changes.size(); i != e; ++i) { |
| 212 | const Change &C = Changes[i]; |
| 213 | if (C.CreateReplacement) { |
| 214 | std::string ReplacementText = |
| 215 | C.PreviousLinePostfix + |
| 216 | (C.ContinuesPPDirective |
| 217 | ? getNewLineText(C.NewlinesBefore, C.Spaces, |
| 218 | C.PreviousEndOfTokenColumn, |
| 219 | C.EscapedNewlineColumn) |
| 220 | : getNewLineText(C.NewlinesBefore, C.Spaces)) + |
| 221 | C.CurrentLinePrefix; |
| 222 | storeReplacement(C.OriginalWhitespaceRange, ReplacementText); |
| 223 | } |
| 224 | } |
| 225 | } |
| 226 | |
| 227 | void WhitespaceManager::storeReplacement(const SourceRange &Range, |
| 228 | StringRef Text) { |
| 229 | unsigned WhitespaceLength = SourceMgr.getFileOffset(Range.getEnd()) - |
| 230 | SourceMgr.getFileOffset(Range.getBegin()); |
| 231 | // Don't create a replacement, if it does not change anything. |
| 232 | if (StringRef(SourceMgr.getCharacterData(Range.getBegin()), |
| 233 | WhitespaceLength) == |
| 234 | Text) |
| 235 | return; |
| 236 | Replaces.insert(tooling::Replacement( |
| 237 | SourceMgr, CharSourceRange::getCharRange(Range), Text)); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 238 | } |
| 239 | |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 240 | std::string WhitespaceManager::getNewLineText(unsigned NewLines, |
| 241 | unsigned Spaces) { |
Manuel Klimek | 7c9a93e | 2013-05-13 09:22:11 +0000 | [diff] [blame] | 242 | return std::string(NewLines, '\n') + getIndentText(Spaces); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 243 | } |
| 244 | |
| 245 | std::string WhitespaceManager::getNewLineText(unsigned NewLines, |
| 246 | unsigned Spaces, |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 247 | unsigned PreviousEndOfTokenColumn, |
Daniel Jasper | 2972d04 | 2013-04-25 08:56:26 +0000 | [diff] [blame] | 248 | unsigned EscapedNewlineColumn) { |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 249 | std::string NewLineText; |
| 250 | if (NewLines > 0) { |
| 251 | unsigned Offset = |
Manuel Klimek | e573c3f | 2013-05-22 12:51:29 +0000 | [diff] [blame] | 252 | std::min<int>(EscapedNewlineColumn - 1, PreviousEndOfTokenColumn); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 253 | for (unsigned i = 0; i < NewLines; ++i) { |
Daniel Jasper | 2972d04 | 2013-04-25 08:56:26 +0000 | [diff] [blame] | 254 | NewLineText += std::string(EscapedNewlineColumn - Offset - 1, ' '); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 255 | NewLineText += "\\\n"; |
| 256 | Offset = 0; |
| 257 | } |
| 258 | } |
Manuel Klimek | 7c9a93e | 2013-05-13 09:22:11 +0000 | [diff] [blame] | 259 | return NewLineText + getIndentText(Spaces); |
| 260 | } |
| 261 | |
| 262 | std::string WhitespaceManager::getIndentText(unsigned Spaces) { |
Manuel Klimek | 967d9e9 | 2013-05-13 12:53:04 +0000 | [diff] [blame] | 263 | if (!Style.UseTab) |
Manuel Klimek | 7c9a93e | 2013-05-13 09:22:11 +0000 | [diff] [blame] | 264 | return std::string(Spaces, ' '); |
Manuel Klimek | 967d9e9 | 2013-05-13 12:53:04 +0000 | [diff] [blame] | 265 | |
Manuel Klimek | 7c9a93e | 2013-05-13 09:22:11 +0000 | [diff] [blame] | 266 | return std::string(Spaces / Style.IndentWidth, '\t') + |
| 267 | std::string(Spaces % Style.IndentWidth, ' '); |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 268 | } |
| 269 | |
Alexander Kornienko | 70ce788 | 2013-04-15 14:28:00 +0000 | [diff] [blame] | 270 | } // namespace format |
| 271 | } // namespace clang |