Blame - clang/lib/Format/BreakableToken.cpp - toolchain/llvm-project

2013-04-15 14:28:00 +0000

[diff] [blame]

1

//===--- BreakableToken.cpp - Format C++ code -----------------------------===//

2

//

3

// The LLVM Compiler Infrastructure

4

//

5

// This file is distributed under the University of Illinois Open Source

6

// License. See LICENSE.TXT for details.

7

//

8

//===----------------------------------------------------------------------===//

9

///

10

/// \file

11

/// \brief Contains implementation of BreakableToken class and classes derived

12

/// from it.

13

///

14

//===----------------------------------------------------------------------===//

15

16

#include "BreakableToken.h"

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

17

#include "ContinuationIndenter.h"

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

18

#include "clang/Basic/CharInfo.h"

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

19

#include "clang/Format/Format.h"

Alexander Kornienko

2013-04-17 17:34:05 +0000

[diff] [blame]

20

#include "llvm/ADT/STLExtras.h"

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

21

#include "llvm/Support/Debug.h"

Alexander Kornienko

2013-04-15 14:28:00 +0000

[diff] [blame]

22

#include <algorithm>

23

Chandler Carruth

1034666

2014-04-22 03:17:02 +0000

[diff] [blame]

24

#define DEBUG_TYPE "format-token-breaker"

25

Alexander Kornienko

2013-04-15 14:28:00 +0000

[diff] [blame]

namespace clang {

namespace format {

Daniel Jasper

2013-10-30 07:36:40 +0000

[diff] [blame]

29

// Characters treated as horizontal whitespace when splitting and trimming
// comment text. Note that '\n' is deliberately not part of this set.
static const char *const Blanks = " \t\v\f\r";

Alexander Kornienko

2013-06-20 13:58:37 +0000

[diff] [blame]

30

/// Returns true if \p C is one of the blank characters: space, horizontal
/// tab, vertical tab, form feed or carriage return. A line feed is not
/// considered blank.
static bool IsBlank(char C) {
  switch (C) {
  case ' ':
  case '\t':
  case '\v':
  case '\f':
  case '\r':
    return true;
  default:
    return false;
  }
}

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

43

/// Returns the longest line-comment prefix of \p Comment.
///
/// A prefix is one of the known markers ("//", "///", "//!") followed by all
/// the spaces that directly follow the marker. If \p Comment starts with none
/// of the known markers, an empty StringRef is returned.
static StringRef getLineCommentIndentPrefix(StringRef Comment) {
  static const char *const KnownPrefixes[] = {"///", "//", "//!"};
  StringRef LongestPrefix;
  for (StringRef KnownPrefix : KnownPrefixes) {
    if (Comment.startswith(KnownPrefix)) {
      // Extend the marker over the run of spaces that follows it.
      size_t PrefixLength = KnownPrefix.size();
      while (PrefixLength < Comment.size() && Comment[PrefixLength] == ' ')
        ++PrefixLength;
      // Several markers can match (e.g. "//" and "///"); keep the longest.
      if (PrefixLength > LongestPrefix.size())
        LongestPrefix = Comment.substr(0, PrefixLength);
    }
  }
  return LongestPrefix;
}

57

Craig Topper

bfb5c40

2013-07-01 03:38:29 +0000

[diff] [blame]

58

/// Computes where to break comment text so that it fits the column limit.
///
/// \param Text the comment content to split.
/// \param ContentStartColumn the column at which \p Text starts.
/// \param ColumnLimit the column limit to respect.
/// \param TabWidth the tab width used to compute column widths.
/// \param Encoding the encoding used to decode code points of \p Text.
///
/// \returns a Split whose first member is the length of the text before the
/// cut (with trailing blanks trimmed) and whose second member is the number
/// of blank bytes between the two pieces, or Split(StringRef::npos, 0) if no
/// suitable split point exists.
static BreakableToken::Split getCommentSplit(StringRef Text,
                                             unsigned ContentStartColumn,
                                             unsigned ColumnLimit,
                                             unsigned TabWidth,
                                             encoding::Encoding Encoding) {
  if (ColumnLimit <= ContentStartColumn + 1)
    return BreakableToken::Split(StringRef::npos, 0);

  unsigned MaxSplit = ColumnLimit - ContentStartColumn + 1;
  unsigned MaxSplitBytes = 0;

  // Translate the column budget (MaxSplit) into a byte offset (MaxSplitBytes).
  for (unsigned NumChars = 0;
       NumChars < MaxSplit && MaxSplitBytes < Text.size();) {
    unsigned BytesInChar =
        encoding::getCodePointNumBytes(Text[MaxSplitBytes], Encoding);
    // Measure each code point at the column it actually lands on, so that
    // tabs expand to the correct width (same approach as getStringSplit).
    NumChars += encoding::columnWidthWithTabs(
        Text.substr(MaxSplitBytes, BytesInChar), ContentStartColumn + NumChars,
        TabWidth, Encoding);
    MaxSplitBytes += BytesInChar;
  }

  StringRef::size_type SpaceOffset = Text.find_last_of(Blanks, MaxSplitBytes);
  if (SpaceOffset == StringRef::npos ||
      // Don't break at leading whitespace.
      Text.find_last_not_of(Blanks, SpaceOffset) == StringRef::npos) {
    // Make sure that we don't break at leading whitespace that
    // reaches past MaxSplit.
    StringRef::size_type FirstNonWhitespace = Text.find_first_not_of(Blanks);
    if (FirstNonWhitespace == StringRef::npos)
      // If the comment is only whitespace, we cannot split.
      return BreakableToken::Split(StringRef::npos, 0);
    // No usable blank within the limit: take the first blank after it.
    SpaceOffset = Text.find_first_of(
        Blanks, std::max<unsigned>(MaxSplitBytes, FirstNonWhitespace));
  }
  if (SpaceOffset != StringRef::npos && SpaceOffset != 0) {
    StringRef BeforeCut = Text.substr(0, SpaceOffset).rtrim(Blanks);
    StringRef AfterCut = Text.substr(SpaceOffset).ltrim(Blanks);
    return BreakableToken::Split(BeforeCut.size(),
                                 AfterCut.begin() - BeforeCut.end());
  }
  return BreakableToken::Split(StringRef::npos, 0);
}

100

Daniel Jasper

b05a81d

2014-05-09 13:11:16 +0000

[diff] [blame]

101

/// Computes where to break string-literal text so that it fits the limit.
///
/// \param Text the string content to split.
/// \param UsedColumns the number of columns already used on the line.
/// \param ColumnLimit the column limit to respect.
/// \param TabWidth the tab width used to compute column widths.
/// \param Encoding the encoding used to decode code points of \p Text.
///
/// The text is scanned up to the last position that still fits. Among the
/// positions seen, the split is placed (in order of preference) after the
/// last blank, after the last '/', after the last single-byte
/// non-alphanumeric character, or at the last position that fits.
///
/// \returns Split(Offset, 0), or Split(StringRef::npos, 0) if the text is
/// empty, no columns are available, or no split point was found.
static BreakableToken::Split
getStringSplit(StringRef Text, unsigned UsedColumns, unsigned ColumnLimit,
               unsigned TabWidth, encoding::Encoding Encoding) {
  // FIXME: Reduce unit test case.
  if (Text.empty())
    return BreakableToken::Split(StringRef::npos, 0);
  if (ColumnLimit <= UsedColumns)
    return BreakableToken::Split(StringRef::npos, 0);
  unsigned MaxSplit = ColumnLimit - UsedColumns;
  StringRef::size_type SpaceOffset = 0;
  StringRef::size_type SlashOffset = 0;
  StringRef::size_type WordStartOffset = 0;
  StringRef::size_type SplitPoint = 0;
  for (unsigned Chars = 0;;) {
    unsigned Advance;
    if (Text[0] == '\\') {
      // Escape sequences are never split; they count one column per byte.
      Advance = encoding::getEscapeSequenceLength(Text);
      Chars += Advance;
    } else {
      Advance = encoding::getCodePointNumBytes(Text[0], Encoding);
      Chars += encoding::columnWidthWithTabs(
          Text.substr(0, Advance), UsedColumns + Chars, TabWidth, Encoding);
    }

    // Stop once the current element no longer fits or is the last one.
    if (Chars > MaxSplit || Text.size() <= Advance)
      break;

    if (IsBlank(Text[0]))
      SpaceOffset = SplitPoint;
    if (Text[0] == '/')
      SlashOffset = SplitPoint;
    if (Advance == 1 && !isAlphanumeric(Text[0]))
      WordStartOffset = SplitPoint;

    SplitPoint += Advance;
    Text = Text.substr(Advance);
  }

  // An offset of 0 means "not found"; the "+ 1" places the split after the
  // recorded character.
  if (SpaceOffset != 0)
    return BreakableToken::Split(SpaceOffset + 1, 0);
  if (SlashOffset != 0)
    return BreakableToken::Split(SlashOffset + 1, 0);
  if (WordStartOffset != 0)
    return BreakableToken::Split(WordStartOffset + 1, 0);
  if (SplitPoint != 0)
    return BreakableToken::Split(SplitPoint, 0);
  return BreakableToken::Split(StringRef::npos, 0);
}

149

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

150

bool switchesFormatting(const FormatToken &Token) {

151

assert((Token.is(TT_BlockComment) || Token.is(TT_LineComment)) &&

152

"formatting regions are switched by comment tokens");

153

StringRef Content = Token.TokenText.substr(2).ltrim();

154

return Content.startswith("clang-format on") ||

155

Content.startswith("clang-format off");

}

unsigned

BreakableToken::getLineLengthAfterCompression(unsigned RemainingTokenColumns,

160

Split Split) const {

161

// Example: consider the content

162

// lala lala

163

// - RemainingTokenColumns is the original number of columns, 10;

164

// - Split is (4, 2), denoting the two spaces between the two words;

165

//

166

// We compute the number of columns when the split is compressed into a single

167

// space, like:

168

// lala lala

169

return RemainingTokenColumns + 1 - Split.second;

170

}

171

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

172

/// A single-line token always consists of exactly one line.
unsigned BreakableSingleLineToken::getLineCount() const {
  return 1;
}

Alexander Kornienko

2013-04-15 14:28:00 +0000

[diff] [blame]

173

Alexander Kornienko

dd7ece5

2013-06-07 16:02:52 +0000

[diff] [blame]

174

unsigned BreakableSingleLineToken::getLineLengthAfterSplit(

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

175

unsigned LineIndex, unsigned TailOffset,

176

StringRef::size_type Length) const {

Alexander Kornienko

2013-06-05 14:09:10 +0000

[diff] [blame]

177

return StartColumn + Prefix.size() + Postfix.size() +

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

178

encoding::columnWidthWithTabs(Line.substr(TailOffset, Length),

Alexander Kornienko

2013-09-05 14:08:34 +0000

[diff] [blame]

179

StartColumn + Prefix.size(),

180

Style.TabWidth, Encoding);

Alexander Kornienko

2013-04-15 14:28:00 +0000

[diff] [blame]

181

}

182

Alexander Kornienko

2013-06-14 11:46:10 +0000

[diff] [blame]

183

/// Constructs a breakable single-line token.
///
/// \p Prefix and \p Postfix are the parts of the token text surrounding the
/// breakable content; the token text is asserted to end with \p Postfix. The
/// content between them is stored in Line.
BreakableSingleLineToken::BreakableSingleLineToken(
    const FormatToken &Tok, unsigned StartColumn, StringRef Prefix,
    StringRef Postfix, bool InPPDirective, encoding::Encoding Encoding,
    const FormatStyle &Style)
    : BreakableToken(Tok, InPPDirective, Encoding, Style),
      StartColumn(StartColumn), Prefix(Prefix), Postfix(Postfix) {
  assert(Tok.TokenText.endswith(Postfix));
  // Strip the prefix and postfix to obtain the breakable content.
  Line = Tok.TokenText.substr(
      Prefix.size(), Tok.TokenText.size() - Prefix.size() - Postfix.size());
}

193

Alexander Kornienko

2013-09-16 20:20:49 +0000

[diff] [blame]

194

/// Constructs a breakable string literal; all arguments are forwarded
/// unchanged to BreakableSingleLineToken.
BreakableStringLiteral::BreakableStringLiteral(
    const FormatToken &Tok, unsigned StartColumn, StringRef Prefix,
    StringRef Postfix, bool InPPDirective, encoding::Encoding Encoding,
    const FormatStyle &Style)
    : BreakableSingleLineToken(Tok, StartColumn, Prefix, Postfix, InPPDirective,
                               Encoding, Style) {}

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

200

201

/// Returns a split for the string content starting at \p TailOffset so that
/// the line fits into \p ColumnLimit.
///
/// The columns taken by the start column, the prefix and the postfix are
/// counted as already used. \p LineIndex is not used.
BreakableToken::Split
BreakableStringLiteral::getSplit(unsigned LineIndex, unsigned TailOffset,
                                 unsigned ColumnLimit) const {
  return getStringSplit(Line.substr(TailOffset),
                        StartColumn + Prefix.size() + Postfix.size(),
                        ColumnLimit, Style.TabWidth, Encoding);
}

208

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

209

void BreakableStringLiteral::insertBreak(unsigned LineIndex,

210

unsigned TailOffset, Split Split,

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

211

WhitespaceManager &Whitespaces) {

Daniel Jasper

d07c2ee

2014-01-14 09:53:07 +0000

[diff] [blame]

212

unsigned LeadingSpaces = StartColumn;

213

// The '@' of an ObjC string literal (@"Test") does not become part of the

214

// string token.

215

// FIXME: It might be a cleaner solution to merge the tokens as a

216

// precomputation step.

217

if (Prefix.startswith("@"))

218

--LeadingSpaces;

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

219

Whitespaces.replaceWhitespaceInToken(

220

Tok, Prefix.size() + TailOffset + Split.first, Split.second, Postfix,

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

221

Prefix, InPPDirective, 1, LeadingSpaces);

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

222

}

223

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

224

/// Constructs the common part of a breakable comment, storing the start
/// column, the original start column and whether the comment is the first
/// token in its line.
BreakableComment::BreakableComment(const FormatToken &Token,
                                   unsigned StartColumn,
                                   unsigned OriginalStartColumn,
                                   bool FirstInLine, bool InPPDirective,
                                   encoding::Encoding Encoding,
                                   const FormatStyle &Style)
    : BreakableToken(Token, InPPDirective, Encoding, Style),
      StartColumn(StartColumn), OriginalStartColumn(OriginalStartColumn),
      FirstInLine(FirstInLine) {}

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

233

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

234

/// Returns the number of lines this comment was split into.
unsigned BreakableComment::getLineCount() const {
  return Lines.size();
}

235

236

/// Returns a split for the content of line \p LineIndex starting at
/// \p TailOffset so that the line fits into \p ColumnLimit.
BreakableToken::Split BreakableComment::getSplit(unsigned LineIndex,
                                                 unsigned TailOffset,
                                                 unsigned ColumnLimit) const {
  return getCommentSplit(Content[LineIndex].substr(TailOffset),
                         getContentStartColumn(LineIndex, TailOffset),
                         ColumnLimit, Style.TabWidth, Encoding);
}

243

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

244

void BreakableComment::compressWhitespace(unsigned LineIndex,

245

unsigned TailOffset, Split Split,

246

WhitespaceManager &Whitespaces) {

247

StringRef Text = Content[LineIndex].substr(TailOffset);

248

// Text is relative to the content line, but Whitespaces operates relative to

249

// the start of the corresponding token, so compute the start of the Split

250

// that needs to be compressed into a single space relative to the start of

251

// its token.

252

unsigned BreakOffsetInToken =

253

Text.data() - tokenAt(LineIndex).TokenText.data() + Split.first;

254

unsigned CharsToRemove = Split.second;

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

255

Whitespaces.replaceWhitespaceInToken(

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

256

tokenAt(LineIndex), BreakOffsetInToken, CharsToRemove, "", "",

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

257

/*InPPDirective=*/false, /*Newlines=*/0, /*Spaces=*/1);

Alexander Kornienko

875395f

2013-11-12 17:50:13 +0000

[diff] [blame]

258

}

259

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

260

/// Computes how much of \p Text can be reflown onto the previous line.
///
/// \param Text the content of the line that is a reflow candidate.
/// \param ReflowPrefix the text inserted between the previous line's content
///        and the reflown text.
/// \param PreviousEndColumn the end column of the previous line.
/// \param ColumnLimit the column limit to respect.
///
/// \returns a Split marking the end of the piece of \p Text that fits after
/// the previous line, or Split(StringRef::npos, 0) if nothing can be reflown
/// without exceeding \p ColumnLimit.
BreakableToken::Split
BreakableComment::getReflowSplit(StringRef Text, StringRef ReflowPrefix,
                                 unsigned PreviousEndColumn,
                                 unsigned ColumnLimit) const {
  unsigned ReflowStartColumn = PreviousEndColumn + ReflowPrefix.size();
  StringRef TrimmedText = Text.rtrim(Blanks);
  // This is the width of the resulting line in case the full line of Text gets
  // reflown up starting at ReflowStartColumn.
  unsigned FullWidth = ReflowStartColumn + encoding::columnWidthWithTabs(
                                               TrimmedText, ReflowStartColumn,
                                               Style.TabWidth, Encoding);
  // If the full line fits up, we return a reflow split after it,
  // otherwise we compute the largest piece of text that fits after
  // ReflowStartColumn.
  Split ReflowSplit =
      FullWidth <= ColumnLimit
          ? Split(TrimmedText.size(), Text.size() - TrimmedText.size())
          : getCommentSplit(Text, ReflowStartColumn, ColumnLimit,
                            Style.TabWidth, Encoding);

  // We need to be extra careful here, because while it's OK to keep a long line
  // if it can't be broken into smaller pieces (like when the first word of a
  // long line is longer than the column limit), it's not OK to reflow that long
  // word up. So we recompute the size of the previous line after reflowing and
  // only return the reflow split if that's under the line limit.
  if (ReflowSplit.first != StringRef::npos &&
      // Check if the width of the newly reflown line is under the limit.
      ReflowStartColumn +
              encoding::columnWidthWithTabs(Text.substr(0, ReflowSplit.first),
                                            ReflowStartColumn, Style.TabWidth,
                                            Encoding) <=
          ColumnLimit) {
    return ReflowSplit;
  }
  return Split(StringRef::npos, 0);
}

297

298

/// Returns the token recorded for line \p LineIndex, falling back to the
/// comment's own token (Tok) when no token is recorded for that line.
const FormatToken &BreakableComment::tokenAt(unsigned LineIndex) const {
  return Tokens[LineIndex] ? *Tokens[LineIndex] : Tok;
}

301

302

/// Returns true if \p Content (with surrounding blanks ignored) looks like
/// plain text that may be reflown into the previous line.
static bool mayReflowContent(StringRef Content) {
  Content = Content.trim(Blanks);
  // Simple heuristic for what to reflow: content should contain at least two
  // characters and either the first or second character must be
  // non-punctuation.
  return Content.size() >= 2 &&
         // Lines starting with '@' commonly have special meaning.
         !Content.startswith("@") && !Content.endswith("\\") &&
         // Note that this is UTF-8 safe, since if isPunctuation(Content[0]) is
         // true, then the first code point must be 1 byte long.
         (!isPunctuation(Content[0]) || !isPunctuation(Content[1]));
}

314

315

bool BreakableComment::mayReflow(unsigned LineIndex) const {

316

return LineIndex > 0 && mayReflowContent(Content[LineIndex]) &&

317

!Tok.Finalized && !switchesFormatting(tokenAt(LineIndex)) &&

318

(!Tok.is(TT_LineComment) ||

319

OriginalPrefix[LineIndex] == OriginalPrefix[LineIndex - 1]);

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

320

}

321

Alexander Kornienko

2013-06-05 14:09:10 +0000

[diff] [blame]

322

/// Constructs a breakable block comment from \p Token.
///
/// The text between "/*" and "*/" is split into Lines at '\n'. For every line
/// the constructor computes the content (Content) and the column at which it
/// starts (ContentColumn), detects the decoration shared by the lines (a
/// prefix of "* ", possibly empty), and computes the indent to use when a
/// line is broken (IndentAtLineBreak).
BreakableBlockComment::BreakableBlockComment(
    const FormatToken &Token, unsigned StartColumn,
    unsigned OriginalStartColumn, bool FirstInLine, bool InPPDirective,
    encoding::Encoding Encoding, const FormatStyle &Style)
    : BreakableComment(Token, StartColumn, OriginalStartColumn, FirstInLine,
                       InPPDirective, Encoding, Style) {
  assert(Tok.is(TT_BlockComment) &&
         "block comment section must start with a block comment");

  StringRef TokenText(Tok.TokenText);
  assert(TokenText.startswith("/*") && TokenText.endswith("*/"));
  // Drop the "/*" and "*/" delimiters before splitting into lines.
  TokenText.substr(2, TokenText.size() - 4).split(Lines, "\n");

  int IndentDelta = StartColumn - OriginalStartColumn;
  Content.resize(Lines.size());
  Content[0] = Lines[0];
  ContentColumn.resize(Lines.size());
  // Account for the initial '/*'.
  ContentColumn[0] = StartColumn + 2;
  Tokens.resize(Lines.size());
  for (size_t i = 1; i < Lines.size(); ++i)
    adjustWhitespace(i, IndentDelta);

  Decoration = "* ";
  if (Lines.size() == 1 && !FirstInLine) {
    // Comments for which FirstInLine is false can start on arbitrary column,
    // and available horizontal space can be too small to align consecutive
    // lines with the first one.
    // FIXME: We could, probably, align them to current indentation level, but
    // now we just wrap them without stars.
    Decoration = "";
  }
  // Shrink the decoration to the longest prefix of "* " shared by all lines
  // after the first.
  for (size_t i = 1, e = Lines.size(); i < e && !Decoration.empty(); ++i) {
    // If the last line is empty, the closing "*/" will have a star.
    if (i + 1 == e && Content[i].empty())
      break;
    // A non-last line that is itself a prefix of the decoration (e.g. "*")
    // does not constrain the decoration.
    if (!Content[i].empty() && i + 1 != e &&
        Decoration.startswith(Content[i]))
      continue;
    while (!Content[i].startswith(Decoration))
      Decoration = Decoration.substr(0, Decoration.size() - 1);
  }

  LastLineNeedsDecoration = true;
  IndentAtLineBreak = ContentColumn[0] + 1;
  for (size_t i = 1, e = Lines.size(); i < e; ++i) {
    if (Content[i].empty()) {
      if (i + 1 == e) {
        // Empty last line means that we already have a star as a part of the
        // trailing */. We also need to preserve whitespace, so that */ is
        // correctly indented.
        LastLineNeedsDecoration = false;
      } else if (Decoration.empty()) {
        // For all other lines, set the start column to 0 if they're empty, so
        // we do not insert trailing whitespace anywhere.
        ContentColumn[i] = 0;
      }
      continue;
    }

    // The first line already excludes the star.
    // For all other lines, adjust the line to exclude the star and
    // (optionally) the first whitespace.
    unsigned DecorationSize = Decoration.startswith(Content[i])
                                  ? Content[i].size()
                                  : Decoration.size();
    ContentColumn[i] += DecorationSize;
    Content[i] = Content[i].substr(DecorationSize);
    if (!Decoration.startswith(Content[i]))
      IndentAtLineBreak =
          std::min<int>(IndentAtLineBreak, std::max(0, ContentColumn[i]));
  }
  // Never indent less than the width of the decoration itself.
  IndentAtLineBreak =
      std::max<unsigned>(IndentAtLineBreak, Decoration.size());

  DEBUG({
    llvm::dbgs() << "IndentAtLineBreak " << IndentAtLineBreak << "\n";
    for (size_t i = 0; i < Lines.size(); ++i) {
      llvm::dbgs() << i << " |" << Content[i] << "| "
                   << (Content[i].data() - Lines[i].data()) << "\n";
    }
  });
}

Alexander Kornienko

2013-09-05 14:08:34 +0000

[diff] [blame]

406

void BreakableBlockComment::adjustWhitespace(unsigned LineIndex,

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

407

int IndentDelta) {

Alexander Kornienko

2013-06-14 11:46:10 +0000

[diff] [blame]

408

// When in a preprocessor directive, the trailing backslash in a block comment

409

// is not needed, but can serve a purpose of uniformity with necessary escaped

410

// newlines outside the comment. In this case we remove it here before

411

// trimming the trailing whitespace. The backslash will be re-added later when

412

// inserting a line break.

413

size_t EndOfPreviousLine = Lines[LineIndex - 1].size();

414

if (InPPDirective && Lines[LineIndex - 1].endswith("\\"))

415

--EndOfPreviousLine;

416

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

417

// Calculate the end of the non-whitespace text in the previous line.

Alexander Kornienko

2013-06-14 11:46:10 +0000

[diff] [blame]

418

EndOfPreviousLine =

Alexander Kornienko

2013-06-20 13:58:37 +0000

[diff] [blame]

419

Lines[LineIndex - 1].find_last_not_of(Blanks, EndOfPreviousLine);

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

420

if (EndOfPreviousLine == StringRef::npos)

421

EndOfPreviousLine = 0;

422

else

423

++EndOfPreviousLine;

424

// Calculate the start of the non-whitespace text in the current line.

Alexander Kornienko

2013-06-20 13:58:37 +0000

[diff] [blame]

425

size_t StartOfLine = Lines[LineIndex].find_first_not_of(Blanks);

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

426

if (StartOfLine == StringRef::npos)

Daniel Jasper

d6e6188

2015-06-17 12:23:15 +0000

[diff] [blame]

427

StartOfLine = Lines[LineIndex].rtrim("\r\n").size();

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

428

Alexander Kornienko

2013-09-05 14:08:34 +0000

[diff] [blame]

429

StringRef Whitespace = Lines[LineIndex].substr(0, StartOfLine);

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

430

// Adjust Lines to only contain relevant text.

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

431

size_t PreviousContentOffset =

432

Content[LineIndex - 1].data() - Lines[LineIndex - 1].data();

433

Content[LineIndex - 1] = Lines[LineIndex - 1].substr(

434

PreviousContentOffset, EndOfPreviousLine - PreviousContentOffset);

435

Content[LineIndex] = Lines[LineIndex].substr(StartOfLine);

Manuel Klimek

34d1515

2013-05-28 10:01:59 +0000

[diff] [blame]

436

Alp Toker

f6a24ce

2013-12-05 16:25:25 +0000

[diff] [blame]

437

// Adjust the start column uniformly across all lines.

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

438

ContentColumn[LineIndex] =

Alexander Kornienko

39856b7

2013-09-10 09:38:25 +0000

[diff] [blame]

439

encoding::columnWidthWithTabs(Whitespace, 0, Style.TabWidth, Encoding) +

Alexander Kornienko

67d9c8c

2014-04-17 16:12:46 +0000

[diff] [blame]

440

IndentDelta;

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

441

}

442

Alexander Kornienko

dd7ece5

2013-06-07 16:02:52 +0000

[diff] [blame]

443

unsigned BreakableBlockComment::getLineLengthAfterSplit(

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

444

unsigned LineIndex, unsigned TailOffset,

445

StringRef::size_type Length) const {

446

unsigned ContentStartColumn = getContentStartColumn(LineIndex, TailOffset);

447

unsigned LineLength =

448

ContentStartColumn + encoding::columnWidthWithTabs(

449

Content[LineIndex].substr(TailOffset, Length),

450

ContentStartColumn, Style.TabWidth, Encoding);

451

// The last line gets a "*/" postfix.

452

if (LineIndex + 1 == Lines.size()) {

453

LineLength += 2;

454

// We never need a decoration when breaking just the trailing "*/" postfix.

455

// Note that checking that Length == 0 is not enough, since Length could

456

// also be StringRef::npos.

457

if (Content[LineIndex].substr(TailOffset, Length).empty()) {

458

LineLength -= Decoration.size();

459

}

460

}

461

return LineLength;

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

462

}

463

464

void BreakableBlockComment::insertBreak(unsigned LineIndex, unsigned TailOffset,

Alexander Kornienko

2013-06-14 11:46:10 +0000

[diff] [blame]

465

Split Split,

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

466

WhitespaceManager &Whitespaces) {

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

467

StringRef Text = Content[LineIndex].substr(TailOffset);

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

468

StringRef Prefix = Decoration;

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

469

// We need this to account for the case when we have a decoration "* " for all

470

// the lines except for the last one, where the star in "*/" acts as a

471

// decoration.

472

unsigned LocalIndentAtLineBreak = IndentAtLineBreak;

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

473

if (LineIndex + 1 == Lines.size() &&

474

Text.size() == Split.first + Split.second) {

475

// For the last line we need to break before "*/", but not to add "* ".

476

Prefix = "";

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

477

if (LocalIndentAtLineBreak >= 2)

478

LocalIndentAtLineBreak -= 2;

479

}

480

// The split offset is from the beginning of the line. Convert it to an offset

481

// from the beginning of the token text.

482

unsigned BreakOffsetInToken =

483

Text.data() - tokenAt(LineIndex).TokenText.data() + Split.first;

484

unsigned CharsToRemove = Split.second;

485

assert(LocalIndentAtLineBreak >= Prefix.size());

486

Whitespaces.replaceWhitespaceInToken(

487

tokenAt(LineIndex), BreakOffsetInToken, CharsToRemove, "", Prefix,

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

488

InPPDirective, /*Newlines=*/1,

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

489

/*Spaces=*/LocalIndentAtLineBreak - Prefix.size());

490

}

491

492

/// Returns the split describing how much of line \p LineIndex can be reflown
/// onto the previous line, which ends at \p PreviousEndColumn, or
/// Split(StringRef::npos, 0) if the line may not be reflown.
BreakableToken::Split BreakableBlockComment::getSplitBefore(
    unsigned LineIndex,
    unsigned PreviousEndColumn,
    unsigned ColumnLimit) const {
  if (!mayReflow(LineIndex))
    return Split(StringRef::npos, 0);
  // Leading blanks of the line are not carried over when reflowing.
  StringRef TrimmedContent = Content[LineIndex].ltrim(Blanks);
  return getReflowSplit(TrimmedContent, ReflowPrefix, PreviousEndColumn,
                        ColumnLimit);
}

unsigned BreakableBlockComment::getReflownColumn(

504

StringRef Content,

505

unsigned LineIndex,

506

unsigned PreviousEndColumn) const {

507

unsigned StartColumn = PreviousEndColumn + ReflowPrefix.size();

508

// If this is the last line, it will carry around its '*/' postfix.

509

unsigned PostfixLength = (LineIndex + 1 == Lines.size() ? 2 : 0);

510

// The line is composed of previous text, reflow prefix, reflown text and

511

// postfix.

512

unsigned ReflownColumn =

513

StartColumn + encoding::columnWidthWithTabs(Content, StartColumn,

514

Style.TabWidth, Encoding) +

515

PostfixLength;

516

return ReflownColumn;

517

}

518

519

unsigned BreakableBlockComment::getLineLengthAfterSplitBefore(

520

unsigned LineIndex, unsigned TailOffset,

521

unsigned PreviousEndColumn,

522

unsigned ColumnLimit,

523

Split SplitBefore) const {

Krasimir Georgiev

af1b962

2017-01-31 14:31:44 +0000

[diff] [blame]

524

if (SplitBefore.first == StringRef::npos ||

525

// Block comment line contents contain the trailing whitespace after the

526

// decoration, so the need of left trim. Note that this behavior is

527

// consistent with the breaking of block comments where the indentation of

528

// a broken line is uniform across all the lines of the block comment.

529

SplitBefore.first + SplitBefore.second <

530

Content[LineIndex].ltrim().size()) {

531

// A piece of line, not the whole, gets reflown.

532

return getLineLengthAfterSplit(LineIndex, TailOffset, StringRef::npos);

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

533

} else {

534

// The whole line gets reflown, need to check if we need to insert a break

535

// for the postfix or not.

536

StringRef TrimmedContent = Content[LineIndex].ltrim(Blanks);

537

unsigned ReflownColumn =

538

getReflownColumn(TrimmedContent, LineIndex, PreviousEndColumn);

539

if (ReflownColumn <= ColumnLimit) {

540

return ReflownColumn;

541

}

542

return getLineLengthAfterSplit(LineIndex, TailOffset, StringRef::npos);

543

}

544

}

545

void BreakableBlockComment::replaceWhitespaceBefore(

546

unsigned LineIndex, unsigned PreviousEndColumn, unsigned ColumnLimit,

547

Split SplitBefore, WhitespaceManager &Whitespaces) {

548

if (LineIndex == 0) return;

549

StringRef TrimmedContent = Content[LineIndex].ltrim(Blanks);

550

if (SplitBefore.first != StringRef::npos) {

551

// Here we need to reflow.

552

assert(Tokens[LineIndex - 1] == Tokens[LineIndex] &&

553

"Reflowing whitespace within a token");

554

// This is the offset of the end of the last line relative to the start of

555

// the token text in the token.

556

unsigned WhitespaceOffsetInToken = Content[LineIndex - 1].data() +

557

Content[LineIndex - 1].size() -

558

tokenAt(LineIndex).TokenText.data();

559

unsigned WhitespaceLength = TrimmedContent.data() -

560

tokenAt(LineIndex).TokenText.data() -

561

WhitespaceOffsetInToken;

562

Whitespaces.replaceWhitespaceInToken(

563

tokenAt(LineIndex), WhitespaceOffsetInToken,

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

564

/*ReplaceChars=*/WhitespaceLength, /*PreviousPostfix=*/"",

565

/*CurrentPrefix=*/ReflowPrefix, InPPDirective, /*Newlines=*/0,

566

/*Spaces=*/0);

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

567

// Check if we need to also insert a break at the whitespace range.

568

// For this we first adapt the reflow split relative to the beginning of the

569

// content.

570

// Note that we don't need a penalty for this break, since it doesn't change

571

// the total number of lines.

572

Split BreakSplit = SplitBefore;

573

BreakSplit.first += TrimmedContent.data() - Content[LineIndex].data();

574

unsigned ReflownColumn =

575

getReflownColumn(TrimmedContent, LineIndex, PreviousEndColumn);

576

if (ReflownColumn > ColumnLimit) {

577

insertBreak(LineIndex, 0, BreakSplit, Whitespaces);

578

}

579

return;

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

580

}

581

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

582

// Here no reflow with the previous line will happen.

583

// Fix the decoration of the line at LineIndex.

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

584

StringRef Prefix = Decoration;

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

585

if (Content[LineIndex].empty()) {

Manuel Klimek

281dcbe

2013-05-28 08:55:01 +0000

[diff] [blame]

586

if (LineIndex + 1 == Lines.size()) {

Alexander Kornienko

2013-07-08 14:12:07 +0000

[diff] [blame]

587

if (!LastLineNeedsDecoration) {

588

// If the last line was empty, we don't need a prefix, as the */ will

589

// line up with the decoration (if it exists).

590

Prefix = "";

591

}

Manuel Klimek

281dcbe

2013-05-28 08:55:01 +0000

[diff] [blame]

592

} else if (!Decoration.empty()) {

593

// For other empty lines, if we do have a decoration, adapt it to not

594

// contain a trailing whitespace.

595

Prefix = Prefix.substr(0, 1);

596

}

Daniel Jasper

51fb2b2

2013-05-30 06:40:07 +0000

[diff] [blame]

597

} else {

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

598

if (ContentColumn[LineIndex] == 1) {

Alexander Kornienko

2013-07-08 14:12:07 +0000

[diff] [blame]

599

// This line starts immediately after the decorating *.

Daniel Jasper

51fb2b2

2013-05-30 06:40:07 +0000

[diff] [blame]

600

Prefix = Prefix.substr(0, 1);

601

}

Manuel Klimek

281dcbe

2013-05-28 08:55:01 +0000

[diff] [blame]

602

}

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

603

// This is the offset of the end of the last line relative to the start of the

604

// token text in the token.

605

unsigned WhitespaceOffsetInToken = Content[LineIndex - 1].data() +

606

Content[LineIndex - 1].size() -

607

tokenAt(LineIndex).TokenText.data();

608

unsigned WhitespaceLength = Content[LineIndex].data() -

609

tokenAt(LineIndex).TokenText.data() -

610

WhitespaceOffsetInToken;

Alexander Kornienko

2013-06-11 16:01:49 +0000

[diff] [blame]

611

Whitespaces.replaceWhitespaceInToken(

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

612

tokenAt(LineIndex), WhitespaceOffsetInToken, WhitespaceLength, "", Prefix,

613

InPPDirective, /*Newlines=*/1, ContentColumn[LineIndex] - Prefix.size());

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

}

unsigned

BreakableBlockComment::getContentStartColumn(unsigned LineIndex,

618

unsigned TailOffset) const {

619

// If we break, we always break at the predefined indent.

620

if (TailOffset != 0)

621

return IndentAtLineBreak;

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

622

return std::max(0, ContentColumn[LineIndex]);

623

}

624

625

// Builds a section out of the line comment Token and the line comment tokens
// that directly follow it.
//
// Each token's text is split at '\n' and, for every resulting line, the
// original and intended prefix, the content without trailing blanks, the
// content columns and the owning token are recorded.
BreakableLineCommentSection::BreakableLineCommentSection(
    const FormatToken &Token, unsigned StartColumn,
    unsigned OriginalStartColumn, bool FirstInLine, bool InPPDirective,
    encoding::Encoding Encoding, const FormatStyle &Style)
    : BreakableComment(Token, StartColumn, OriginalStartColumn, FirstInLine,
                       InPPDirective, Encoding, Style) {
  assert(Tok.is(TT_LineComment) &&
         "line comment section must start with a line comment");

  // LineTok is null while the first token is processed and points at the
  // token being processed in every later iteration.
  FormatToken *LineTok = nullptr;
  for (const FormatToken *CurrentTok = &Tok;
       CurrentTok && CurrentTok->is(TT_LineComment);
       CurrentTok = CurrentTok->Next) {
    LastLineTok = LineTok;

    StringRef CommentText(CurrentTok->TokenText);
    assert(CommentText.startswith("//"));

    // Append this token's lines and grow all per-line tables to match.
    const size_t FirstLineIndex = Lines.size();
    CommentText.split(Lines, "\n");
    const size_t NumLines = Lines.size();
    Content.resize(NumLines);
    ContentColumn.resize(NumLines);
    OriginalContentColumn.resize(NumLines);
    Tokens.resize(NumLines);
    Prefix.resize(NumLines);
    OriginalPrefix.resize(NumLines);

    for (size_t Idx = FirstLineIndex; Idx < NumLines; ++Idx) {
      // We need to trim the blanks in case this is not the first line in a
      // multiline comment. Then the indent is included in Lines[Idx].
      // NOTE(review): the alphanumeric check and the Content computation
      // below index the untrimmed Lines[Idx] although the prefix was taken
      // from the trimmed line -- confirm this is intended for indented
      // continuation lines.
      StringRef IndentPrefix =
          getLineCommentIndentPrefix(Lines[Idx].ltrim(Blanks));
      assert(IndentPrefix.startswith("//"));
      OriginalPrefix[Idx] = Prefix[Idx] = IndentPrefix;

      // If text follows the prefix immediately, the intended prefix gets a
      // separating space.
      const bool TextFollowsPrefix =
          Lines[Idx].size() > Prefix[Idx].size() &&
          isAlphanumeric(Lines[Idx][Prefix[Idx].size()]);
      if (TextFollowsPrefix) {
        if (Prefix[Idx] == "//")
          Prefix[Idx] = "// ";
        else if (Prefix[Idx] == "///")
          Prefix[Idx] = "/// ";
        else if (Prefix[Idx] == "//!")
          Prefix[Idx] = "//! ";
      }

      Tokens[Idx] = LineTok;
      Content[Idx] = Lines[Idx].substr(IndentPrefix.size());

      const unsigned OriginalPrefixWidth = encoding::columnWidthWithTabs(
          OriginalPrefix[Idx], StartColumn, Style.TabWidth, Encoding);
      OriginalContentColumn[Idx] = StartColumn + OriginalPrefixWidth;

      const unsigned PrefixWidth = encoding::columnWidthWithTabs(
          Prefix[Idx], StartColumn, Style.TabWidth, Encoding);
      ContentColumn[Idx] = StartColumn + PrefixWidth;

      // Cut the content after its last non-blank character. Content that
      // consists of blanks only is left as it is.
      const size_t LastNonBlank = Content[Idx].find_last_not_of(Blanks);
      if (LastNonBlank != StringRef::npos)
        Content[Idx] = Content[Idx].substr(0, LastNonBlank + 1);
    }

    LineTok = CurrentTok->Next;
    if (LineTok && LineTok->NewlinesBefore > 1) {
      // A line comment section needs to be broken by a line comment that is
      // preceded by at least two newlines. Note that we put this break here
      // instead of breaking at a previous stage during parsing, since that
      // would split the contents of the enum into two unwrapped lines in this
      // example, which is undesirable:
      // enum A {
      //   a, // comment about a
      //
      //   // comment about b
      //   b
      // };
      //
      // FIXME: Consider putting separate line comment sections as children to
      // the unwrapped line instead.
      break;
    }
  }
}

unsigned BreakableLineCommentSection::getLineLengthAfterSplit(

710

unsigned LineIndex, unsigned TailOffset,

711

StringRef::size_type Length) const {

712

unsigned ContentStartColumn =

713

(TailOffset == 0 ? ContentColumn[LineIndex]

714

: OriginalContentColumn[LineIndex]);

715

return ContentStartColumn + encoding::columnWidthWithTabs(

716

Content[LineIndex].substr(TailOffset, Length),

717

ContentStartColumn, Style.TabWidth, Encoding);

718

}

719

720

void BreakableLineCommentSection::insertBreak(unsigned LineIndex,

721

unsigned TailOffset, Split Split,

722

WhitespaceManager &Whitespaces) {

723

StringRef Text = Content[LineIndex].substr(TailOffset);

724

// Compute the offset of the split relative to the beginning of the token

725

// text.

726

unsigned BreakOffsetInToken =

727

Text.data() - tokenAt(LineIndex).TokenText.data() + Split.first;

728

unsigned CharsToRemove = Split.second;

729

// Compute the size of the new indent, including the size of the new prefix of

730

// the newly broken line.

731

unsigned IndentAtLineBreak = OriginalContentColumn[LineIndex] +

732

Prefix[LineIndex].size() -

733

OriginalPrefix[LineIndex].size();

734

assert(IndentAtLineBreak >= Prefix[LineIndex].size());

735

Whitespaces.replaceWhitespaceInToken(

736

tokenAt(LineIndex), BreakOffsetInToken, CharsToRemove, "",

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

737

Prefix[LineIndex], InPPDirective, /*Newlines=*/1,

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

738

/*Spaces=*/IndentAtLineBreak - Prefix[LineIndex].size());

739

}

740

741

// Computes the split used to reflow the beginning of line LineIndex behind
// the previous line, which ends at column PreviousEndColumn.
//
// Returns Split(StringRef::npos, 0) when mayReflow() rejects the line.
BreakableComment::Split BreakableLineCommentSection::getSplitBefore(
    unsigned LineIndex, unsigned PreviousEndColumn,
    unsigned ColumnLimit) const {
  if (mayReflow(LineIndex)) {
    return getReflowSplit(Content[LineIndex], ReflowPrefix, PreviousEndColumn,
                          ColumnLimit);
  }
  return Split(StringRef::npos, 0);
}

unsigned BreakableLineCommentSection::getLineLengthAfterSplitBefore(

751

unsigned LineIndex, unsigned TailOffset,

752

unsigned PreviousEndColumn,

753

unsigned ColumnLimit,

754

Split SplitBefore) const {

755

if (SplitBefore.first == StringRef::npos ||

756

SplitBefore.first + SplitBefore.second < Content[LineIndex].size()) {

757

// A piece of line, not the whole line, gets reflown.

758

return getLineLengthAfterSplit(LineIndex, TailOffset, StringRef::npos);

759

} else {

760

// The whole line gets reflown.

761

unsigned StartColumn = PreviousEndColumn + ReflowPrefix.size();

762

return StartColumn + encoding::columnWidthWithTabs(Content[LineIndex],

StartColumn,

Style.TabWidth,

Encoding);

}

}

void BreakableLineCommentSection::replaceWhitespaceBefore(

770

unsigned LineIndex, unsigned PreviousEndColumn, unsigned ColumnLimit,

771

Split SplitBefore, WhitespaceManager &Whitespaces) {

772

// If this is the first line of a token, we need to inform Whitespace Manager

773

// about it: either adapt the whitespace range preceding it, or mark it as an

774

// untouchable token.

775

// This happens for instance here:

776

// // line 1 \

777

// // line 2

778

if (LineIndex > 0 && Tokens[LineIndex] != Tokens[LineIndex - 1]) {

779

if (SplitBefore.first != StringRef::npos) {

780

// Reflow happens between tokens. Replace the whitespace between the

781

// tokens by the empty string.

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

782

Whitespaces.replaceWhitespace(

783

*Tokens[LineIndex], /*Newlines=*/0, /*Spaces=*/0,

784

/*StartOfTokenColumn=*/StartColumn, /*InPPDirective=*/false);

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

785

// Replace the indent and prefix of the token with the reflow prefix.

786

unsigned WhitespaceLength =

787

Content[LineIndex].data() - tokenAt(LineIndex).TokenText.data();

788

Whitespaces.replaceWhitespaceInToken(*Tokens[LineIndex],

789

/*Offset=*/0,

790

/*ReplaceChars=*/WhitespaceLength,

791

/*PreviousPostfix=*/"",

792

/*CurrentPrefix=*/ReflowPrefix,

793

/*InPPDirective=*/false,

794

/*Newlines=*/0,

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

795

/*Spaces=*/0);

796

} else {

797

// This is the first line for the current token, but no reflow with the

798

// previous token is necessary. However, we still may need to adjust the

799

// start column.

800

unsigned LineColumn =

801

ContentColumn[LineIndex] -

802

(Content[LineIndex].data() - Lines[LineIndex].data());

803

if (tokenAt(LineIndex).OriginalColumn != LineColumn) {

804

Whitespaces.replaceWhitespace(*Tokens[LineIndex],

805

/*Newlines=*/1,

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

806

/*Spaces=*/LineColumn,

807

/*StartOfTokenColumn=*/LineColumn,

808

/*InPPDirective=*/false);

809

} else {

810

// The whitespace preceding the first line of this token does not need

811

// to be touched.

812

Whitespaces.addUntouchableToken(tokenAt(LineIndex),

813

/*InPPDirective=*/false);

814

}

815

}

816

} else if (OriginalPrefix[LineIndex] != Prefix[LineIndex]) {

817

// This is not the first line of the token. Adjust the prefix if necessary.

818

819

// Take care of the space possibly introduced after a decoration.

820

assert(Prefix[LineIndex] == (OriginalPrefix[LineIndex] + " ").str() &&

821

"Expecting a block comment decoration to differ from original by "

822

"at most a space");

823

Whitespaces.replaceWhitespaceInToken(

824

tokenAt(LineIndex), OriginalPrefix[LineIndex].size(), 0, "", "",

Daniel Jasper

2017-01-31 11:25:01 +0000

[diff] [blame]

825

/*InPPDirective=*/false, /*Newlines=*/0, /*Spaces=*/1);

Krasimir Georgiev

2017-01-25 13:58:58 +0000

[diff] [blame]

826

}

827

// Add a break after a reflow split has been introduced, if necessary.

828

// Note that this break doesn't need to be penalized, since it doesn't change

829

// the number of lines.

830

if (SplitBefore.first != StringRef::npos &&

831

SplitBefore.first + SplitBefore.second < Content[LineIndex].size()) {

832

insertBreak(LineIndex, 0, SplitBefore, Whitespaces);

}

}

// Sets State.NextToken to the token following the last line comment token
// recorded in LastLineTok. State is left untouched when LastLineTok is null.
void BreakableLineCommentSection::updateNextToken(LineState& State) const {
  if (!LastLineTok)
    return;
  State.NextToken = LastLineTok->Next;
}

unsigned

BreakableLineCommentSection::getContentStartColumn(unsigned LineIndex,

844

unsigned TailOffset) const {

845

if (TailOffset != 0) {

846

return OriginalContentColumn[LineIndex];

847

}

848

return ContentColumn[LineIndex];

Manuel Klimek

2013-05-27 15:23:34 +0000

[diff] [blame]

849

}

850

Alexander Kornienko