Blame - clang/lib/Format/BreakableToken.h - toolchain/llvm-project

blob: 8ef26ef464da9ea8b085ec26994edac178ea8fcd [file] [log] [blame]

Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	1	//===--- BreakableToken.h - Format C++ code -------------------------------===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	///
				10	/// \file
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	11	/// \brief Declares BreakableToken, BreakableStringLiteral, BreakableComment,
				12	/// BreakableBlockComment and BreakableLineCommentSection classes, that contain
				13	/// token type-specific logic to break long lines in tokens and reflow content
				14	/// between tokens.
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	15	///
				16	//===----------------------------------------------------------------------===//
				17
Benjamin Kramer	2f5db8b	2014-08-13 16:25:19 +0000	[diff] [blame]	18	#ifndef LLVM_CLANG_LIB_FORMAT_BREAKABLETOKEN_H
				19	#define LLVM_CLANG_LIB_FORMAT_BREAKABLETOKEN_H
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	20
Alexander Kornienko	ffcc010	2013-06-05 14:09:10 +0000	[diff] [blame]	21	#include "Encoding.h"
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	22	#include "TokenAnnotator.h"
				23	#include "WhitespaceManager.h"
Krasimir Georgiev	00c5c72	2017-02-02 15:32:19 +0000	[diff] [blame]	24	#include "llvm/Support/Regex.h"
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	25	#include <utility>
				26
				27	namespace clang {
				28	namespace format {
				29
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	30	/// \brief Checks if \p Token switches formatting, like /* clang-format off */.
				31	/// \p Token must be a comment.
				32	bool switchesFormatting(const FormatToken &Token);
				33
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	34	struct FormatStyle;
				35
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	36	/// \brief Base class for tokens / ranges of tokens that can allow breaking
				37	/// within the tokens - for example, to avoid whitespace beyond the column
				38	/// limit, or to reflow text.
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	39	///
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	40	/// Generally, a breakable token consists of logical lines, addressed by a line
				41	/// index. For example, in a sequence of line comments, each line comment is its
				42	/// own logical line; similarly, for a block comment, each line in the block
				43	/// comment is on its own logical line.
				44	///
				45	/// There are two methods to compute the layout of the token:
				46	/// - getRangeLength measures the number of columns needed for a range of text
				47	/// within a logical line, and
				48	/// - getContentStartColumn returns the start column at which we want the
				49	/// content of a logical line to start (potentially after introducing a line
				50	/// break).
				51	///
				52	/// The mechanism to adapt the layout of the breakable token is organised
				53	/// around the concept of a \c Split, which is a whitespace range that signifies
				54	/// a position of the content of a token where a reformatting might be done.
				55	///
				56	/// Operating with splits is divided into two operations:
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	57	/// - getSplit, for finding a split starting at a position,
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	58	/// - insertBreak, for executing the split using a whitespace manager.
				59	///
				60	/// There is a pair of operations that are used to compress a long whitespace
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	61	/// range with a single space if that will bring the line length under the
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	62	/// column limit:
				63	/// - getLengthAfterCompression, for calculating the size in columns of the
				64	/// line after a whitespace range has been compressed, and
				65	/// - compressWhitespace, for executing the whitespace compression using a
				66	/// whitespace manager; note that the compressed whitespace may be in the
				67	/// middle of the original line and of the reformatted line.
				68	///
				69	/// For tokens where the whitespace before each line needs to be also
				70	/// reformatted, for example for tokens supporting reflow, there are analogous
				71	/// operations that might be executed before the main line breaking occurs:
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	72	/// - getReflowSplit, for finding a split such that the content preceding it
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	73	/// needs to be specially reflown,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	74	/// - reflow, for executing the split using a whitespace manager,
Krasimir Georgiev	35599fd	2017-10-16 09:08:53 +0000	[diff] [blame]	75	/// - introducesBreakBeforeToken, for checking if reformatting the beginning
				76	/// of the content introduces a line break before it,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	77	/// - adaptStartOfLine, for executing the reflow using a whitespace
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	78	/// manager.
				79	///
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	80	/// For tokens that require the whitespace after the last line to be
				81	/// reformatted, for example in multiline jsdoc comments that require the
				82	/// trailing '*/' to be on a line of itself, there are analogous operations
				83	/// that might be executed after the last line has been reformatted:
				84	/// - getSplitAfterLastLine, for finding a split after the last line that needs
				85	/// to be reflown,
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	86	/// - replaceWhitespaceAfterLastLine, for executing the reflow using a
				87	/// whitespace manager.
				88	///
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	89	class BreakableToken {
				90	public:
Alexander Kornienko	dd7ece5	2013-06-07 16:02:52 +0000	[diff] [blame]	91	/// \brief Contains starting character index and length of split.
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	92	typedef std::pair<StringRef::size_type, unsigned> Split;
				93
Angel Garcia Gomez	637d1e6	2015-10-20 13:23:58 +0000	[diff] [blame]	94	virtual ~BreakableToken() {}
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	95
				96	/// \brief Returns the number of lines in this token in the original code.
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	97	virtual unsigned getLineCount() const = 0;
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	98
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	99	/// \brief Returns the number of columns required to format the text in the
				100	/// byte range [\p Offset, \p Offset \c + \p Length).
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	101	///
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	102	/// \p Offset is the byte offset from the start of the content of the line
				103	/// at \p LineIndex.
				104	///
				105	/// \p StartColumn is the column at which the text starts in the formatted
				106	/// file, needed to compute tab stops correctly.
				107	virtual unsigned getRangeLength(unsigned LineIndex, unsigned Offset,
				108	StringRef::size_type Length,
				109	unsigned StartColumn) const = 0;
				110
				111	/// \brief Returns the number of columns required to format the text following
				112	/// the byte \p Offset in the line \p LineIndex, including potentially
				113	/// unbreakable sequences of tokens following after the end of the token.
				114	///
				115	/// \p Offset is the byte offset from the start of the content of the line
				116	/// at \p LineIndex.
				117	///
				118	/// \p StartColumn is the column at which the text starts in the formatted
				119	/// file, needed to compute tab stops correctly.
				120	///
				121	/// For breakable tokens that never use extra space at the end of a line, this
				122	/// is equivalent to getRangeLength with a Length of StringRef::npos.
				123	virtual unsigned getRemainingLength(unsigned LineIndex, unsigned Offset,
				124	unsigned StartColumn) const {
				125	return getRangeLength(LineIndex, Offset, StringRef::npos, StartColumn);
				126	}
				127
				128	/// \brief Returns the column at which content in line \p LineIndex starts,
				129	/// assuming no reflow.
				130	///
				131	/// If \p Break is true, returns the column at which the line should start
				132	/// after the line break.
				133	/// If \p Break is false, returns the column at which the line itself will
				134	/// start.
				135	virtual unsigned getContentStartColumn(unsigned LineIndex,
				136	bool Break) const = 0;
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	137
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	138	/// \brief Returns a range (offset, length) at which to break the line at
				139	/// \p LineIndex, if previously broken at \p TailOffset. If possible, do not
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	140	/// violate \p ColumnLimit, assuming the text starting at \p TailOffset in
				141	/// the token is formatted starting at ContentStartColumn in the reformatted
				142	/// file.
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	143	virtual Split getSplit(unsigned LineIndex, unsigned TailOffset,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	144	unsigned ColumnLimit, unsigned ContentStartColumn,
Krasimir Georgiev	17725d8	2017-03-08 08:55:12 +0000	[diff] [blame]	145	llvm::Regex &CommentPragmasRegex) const = 0;
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	146
				147	/// \brief Emits the previously retrieved \p Split via \p Whitespaces.
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	148	virtual void insertBreak(unsigned LineIndex, unsigned TailOffset, Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	149	WhitespaceManager &Whitespaces) const = 0;
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	150
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	151	/// \brief Returns the number of columns needed to format
				152	/// \p RemainingTokenColumns, assuming that Split is within the range measured
				153	/// by \p RemainingTokenColumns, and that the whitespace in Split is reduced
				154	/// to a single space.
				155	unsigned getLengthAfterCompression(unsigned RemainingTokenColumns,
				156	Split Split) const;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	157
Alexander Kornienko	875395f	2013-11-12 17:50:13 +0000	[diff] [blame]	158	/// \brief Replaces the whitespace range described by \p Split with a single
				159	/// space.
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	160	virtual void compressWhitespace(unsigned LineIndex, unsigned TailOffset,
				161	Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	162	WhitespaceManager &Whitespaces) const = 0;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	163
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	164	/// \brief Returns whether the token supports reflowing text.
				165	virtual bool supportsReflow() const { return false; }
				166
				167	/// \brief Returns a whitespace range (offset, length) of the content at \p
				168	/// LineIndex such that the content of that line is reflown to the end of the
				169	/// previous one.
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	170	///
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	171	/// Returning (StringRef::npos, 0) indicates reflowing is not possible.
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	172	///
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	173	/// The range will include any whitespace preceding the specified line's
				174	/// content.
				175	///
				176	/// If the split is not contained within one token, for example when reflowing
				177	/// line comments, returns (0, <length>).
				178	virtual Split getReflowSplit(unsigned LineIndex,
Krasimir Georgiev	a7a24bf	2017-03-08 08:58:44 +0000	[diff] [blame]	179	llvm::Regex &CommentPragmasRegex) const {
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	180	return Split(StringRef::npos, 0);
				181	}
				182
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	183	/// \brief Reflows the current line into the end of the previous one.
				184	virtual void reflow(unsigned LineIndex,
				185	WhitespaceManager &Whitespaces) const {}
				186
Manuel Klimek	7786614	2017-11-17 11:17:15 +0000	[diff] [blame]	187	/// \brief Returns whether there will be a line break at the start of the
				188	/// token.
				189	virtual bool introducesBreakBeforeToken() const {
Krasimir Georgiev	35599fd	2017-10-16 09:08:53 +0000	[diff] [blame]	190	return false;
				191	}
				192
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	193	/// \brief Replaces the whitespace between \p LineIndex-1 and \p LineIndex.
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	194	virtual void adaptStartOfLine(unsigned LineIndex,
				195	WhitespaceManager &Whitespaces) const {}
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	196
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	197	/// \brief Returns a whitespace range (offset, length) of the content at
				198	/// the last line that needs to be reformatted after the last line has been
				199	/// reformatted.
				200	///
				201	/// A result having offset == StringRef::npos means that no reformat is
				202	/// necessary.
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	203	virtual Split getSplitAfterLastLine(unsigned TailOffset) const {
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	204	return Split(StringRef::npos, 0);
				205	}
				206
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	207	/// \brief Replaces the whitespace from \p SplitAfterLastLine on the last line
				208	/// after the last line has been formatted by performing a reformatting.
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	209	void replaceWhitespaceAfterLastLine(unsigned TailOffset,
				210	Split SplitAfterLastLine,
				211	WhitespaceManager &Whitespaces) const {
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	212	insertBreak(getLineCount() - 1, TailOffset, SplitAfterLastLine,
				213	Whitespaces);
				214	}
				215
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	216	/// \brief Updates the next token of \p State to the next token after this
				217	/// one. This can be used when this token manages a set of underlying tokens
				218	/// as a unit and is responsible for the formatting of them.
				219	virtual void updateNextToken(LineState &State) const {}
				220
Alexander Kornienko	9e90b62	2013-04-17 17:34:05 +0000	[diff] [blame]	221	protected:
Daniel Jasper	7d42f3f	2017-01-31 11:25:01 +0000	[diff] [blame]	222	BreakableToken(const FormatToken &Tok, bool InPPDirective,
				223	encoding::Encoding Encoding, const FormatStyle &Style)
				224	: Tok(Tok), InPPDirective(InPPDirective), Encoding(Encoding),
				225	Style(Style) {}
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	226
Alexander Kornienko	9e90b62	2013-04-17 17:34:05 +0000	[diff] [blame]	227	const FormatToken &Tok;
Alexander Kornienko	be63390	2013-06-14 11:46:10 +0000	[diff] [blame]	228	const bool InPPDirective;
				229	const encoding::Encoding Encoding;
Alexander Kornienko	ebb43ca	2013-09-05 14:08:34 +0000	[diff] [blame]	230	const FormatStyle &Style;
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	231	};
				232
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	233	class BreakableStringLiteral : public BreakableToken {
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	234	public:
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	235	/// \brief Creates a breakable token for a single line string literal.
				236	///
				237	/// \p StartColumn specifies the column in which the token will start
				238	/// after formatting.
Daniel Jasper	7d42f3f	2017-01-31 11:25:01 +0000	[diff] [blame]	239	BreakableStringLiteral(const FormatToken &Tok, unsigned StartColumn,
				240	StringRef Prefix, StringRef Postfix,
				241	bool InPPDirective, encoding::Encoding Encoding,
				242	const FormatStyle &Style);
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	243
Krasimir Georgiev	17725d8	2017-03-08 08:55:12 +0000	[diff] [blame]	244	Split getSplit(unsigned LineIndex, unsigned TailOffset, unsigned ColumnLimit,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	245	unsigned ReflowColumn,
Krasimir Georgiev	17725d8	2017-03-08 08:55:12 +0000	[diff] [blame]	246	llvm::Regex &CommentPragmasRegex) const override;
Craig Topper	fb6b25b	2014-03-15 04:29:04 +0000	[diff] [blame]	247	void insertBreak(unsigned LineIndex, unsigned TailOffset, Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	248	WhitespaceManager &Whitespaces) const override;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	249	void compressWhitespace(unsigned LineIndex, unsigned TailOffset, Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	250	WhitespaceManager &Whitespaces) const override {}
				251	unsigned getLineCount() const override;
				252	unsigned getRangeLength(unsigned LineIndex, unsigned Offset,
				253	StringRef::size_type Length,
				254	unsigned StartColumn) const override;
				255	unsigned getRemainingLength(unsigned LineIndex, unsigned Offset,
				256	unsigned StartColumn) const override;
				257	unsigned getContentStartColumn(unsigned LineIndex, bool Break) const override;
				258
				259	protected:
				260	// The column in which the token starts.
				261	unsigned StartColumn;
				262	// The prefix a line needs after a break in the token.
				263	StringRef Prefix;
				264	// The postfix a line needs before introducing a break.
				265	StringRef Postfix;
				266	// The token text excluding the prefix and postfix.
				267	StringRef Line;
				268	// Length of the sequence of tokens after this string literal that cannot
				269	// contain line breaks.
				270	unsigned UnbreakableTailLength;
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	271	};
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	272
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	273	class BreakableComment : public BreakableToken {
				274	protected:
				275	/// \brief Creates a breakable token for a comment.
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	276	///
Krasimir Georgiev	4b15922	2017-02-21 10:54:50 +0000	[diff] [blame]	277	/// \p StartColumn specifies the column in which the comment will start after
				278	/// formatting.
Daniel Jasper	7d42f3f	2017-01-31 11:25:01 +0000	[diff] [blame]	279	BreakableComment(const FormatToken &Token, unsigned StartColumn,
Daniel Jasper	7d42f3f	2017-01-31 11:25:01 +0000	[diff] [blame]	280	bool InPPDirective, encoding::Encoding Encoding,
				281	const FormatStyle &Style);
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	282
				283	public:
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	284	bool supportsReflow() const override { return true; }
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	285	unsigned getLineCount() const override;
Krasimir Georgiev	17725d8	2017-03-08 08:55:12 +0000	[diff] [blame]	286	Split getSplit(unsigned LineIndex, unsigned TailOffset, unsigned ColumnLimit,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	287	unsigned ReflowColumn,
Krasimir Georgiev	17725d8	2017-03-08 08:55:12 +0000	[diff] [blame]	288	llvm::Regex &CommentPragmasRegex) const override;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	289	void compressWhitespace(unsigned LineIndex, unsigned TailOffset, Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	290	WhitespaceManager &Whitespaces) const override;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	291
				292	protected:
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	293	// Returns the token containing the line at LineIndex.
				294	const FormatToken &tokenAt(unsigned LineIndex) const;
				295
				296	// Checks if the content of line LineIndex may be reflown with the previous
				297	// line.
Krasimir Georgiev	00c5c72	2017-02-02 15:32:19 +0000	[diff] [blame]	298	virtual bool mayReflow(unsigned LineIndex,
				299	llvm::Regex &CommentPragmasRegex) const = 0;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	300
				301	// Contains the original text of the lines of the block comment.
				302	//
				303	// In case of block comments, excludes the leading /* in the first line and
				304	// trailing */ in the last line. In case of line comments, excludes the
				305	// leading // and spaces.
				306	SmallVector<StringRef, 16> Lines;
				307
				308	// Contains the text of the lines excluding all leading and trailing
				309	// whitespace between the lines. Note that the decoration (if present) is also
				310	// not considered part of the text.
				311	SmallVector<StringRef, 16> Content;
				312
				313	// Tokens[i] contains a reference to the token containing Lines[i] if the
				314	// whitespace range before that token is managed by this block.
				315	// Otherwise, Tokens[i] is a null pointer.
				316	SmallVector<FormatToken *, 16> Tokens;
				317
				318	// ContentColumn[i] is the target column at which Content[i] should be.
				319	// Note that this excludes a leading "* " or "*" in case of block comments
				320	// where all lines have a "*" prefix, or the leading "// " or "//" in case of
				321	// line comments.
				322	//
				323	// In block comments, the first line's target column is always positive. The
				324	// remaining lines' target columns are relative to the first line to allow
				325	// correct indentation of comments in \c WhitespaceManager. Thus they can be
				326	// negative as well (in case the first line needs to be unindented more than
				327	// there's actual whitespace in another line).
				328	SmallVector<int, 16> ContentColumn;
				329
				330	// The intended start column of the first line of text from this section.
				331	unsigned StartColumn;
				332
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	333	// The prefix to use in front of a line that has been reflown up.
				334	// For example, when reflowing the second line after the first here:
				335	// // comment 1
				336	// // comment 2
				337	// we expect:
				338	// // comment 1 comment 2
				339	// and not:
				340	// // comment 1comment 2
				341	StringRef ReflowPrefix = " ";
				342	};
				343
				344	class BreakableBlockComment : public BreakableComment {
				345	public:
Daniel Jasper	7d42f3f	2017-01-31 11:25:01 +0000	[diff] [blame]	346	BreakableBlockComment(const FormatToken &Token, unsigned StartColumn,
				347	unsigned OriginalStartColumn, bool FirstInLine,
				348	bool InPPDirective, encoding::Encoding Encoding,
				349	const FormatStyle &Style);
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	350
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	351	unsigned getRangeLength(unsigned LineIndex, unsigned Offset,
				352	StringRef::size_type Length,
				353	unsigned StartColumn) const override;
				354	unsigned getRemainingLength(unsigned LineIndex, unsigned Offset,
				355	unsigned StartColumn) const override;
				356	unsigned getContentStartColumn(unsigned LineIndex, bool Break) const override;
Craig Topper	fb6b25b	2014-03-15 04:29:04 +0000	[diff] [blame]	357	void insertBreak(unsigned LineIndex, unsigned TailOffset, Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	358	WhitespaceManager &Whitespaces) const override;
				359	Split getReflowSplit(unsigned LineIndex,
Krasimir Georgiev	00c5c72	2017-02-02 15:32:19 +0000	[diff] [blame]	360	llvm::Regex &CommentPragmasRegex) const override;
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	361	void reflow(unsigned LineIndex,
				362	WhitespaceManager &Whitespaces) const override;
Manuel Klimek	7786614	2017-11-17 11:17:15 +0000	[diff] [blame]	363	bool introducesBreakBeforeToken() const override;
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	364	void adaptStartOfLine(unsigned LineIndex,
				365	WhitespaceManager &Whitespaces) const override;
				366	Split getSplitAfterLastLine(unsigned TailOffset) const override;
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	367
Krasimir Georgiev	00c5c72	2017-02-02 15:32:19 +0000	[diff] [blame]	368	bool mayReflow(unsigned LineIndex,
				369	llvm::Regex &CommentPragmasRegex) const override;
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	370
				371	private:
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	372	// Rearranges the whitespace between Lines[LineIndex-1] and Lines[LineIndex].
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	373	//
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	374	// Updates Content[LineIndex-1] and Content[LineIndex] by stripping off
				375	// leading and trailing whitespace.
				376	//
				377	// Sets ContentColumn to the intended column in which the text at
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	378	// Lines[LineIndex] starts (note that the decoration, if present, is not
				379	// considered part of the text).
Alexander Kornienko	ebb43ca	2013-09-05 14:08:34 +0000	[diff] [blame]	380	void adjustWhitespace(unsigned LineIndex, int IndentDelta);
Alexander Kornienko	9e90b62	2013-04-17 17:34:05 +0000	[diff] [blame]	381
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	382	// The column at which the text of a broken line should start.
				383	// Note that an optional decoration would go before that column.
				384	// IndentAtLineBreak is a uniform position for all lines in a block comment,
				385	// regardless of their relative position.
				386	// FIXME: Revisit the decision to do this; the main reason was to support
				387	// patterns like
				388	// /************//
				389	// * Comment
				390	// We could also support such patterns by special casing the first line
				391	// instead.
				392	unsigned IndentAtLineBreak;
				393
Alexander Kornienko	614d96a	2013-07-08 14:12:07 +0000	[diff] [blame]	394	// This is to distinguish between the case when the last line was empty and
				395	// the case when it started with a decoration ("*" or "* ").
				396	bool LastLineNeedsDecoration;
				397
Manuel Klimek	9043c74	2013-05-27 15:23:34 +0000	[diff] [blame]	398	// Either "* " if all lines begin with a "*", or empty.
				399	StringRef Decoration;
Krasimir Georgiev	bb99a36	2017-02-16 12:39:31 +0000	[diff] [blame]	400
				401	// If this block comment has decorations, this is the column of the start of
				402	// the decorations.
				403	unsigned DecorationColumn;
Krasimir Georgiev	22d7e6b	2017-07-20 22:29:39 +0000	[diff] [blame]	404
				405	// If true, make sure that the opening '/*' and the closing '*/' each end up on
				406	// a line of their own. Styles like jsdoc require this for multiline comments.
				407	bool DelimitersOnNewline;
Manuel Klimek	48c930c	2017-12-04 08:53:16 +0000	[diff] [blame^]	408
				409	// Length of the sequence of tokens after this block comment that cannot
				410	// contain line breaks.
				411	unsigned UnbreakableTailLength;
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	412	};
				413
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	414	class BreakableLineCommentSection : public BreakableComment {
				415	public:
Daniel Jasper	7d42f3f	2017-01-31 11:25:01 +0000	[diff] [blame]	416	BreakableLineCommentSection(const FormatToken &Token, unsigned StartColumn,
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	417	unsigned OriginalStartColumn, bool FirstInLine,
				418	bool InPPDirective, encoding::Encoding Encoding,
				419	const FormatStyle &Style);
				420
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	421	unsigned getRangeLength(unsigned LineIndex, unsigned Offset,
				422	StringRef::size_type Length,
				423	unsigned StartColumn) const override;
				424	unsigned getContentStartColumn(unsigned LineIndex, bool Break) const override;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	425	void insertBreak(unsigned LineIndex, unsigned TailOffset, Split Split,
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	426	WhitespaceManager &Whitespaces) const override;
				427	Split getReflowSplit(unsigned LineIndex,
Krasimir Georgiev	00c5c72	2017-02-02 15:32:19 +0000	[diff] [blame]	428	llvm::Regex &CommentPragmasRegex) const override;
Manuel Klimek	93699f4	2017-11-29 14:29:43 +0000	[diff] [blame]	429	void reflow(unsigned LineIndex,
				430	WhitespaceManager &Whitespaces) const override;
				431	void adaptStartOfLine(unsigned LineIndex,
				432	WhitespaceManager &Whitespaces) const override;
Krasimir Georgiev	a7a24bf	2017-03-08 08:58:44 +0000	[diff] [blame]	433	void updateNextToken(LineState &State) const override;
Krasimir Georgiev	00c5c72	2017-02-02 15:32:19 +0000	[diff] [blame]	434	bool mayReflow(unsigned LineIndex,
				435	llvm::Regex &CommentPragmasRegex) const override;
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	436
				437	private:
Krasimir Georgiev	2091a3a	2017-02-08 14:45:19 +0000	[diff] [blame]	438	// OriginalPrefix[i] contains the original prefix of line i, including
				439	// trailing whitespace before the start of the content. The indentation
				440	// preceding the prefix is not included.
				441	// For example, if the line is:
				442	// // content
				443	// then the original prefix is "// ".
				444	SmallVector<StringRef, 16> OriginalPrefix;
				445
Krasimir Georgiev	9183422	2017-01-25 13:58:58 +0000	[diff] [blame]	446	// Prefix[i] contains the intended leading "//" with trailing spaces to
				447	// account for the indentation of content within the comment at line i after
				448	// formatting. It can be different than the original prefix when the original
				449	// line starts like this:
				450	// //content
				451	// Then the original prefix is "//", but the prefix is "// ".
				452	SmallVector<StringRef, 16> Prefix;
				453
				454	SmallVector<unsigned, 16> OriginalContentColumn;
				455
				456	/// \brief The token to which the last line of this breakable token
				457	/// belongs; nullptr if that token is the initial token.
				458	///
				459	/// The distinction is because if the token of the last line of this breakable
				460	/// token is distinct from the initial token, this breakable token owns the
				461	/// whitespace before the token of the last line, and the whitespace manager
				462	/// must be able to modify it.
				463	FormatToken *LastLineTok = nullptr;
				464	};
Alexander Kornienko	cb45bc1	2013-04-15 14:28:00 +0000	[diff] [blame]	465	} // namespace format
				466	} // namespace clang
				467
Benjamin Kramer	2f5db8b	2014-08-13 16:25:19 +0000	[diff] [blame]	468	#endif