Blame - clang/lib/AST/RawCommentList.cpp - toolchain/llvm-project

blob: a8d15036cab99eefd71411aeb1742bff1e035bd4 [file] [log] [blame]

Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	1	//===--- RawCommentList.cpp - Processing raw comments ------------ C++ --===//
				2	//
Chandler Carruth	2946cd7	2019-01-19 08:50:56 +0000	[diff] [blame]	3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
				4	// See https://llvm.org/LICENSE.txt for license information.
				5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	6	//
				7	//===----------------------------------------------------------------------===//
				8
Chandler Carruth	39a3e75	2012-06-20 09:53:52 +0000	[diff] [blame]	9	#include "clang/AST/RawCommentList.h"
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	10	#include "clang/AST/ASTContext.h"
Dmitri Gribenko	a43ec18	2012-08-11 00:51:43 +0000	[diff] [blame]	11	#include "clang/AST/Comment.h"
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	12	#include "clang/AST/CommentBriefParser.h"
Dmitri Gribenko	ca7f80a	2012-08-09 00:03:17 +0000	[diff] [blame]	13	#include "clang/AST/CommentCommandTraits.h"
Chandler Carruth	3a02247	2012-12-04 09:13:33 +0000	[diff] [blame]	14	#include "clang/AST/CommentLexer.h"
				15	#include "clang/AST/CommentParser.h"
				16	#include "clang/AST/CommentSema.h"
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	17	#include "clang/Basic/CharInfo.h"
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	18	#include "llvm/ADT/STLExtras.h"
Reid Kleckner	86565c1	2020-02-27 11:01:58 -0800	[diff] [blame]	19	#include "llvm/Support/Allocator.h"
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	20
				21	using namespace clang;
				22
				23	namespace {
				24	/// Get comment kind and bool describing if it is a trailing comment.
Dmitri Gribenko	e958562	2013-04-26 20:12:49 +0000	[diff] [blame]	25	std::pair<RawComment::CommentKind, bool> getCommentKind(StringRef Comment,
				26	bool ParseAllComments) {
				27	const size_t MinCommentLength = ParseAllComments ? 2 : 3;
				28	if ((Comment.size() < MinCommentLength) \|\| Comment[0] != '/')
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	29	return std::make_pair(RawComment::RCK_Invalid, false);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	30
				31	RawComment::CommentKind K;
				32	if (Comment[1] == '/') {
				33	if (Comment.size() < 3)
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	34	return std::make_pair(RawComment::RCK_OrdinaryBCPL, false);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	35
				36	if (Comment[2] == '/')
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	37	K = RawComment::RCK_BCPLSlash;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	38	else if (Comment[2] == '!')
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	39	K = RawComment::RCK_BCPLExcl;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	40	else
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	41	return std::make_pair(RawComment::RCK_OrdinaryBCPL, false);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	42	} else {
				43	assert(Comment.size() >= 4);
				44
				45	// Comment lexer does not understand escapes in comment markers, so pretend
				46	// that this is not a comment.
				47	if (Comment[1] != '*' \|\|
				48	Comment[Comment.size() - 2] != '*' \|\|
				49	Comment[Comment.size() - 1] != '/')
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	50	return std::make_pair(RawComment::RCK_Invalid, false);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	51
				52	if (Comment[2] == '*')
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	53	K = RawComment::RCK_JavaDoc;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	54	else if (Comment[2] == '!')
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	55	K = RawComment::RCK_Qt;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	56	else
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	57	return std::make_pair(RawComment::RCK_OrdinaryC, false);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	58	}
				59	const bool TrailingComment = (Comment.size() > 3) && (Comment[3] == '<');
				60	return std::make_pair(K, TrailingComment);
				61	}
				62
				63	bool mergedCommentIsTrailingComment(StringRef Comment) {
				64	return (Comment.size() > 3) && (Comment[3] == '<');
				65	}
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	66
				67	/// Returns true if R1 and R2 both have valid locations that start on the same
				68	/// column.
				69	bool commentsStartOnSameColumn(const SourceManager &SM, const RawComment &R1,
				70	const RawComment &R2) {
Stephen Kelly	f2ceec4	2018-08-09 21:08:08 +0000	[diff] [blame]	71	SourceLocation L1 = R1.getBeginLoc();
				72	SourceLocation L2 = R2.getBeginLoc();
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	73	bool Invalid = false;
				74	unsigned C1 = SM.getPresumedColumnNumber(L1, &Invalid);
				75	if (!Invalid) {
				76	unsigned C2 = SM.getPresumedColumnNumber(L2, &Invalid);
				77	return !Invalid && (C1 == C2);
				78	}
				79	return false;
				80	}
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	81	} // unnamed namespace
				82
Adrian Prantl	9fc8faf	2018-05-09 01:00:01 +0000	[diff] [blame]	83	/// Determines whether there is only whitespace in `Buffer` between `P`
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	84	/// and the previous line.
				85	/// \param Buffer The buffer to search in.
				86	/// \param P The offset from the beginning of `Buffer` to start from.
				87	/// \return true if all of the characters in `Buffer` ranging from the closest
				88	/// line-ending character before `P` (or the beginning of `Buffer`) to `P - 1`
				89	/// are whitespace.
				90	static bool onlyWhitespaceOnLineBefore(const char *Buffer, unsigned P) {
				91	// Search backwards until we see linefeed or carriage return.
				92	for (unsigned I = P; I != 0; --I) {
				93	char C = Buffer[I - 1];
				94	if (isVerticalWhitespace(C))
				95	return true;
				96	if (!isHorizontalWhitespace(C))
				97	return false;
				98	}
				99	// We hit the beginning of the buffer.
				100	return true;
				101	}
				102
				103	/// Returns whether `K` is an ordinary comment kind.
				104	static bool isOrdinaryKind(RawComment::CommentKind K) {
				105	return (K == RawComment::RCK_OrdinaryBCPL) \|\|
				106	(K == RawComment::RCK_OrdinaryC);
				107	}
				108
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	109	RawComment::RawComment(const SourceManager &SourceMgr, SourceRange SR,
David L. Jones	13d5a87	2018-03-02 00:07:45 +0000	[diff] [blame]	110	const CommentOptions &CommentOpts, bool Merged) :
Dmitri Gribenko	60c7ec6	2012-06-27 05:48:36 +0000	[diff] [blame]	111	Range(SR), RawTextValid(false), BriefTextValid(false),
David L. Jones	13d5a87	2018-03-02 00:07:45 +0000	[diff] [blame]	112	IsAttached(false), IsTrailingComment(false),
				113	IsAlmostTrailingComment(false) {
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	114	// Extract raw comment text, if possible.
Dmitri Gribenko	fecc2e0	2012-06-21 21:02:45 +0000	[diff] [blame]	115	if (SR.getBegin() == SR.getEnd() \|\| getRawText(SourceMgr).empty()) {
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	116	Kind = RCK_Invalid;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	117	return;
				118	}
				119
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	120	// Guess comment kind.
David L. Jones	13d5a87	2018-03-02 00:07:45 +0000	[diff] [blame]	121	std::pair<CommentKind, bool> K =
				122	getCommentKind(RawText, CommentOpts.ParseAllComments);
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	123
				124	// Guess whether an ordinary comment is trailing.
David L. Jones	13d5a87	2018-03-02 00:07:45 +0000	[diff] [blame]	125	if (CommentOpts.ParseAllComments && isOrdinaryKind(K.first)) {
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	126	FileID BeginFileID;
				127	unsigned BeginOffset;
				128	std::tie(BeginFileID, BeginOffset) =
				129	SourceMgr.getDecomposedLoc(Range.getBegin());
				130	if (BeginOffset != 0) {
				131	bool Invalid = false;
				132	const char *Buffer =
				133	SourceMgr.getBufferData(BeginFileID, &Invalid).data();
				134	IsTrailingComment \|=
				135	(!Invalid && !onlyWhitespaceOnLineBefore(Buffer, BeginOffset));
				136	}
				137	}
				138
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	139	if (!Merged) {
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	140	Kind = K.first;
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	141	IsTrailingComment \|= K.second;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	142
				143	IsAlmostTrailingComment = RawText.startswith("//<") \|\|
				144	RawText.startswith("/*<");
				145	} else {
Abramo Bagnara	e06a888	2012-07-04 07:30:26 +0000	[diff] [blame]	146	Kind = RCK_Merged;
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	147	IsTrailingComment =
				148	IsTrailingComment \|\| mergedCommentIsTrailingComment(RawText);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	149	}
				150	}
				151
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	152	StringRef RawComment::getRawTextSlow(const SourceManager &SourceMgr) const {
				153	FileID BeginFileID;
				154	FileID EndFileID;
				155	unsigned BeginOffset;
				156	unsigned EndOffset;
				157
Benjamin Kramer	867ea1d	2014-03-02 13:01:17 +0000	[diff] [blame]	158	std::tie(BeginFileID, BeginOffset) =
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	159	SourceMgr.getDecomposedLoc(Range.getBegin());
Benjamin Kramer	867ea1d	2014-03-02 13:01:17 +0000	[diff] [blame]	160	std::tie(EndFileID, EndOffset) = SourceMgr.getDecomposedLoc(Range.getEnd());
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	161
				162	const unsigned Length = EndOffset - BeginOffset;
				163	if (Length < 2)
				164	return StringRef();
				165
				166	// The comment can't begin in one file and end in another.
				167	assert(BeginFileID == EndFileID);
				168
				169	bool Invalid = false;
				170	const char *BufferStart = SourceMgr.getBufferData(BeginFileID,
				171	&Invalid).data();
				172	if (Invalid)
				173	return StringRef();
				174
				175	return StringRef(BufferStart + BeginOffset, Length);
				176	}
				177
Dmitri Gribenko	3292d06	2012-07-02 17:35:10 +0000	[diff] [blame]	178	const char *RawComment::extractBriefText(const ASTContext &Context) const {
Justin Bogner	1499413	2016-10-16 20:12:42 +0000	[diff] [blame]	179	// Lazily initialize RawText using the accessor before using it.
				180	(void)getRawText(Context.getSourceManager());
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	181
Dmitri Gribenko	4586df7	2012-07-27 20:37:06 +0000	[diff] [blame]	182	// Since we will be copying the resulting text, all allocations made during
				183	// parsing are garbage after resulting string is formed. Thus we can use
				184	// a separate allocator for all temporary stuff.
				185	llvm::BumpPtrAllocator Allocator;
				186
Fariborz Jahanian	5b63707	2013-05-03 23:15:20 +0000	[diff] [blame]	187	comments::Lexer L(Allocator, Context.getDiagnostics(),
				188	Context.getCommentCommandTraits(),
Dmitri Gribenko	7acbf00	2012-09-10 20:32:42 +0000	[diff] [blame]	189	Range.getBegin(),
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	190	RawText.begin(), RawText.end());
Dmitri Gribenko	7acbf00	2012-09-10 20:32:42 +0000	[diff] [blame]	191	comments::BriefParser P(L, Context.getCommentCommandTraits());
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	192
				193	const std::string Result = P.Parse();
				194	const unsigned BriefTextLength = Result.size();
				195	char *BriefTextPtr = new (Context) char[BriefTextLength + 1];
				196	memcpy(BriefTextPtr, Result.c_str(), BriefTextLength + 1);
Dmitri Gribenko	3292d06	2012-07-02 17:35:10 +0000	[diff] [blame]	197	BriefText = BriefTextPtr;
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	198	BriefTextValid = true;
				199
Dmitri Gribenko	3292d06	2012-07-02 17:35:10 +0000	[diff] [blame]	200	return BriefTextPtr;
Dmitri Gribenko	5188c4b	2012-06-26 20:39:18 +0000	[diff] [blame]	201	}
				202
Dmitri Gribenko	b261088	2012-08-14 17:17:18 +0000	[diff] [blame]	203	comments::FullComment *RawComment::parse(const ASTContext &Context,
Dmitri Gribenko	6743e04	2012-09-29 11:40:46 +0000	[diff] [blame]	204	const Preprocessor *PP,
Dmitri Gribenko	b261088	2012-08-14 17:17:18 +0000	[diff] [blame]	205	const Decl *D) const {
Justin Bogner	1499413	2016-10-16 20:12:42 +0000	[diff] [blame]	206	// Lazily initialize RawText using the accessor before using it.
				207	(void)getRawText(Context.getSourceManager());
Dmitri Gribenko	a43ec18	2012-08-11 00:51:43 +0000	[diff] [blame]	208
Fariborz Jahanian	5b63707	2013-05-03 23:15:20 +0000	[diff] [blame]	209	comments::Lexer L(Context.getAllocator(), Context.getDiagnostics(),
				210	Context.getCommentCommandTraits(),
Dmitri Gribenko	6bab911	2012-08-31 10:35:30 +0000	[diff] [blame]	211	getSourceRange().getBegin(),
Dmitri Gribenko	a43ec18	2012-08-11 00:51:43 +0000	[diff] [blame]	212	RawText.begin(), RawText.end());
				213	comments::Sema S(Context.getAllocator(), Context.getSourceManager(),
Dmitri Gribenko	7acbf00	2012-09-10 20:32:42 +0000	[diff] [blame]	214	Context.getDiagnostics(),
Dmitri Gribenko	6743e04	2012-09-29 11:40:46 +0000	[diff] [blame]	215	Context.getCommentCommandTraits(),
				216	PP);
Dmitri Gribenko	b261088	2012-08-14 17:17:18 +0000	[diff] [blame]	217	S.setDecl(D);
Dmitri Gribenko	a43ec18	2012-08-11 00:51:43 +0000	[diff] [blame]	218	comments::Parser P(L, S, Context.getAllocator(), Context.getSourceManager(),
Dmitri Gribenko	7acbf00	2012-09-10 20:32:42 +0000	[diff] [blame]	219	Context.getDiagnostics(),
				220	Context.getCommentCommandTraits());
Dmitri Gribenko	a43ec18	2012-08-11 00:51:43 +0000	[diff] [blame]	221
Dmitri Gribenko	b261088	2012-08-14 17:17:18 +0000	[diff] [blame]	222	return P.parseFullComment();
Dmitri Gribenko	a43ec18	2012-08-11 00:51:43 +0000	[diff] [blame]	223	}
				224
Benjamin Kramer	20c28be	2013-09-28 15:06:27 +0000	[diff] [blame]	225	static bool onlyWhitespaceBetween(SourceManager &SM,
				226	SourceLocation Loc1, SourceLocation Loc2,
				227	unsigned MaxNewlinesAllowed) {
Dmitri Gribenko	1d0f567	2012-09-09 20:47:31 +0000	[diff] [blame]	228	std::pair<FileID, unsigned> Loc1Info = SM.getDecomposedLoc(Loc1);
				229	std::pair<FileID, unsigned> Loc2Info = SM.getDecomposedLoc(Loc2);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	230
Dmitri Gribenko	1d0f567	2012-09-09 20:47:31 +0000	[diff] [blame]	231	// Question does not make sense if locations are in different files.
				232	if (Loc1Info.first != Loc2Info.first)
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	233	return false;
				234
				235	bool Invalid = false;
Dmitri Gribenko	1d0f567	2012-09-09 20:47:31 +0000	[diff] [blame]	236	const char *Buffer = SM.getBufferData(Loc1Info.first, &Invalid).data();
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	237	if (Invalid)
				238	return false;
				239
Benjamin Kramer	20c28be	2013-09-28 15:06:27 +0000	[diff] [blame]	240	unsigned NumNewlines = 0;
				241	assert(Loc1Info.second <= Loc2Info.second && "Loc1 after Loc2!");
				242	// Look for non-whitespace characters and remember any newlines seen.
				243	for (unsigned I = Loc1Info.second; I != Loc2Info.second; ++I) {
				244	switch (Buffer[I]) {
				245	default:
				246	return false;
				247	case ' ':
				248	case '\t':
				249	case '\f':
				250	case '\v':
				251	break;
				252	case '\r':
				253	case '\n':
				254	++NumNewlines;
				255
				256	// Check if we have found more than the maximum allowed number of
				257	// newlines.
				258	if (NumNewlines > MaxNewlinesAllowed)
				259	return false;
				260
				261	// Collapse \r\n and \n\r into a single newline.
				262	if (I + 1 != Loc2Info.second &&
				263	(Buffer[I + 1] == '\n' \|\| Buffer[I + 1] == '\r') &&
				264	Buffer[I] != Buffer[I + 1])
				265	++I;
				266	break;
				267	}
				268	}
				269
				270	return true;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	271	}
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	272
Dmitri Gribenko	7dd29d4	2012-07-06 18:19:34 +0000	[diff] [blame]	273	void RawCommentList::addComment(const RawComment &RC,
David L. Jones	13d5a87	2018-03-02 00:07:45 +0000	[diff] [blame]	274	const CommentOptions &CommentOpts,
Dmitri Gribenko	7dd29d4	2012-07-06 18:19:34 +0000	[diff] [blame]	275	llvm::BumpPtrAllocator &Allocator) {
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	276	if (RC.isInvalid())
				277	return;
				278
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	279	// Ordinary comments are not interesting for us.
David L. Jones	13d5a87	2018-03-02 00:07:45 +0000	[diff] [blame]	280	if (RC.isOrdinary() && !CommentOpts.ParseAllComments)
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	281	return;
				282
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	283	std::pair<FileID, unsigned> Loc =
				284	SourceMgr.getDecomposedLoc(RC.getBeginLoc());
				285
				286	const FileID CommentFile = Loc.first;
				287	const unsigned CommentOffset = Loc.second;
				288
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	289	// If this is the first Doxygen comment, save it (because there isn't
				290	// anything to merge it with).
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	291	if (OrderedComments[CommentFile].empty()) {
				292	OrderedComments[CommentFile][CommentOffset] =
				293	new (Allocator) RawComment(RC);
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	294	return;
				295	}
				296
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	297	const RawComment &C1 = *OrderedComments[CommentFile].rbegin()->second;
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	298	const RawComment &C2 = RC;
				299
				300	// Merge comments only if there is only whitespace between them.
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	301	// Can't merge trailing and non-trailing comments unless the second is
				302	// non-trailing ordinary in the same column, as in the case:
				303	// int x; // documents x
				304	// // more text
				305	// versus:
				306	// int x; // documents x
				307	// int y; // documents y
				308	// or:
				309	// int x; // documents x
				310	// // documents y
				311	// int y;
Dmitri Gribenko	557a8d5	2012-08-28 01:20:53 +0000	[diff] [blame]	312	// Merge comments if they are on same or consecutive lines.
James Dennett	2def1e8	2015-07-15 19:13:39 +0000	[diff] [blame]	313	if ((C1.isTrailingComment() == C2.isTrailingComment() \|\|
				314	(C1.isTrailingComment() && !C2.isTrailingComment() &&
				315	isOrdinaryKind(C2.getKind()) &&
				316	commentsStartOnSameColumn(SourceMgr, C1, C2))) &&
Stephen Kelly	1c301dc	2018-08-09 21:09:38 +0000	[diff] [blame]	317	onlyWhitespaceBetween(SourceMgr, C1.getEndLoc(), C2.getBeginLoc(),
Benjamin Kramer	20c28be	2013-09-28 15:06:27 +0000	[diff] [blame]	318	/MaxNewlinesAllowed=/1)) {
Stephen Kelly	1c301dc	2018-08-09 21:09:38 +0000	[diff] [blame]	319	SourceRange MergedRange(C1.getBeginLoc(), C2.getEndLoc());
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	320	*OrderedComments[CommentFile].rbegin()->second =
				321	RawComment(SourceMgr, MergedRange, CommentOpts, true);
Benjamin Kramer	20c28be	2013-09-28 15:06:27 +0000	[diff] [blame]	322	} else {
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	323	OrderedComments[CommentFile][CommentOffset] =
				324	new (Allocator) RawComment(RC);
Benjamin Kramer	20c28be	2013-09-28 15:06:27 +0000	[diff] [blame]	325	}
Dmitri Gribenko	aab8383	2012-06-20 00:34:58 +0000	[diff] [blame]	326	}
Dmitri Gribenko	9ee0e30	2014-03-27 15:40:39 +0000	[diff] [blame]	327
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	328	const std::map<unsigned, RawComment >
				329	RawCommentList::getCommentsInFile(FileID File) const {
				330	auto CommentsInFile = OrderedComments.find(File);
				331	if (CommentsInFile == OrderedComments.end())
				332	return nullptr;
Dmitri Gribenko	9ee0e30	2014-03-27 15:40:39 +0000	[diff] [blame]	333
Jan Korous	f31d8df	2019-08-13 18:11:44 +0000	[diff] [blame]	334	return &CommentsInFile->second;
				335	}
				336
				337	bool RawCommentList::empty() const { return OrderedComments.empty(); }
				338
				339	unsigned RawCommentList::getCommentBeginLine(RawComment *C, FileID File,
				340	unsigned Offset) const {
				341	auto Cached = CommentBeginLine.find(C);
				342	if (Cached != CommentBeginLine.end())
				343	return Cached->second;
				344	const unsigned Line = SourceMgr.getLineNumber(File, Offset);
				345	CommentBeginLine[C] = Line;
				346	return Line;
				347	}
				348
				349	unsigned RawCommentList::getCommentEndOffset(RawComment *C) const {
				350	auto Cached = CommentEndOffset.find(C);
				351	if (Cached != CommentEndOffset.end())
				352	return Cached->second;
				353	const unsigned Offset =
				354	SourceMgr.getDecomposedLoc(C->getSourceRange().getEnd()).second;
				355	CommentEndOffset[C] = Offset;
				356	return Offset;
Dmitri Gribenko	9ee0e30	2014-03-27 15:40:39 +0000	[diff] [blame]	357	}
Ilya Biryukov	1ff7c32	2018-05-16 12:30:09 +0000	[diff] [blame]	358
				359	std::string RawComment::getFormattedText(const SourceManager &SourceMgr,
				360	DiagnosticsEngine &Diags) const {
				361	llvm::StringRef CommentText = getRawText(SourceMgr);
				362	if (CommentText.empty())
				363	return "";
				364
				365	llvm::BumpPtrAllocator Allocator;
				366	// We do not parse any commands, so CommentOptions are ignored by
				367	// comments::Lexer. Therefore, we just use default-constructed options.
				368	CommentOptions DefOpts;
				369	comments::CommandTraits EmptyTraits(Allocator, DefOpts);
				370	comments::Lexer L(Allocator, Diags, EmptyTraits, getSourceRange().getBegin(),
				371	CommentText.begin(), CommentText.end(),
				372	/ParseCommands=/false);
				373
				374	std::string Result;
				375	// A column number of the first non-whitespace token in the comment text.
				376	// We skip whitespace up to this column, but keep the whitespace after this
				377	// column. IndentColumn is calculated when lexing the first line and reused
				378	// for the rest of lines.
				379	unsigned IndentColumn = 0;
				380
				381	// Processes one line of the comment and adds it to the result.
				382	// Handles skipping the indent at the start of the line.
				383	// Returns false when eof is reached and true otherwise.
				384	auto LexLine = [&](bool IsFirstLine) -> bool {
				385	comments::Token Tok;
				386	// Lex the first token on the line. We handle it separately, because we to
				387	// fix up its indentation.
				388	L.lex(Tok);
				389	if (Tok.is(comments::tok::eof))
				390	return false;
				391	if (Tok.is(comments::tok::newline)) {
				392	Result += "\n";
				393	return true;
				394	}
				395	llvm::StringRef TokText = L.getSpelling(Tok, SourceMgr);
				396	bool LocInvalid = false;
				397	unsigned TokColumn =
				398	SourceMgr.getSpellingColumnNumber(Tok.getLocation(), &LocInvalid);
				399	assert(!LocInvalid && "getFormattedText for invalid location");
				400
				401	// Amount of leading whitespace in TokText.
				402	size_t WhitespaceLen = TokText.find_first_not_of(" \t");
				403	if (WhitespaceLen == StringRef::npos)
				404	WhitespaceLen = TokText.size();
				405	// Remember the amount of whitespace we skipped in the first line to remove
				406	// indent up to that column in the following lines.
				407	if (IsFirstLine)
				408	IndentColumn = TokColumn + WhitespaceLen;
				409
				410	// Amount of leading whitespace we actually want to skip.
				411	// For the first line we skip all the whitespace.
				412	// For the rest of the lines, we skip whitespace up to IndentColumn.
				413	unsigned SkipLen =
				414	IsFirstLine
				415	? WhitespaceLen
				416	: std::min<size_t>(
				417	WhitespaceLen,
				418	std::max<int>(static_cast<int>(IndentColumn) - TokColumn, 0));
				419	llvm::StringRef Trimmed = TokText.drop_front(SkipLen);
				420	Result += Trimmed;
				421	// Lex all tokens in the rest of the line.
				422	for (L.lex(Tok); Tok.isNot(comments::tok::eof); L.lex(Tok)) {
				423	if (Tok.is(comments::tok::newline)) {
				424	Result += "\n";
				425	return true;
				426	}
				427	Result += L.getSpelling(Tok, SourceMgr);
				428	}
				429	// We've reached the end of file token.
				430	return false;
				431	};
				432
				433	auto DropTrailingNewLines = [](std::string &Str) {
Oliver Bruns	ad7211d	2020-04-06 10:38:30 +0200	[diff] [blame]	434	while (!Str.empty() && Str.back() == '\n')
Ilya Biryukov	1ff7c32	2018-05-16 12:30:09 +0000	[diff] [blame]	435	Str.pop_back();
				436	};
				437
Raphael Isemann	b23ccec	2018-12-10 12:37:46 +0000	[diff] [blame]	438	// Process first line separately to remember indent for the following lines.
Ilya Biryukov	1ff7c32	2018-05-16 12:30:09 +0000	[diff] [blame]	439	if (!LexLine(/IsFirstLine=/true)) {
				440	DropTrailingNewLines(Result);
				441	return Result;
				442	}
				443	// Process the rest of the lines.
				444	while (LexLine(/IsFirstLine=/false))
				445	;
				446	DropTrailingNewLines(Result);
				447	return Result;
				448	}