Blame - lib/Lex/TokenLexer.cpp - platform/external/clang

blob: 0f1004f2b2f766ddee5a97aabe078c57875433e6 [file] [log] [blame]

Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	1	//===--- TokenLexer.cpp - Lex from a token stream -------------------------===//
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	2	//
				3	// The LLVM Compiler Infrastructure
				4	//
Chris Lattner	0bc735f	2007-12-29 19:59:25 +0000	[diff] [blame]	5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	7	//
				8	//===----------------------------------------------------------------------===//
				9	//
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	10	// This file implements the TokenLexer interface.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	11	//
				12	//===----------------------------------------------------------------------===//
				13
Chris Lattner	5d75de0	2008-03-09 02:22:57 +0000	[diff] [blame]	14	#include "clang/Lex/TokenLexer.h"
Chris Lattner	e5c8ffe	2008-03-09 02:55:12 +0000	[diff] [blame]	15	#include "MacroArgs.h"
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	16	#include "clang/Lex/MacroInfo.h"
				17	#include "clang/Lex/Preprocessor.h"
				18	#include "clang/Basic/SourceManager.h"
Chris Lattner	500d329	2009-01-29 05:15:15 +0000	[diff] [blame]	19	#include "clang/Lex/LexDiagnostic.h"
Benjamin Kramer	8fe83e1	2012-02-04 13:45:25 +0000	[diff] [blame]	20	#include "llvm/ADT/SmallString.h"
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	21	using namespace clang;
				22
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	23
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	24	/// Create a TokenLexer for the specified macro with the specified actual
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	25	/// arguments. Note that this ctor takes ownership of the ActualArgs pointer.
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	26	void TokenLexer::Init(Token &Tok, SourceLocation ELEnd, MacroArgs *Actuals) {
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	27	// If the client is reusing a TokenLexer, make sure to free any memory
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	28	// associated with it.
				29	destroy();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	30
Chris Lattner	cc1a875	2007-10-07 08:44:20 +0000	[diff] [blame]	31	Macro = PP.getMacroInfo(Tok.getIdentifierInfo());
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	32	ActualArgs = Actuals;
				33	CurToken = 0;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	34
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	35	ExpandLocStart = Tok.getLocation();
				36	ExpandLocEnd = ELEnd;
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	37	AtStartOfLine = Tok.isAtStartOfLine();
				38	HasLeadingSpace = Tok.hasLeadingSpace();
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	39	Tokens = &*Macro->tokens_begin();
				40	OwnsTokens = false;
Chris Lattner	6b88450	2008-03-10 06:06:04 +0000	[diff] [blame]	41	DisableMacroExpansion = false;
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	42	NumTokens = Macro->tokens_end()-Macro->tokens_begin();
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	43	MacroExpansionStart = SourceLocation();
				44
				45	SourceManager &SM = PP.getSourceManager();
Douglas Gregor	f62d43d	2011-07-19 16:10:42 +0000	[diff] [blame]	46	MacroStartSLocOffset = SM.getNextLocalOffset();
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	47
				48	if (NumTokens > 0) {
				49	assert(Tokens[0].getLocation().isValid());
				50	assert((Tokens[0].getLocation().isFileID() \|\| Tokens[0].is(tok::comment)) &&
				51	"Macro defined in macro?");
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	52	assert(ExpandLocStart.isValid());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	53
				54	// Reserve a source location entry chunk for the length of the macro
				55	// definition. Tokens that get lexed directly from the definition will
				56	// have their locations pointing inside this chunk. This is to avoid
				57	// creating separate source location entries for each token.
Argyrios Kyrtzidis	499ea55	2011-08-23 21:02:38 +0000	[diff] [blame]	58	MacroDefStart = SM.getExpansionLoc(Tokens[0].getLocation());
				59	MacroDefLength = Macro->getDefinitionLength(SM);
				60	MacroExpansionStart = SM.createExpansionLoc(MacroDefStart,
Chandler Carruth	bf340e4	2011-07-26 03:03:05 +0000	[diff] [blame]	61	ExpandLocStart,
				62	ExpandLocEnd,
Argyrios Kyrtzidis	499ea55	2011-08-23 21:02:38 +0000	[diff] [blame]	63	MacroDefLength);
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	64	}
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	65
				66	// If this is a function-like macro, expand the arguments and change
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	67	// Tokens to point to the expanded tokens.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	68	if (Macro->isFunctionLike() && Macro->getNumArgs())
				69	ExpandFunctionArguments();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	70
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	71	// Mark the macro as currently disabled, so that it is not recursively
				72	// expanded. The macro must be disabled only after argument pre-expansion of
				73	// function-like macro arguments occurs.
				74	Macro->DisableMacro();
				75	}
				76
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	77
				78
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	79	/// Create a TokenLexer for the specified token stream. This does not
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	80	/// take ownership of the specified token vector.
Chris Lattner	6b88450	2008-03-10 06:06:04 +0000	[diff] [blame]	81	void TokenLexer::Init(const Token *TokArray, unsigned NumToks,
				82	bool disableMacroExpansion, bool ownsTokens) {
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	83	// If the client is reusing a TokenLexer, make sure to free any memory
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	84	// associated with it.
				85	destroy();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	86
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	87	Macro = 0;
				88	ActualArgs = 0;
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	89	Tokens = TokArray;
Chris Lattner	6b88450	2008-03-10 06:06:04 +0000	[diff] [blame]	90	OwnsTokens = ownsTokens;
				91	DisableMacroExpansion = disableMacroExpansion;
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	92	NumTokens = NumToks;
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	93	CurToken = 0;
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	94	ExpandLocStart = ExpandLocEnd = SourceLocation();
Chris Lattner	9594acf	2007-07-15 00:25:26 +0000	[diff] [blame]	95	AtStartOfLine = false;
				96	HasLeadingSpace = false;
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	97	MacroExpansionStart = SourceLocation();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	98
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	99	// Set HasLeadingSpace/AtStartOfLine so that the first token will be
				100	// returned unmodified.
				101	if (NumToks != 0) {
				102	AtStartOfLine = TokArray[0].isAtStartOfLine();
				103	HasLeadingSpace = TokArray[0].hasLeadingSpace();
				104	}
				105	}
				106
				107
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	108	void TokenLexer::destroy() {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	109	// If this was a function-like macro that actually uses its arguments, delete
				110	// the expanded tokens.
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	111	if (OwnsTokens) {
				112	delete [] Tokens;
				113	Tokens = 0;
Chris Lattner	32fca72	2009-03-04 06:50:57 +0000	[diff] [blame]	114	OwnsTokens = false;
Chris Lattner	9c68306	2007-07-22 01:16:55 +0000	[diff] [blame]	115	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	116
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	117	// TokenLexer owns its formal arguments.
Chris Lattner	561395b	2009-12-14 22:12:52 +0000	[diff] [blame]	118	if (ActualArgs) ActualArgs->destroy(PP);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	119	}
				120
				121	/// Expand the arguments of a function-like macro so that we can quickly
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	122	/// return preexpanded tokens from Tokens.
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	123	void TokenLexer::ExpandFunctionArguments() {
Argyrios Kyrtzidis	0fd9c48	2011-07-07 03:40:37 +0000	[diff] [blame]	124
Chris Lattner	5f9e272	2011-07-23 10:55:15 +0000	[diff] [blame]	125	SmallVector<Token, 128> ResultToks;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	126
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	127	// Loop through 'Tokens', expanding them into ResultToks. Keep
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	128	// track of whether we change anything. If not, no need to keep them. If so,
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	129	// we install the newly expanded sequence as the new 'Tokens' list.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	130	bool MadeChange = false;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	131
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	132	// NextTokGetsSpace - When this is true, the next token appended to the
				133	// output list will get a leading space, regardless of whether it had one to
				134	// begin with or not. This is used for placemarker support.
				135	bool NextTokGetsSpace = false;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	136
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	137	for (unsigned i = 0, e = NumTokens; i != e; ++i) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	138	// If we found the stringify operator, get the argument stringified. The
				139	// preprocessor already verified that the following token is a macro name
				140	// when the #define was parsed.
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	141	const Token &CurTok = Tokens[i];
Chris Lattner	22f6bbc	2007-10-09 18:02:16 +0000	[diff] [blame]	142	if (CurTok.is(tok::hash) \|\| CurTok.is(tok::hashat)) {
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	143	int ArgNo = Macro->getArgumentNum(Tokens[i+1].getIdentifierInfo());
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	144	assert(ArgNo != -1 && "Token following # is not an argument?");
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	145
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	146	SourceLocation ExpansionLocStart =
Argyrios Kyrtzidis	c0069d8	2011-08-23 21:02:32 +0000	[diff] [blame]	147	getExpansionLocForMacroDefLoc(CurTok.getLocation());
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	148	SourceLocation ExpansionLocEnd =
				149	getExpansionLocForMacroDefLoc(Tokens[i+1].getLocation());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	150
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	151	Token Res;
Chris Lattner	22f6bbc	2007-10-09 18:02:16 +0000	[diff] [blame]	152	if (CurTok.is(tok::hash)) // Stringify
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	153	Res = ActualArgs->getStringifiedArgument(ArgNo, PP,
				154	ExpansionLocStart,
				155	ExpansionLocEnd);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	156	else {
				157	// 'charify': don't bother caching these.
Chris Lattner	e5c8ffe	2008-03-09 02:55:12 +0000	[diff] [blame]	158	Res = MacroArgs::StringifyArgument(ActualArgs->getUnexpArgument(ArgNo),
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	159	PP, true,
				160	ExpansionLocStart,
				161	ExpansionLocEnd);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	162	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	163
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	164	// The stringified/charified string leading space flag gets set to match
				165	// the #/#@ operator.
				166	if (CurTok.hasLeadingSpace() \|\| NextTokGetsSpace)
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	167	Res.setFlag(Token::LeadingSpace);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	168
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	169	ResultToks.push_back(Res);
				170	MadeChange = true;
				171	++i; // Skip arg name.
				172	NextTokGetsSpace = false;
				173	continue;
				174	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	175
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	176	// Otherwise, if this is not an argument token, just add the token to the
				177	// output buffer.
				178	IdentifierInfo *II = CurTok.getIdentifierInfo();
				179	int ArgNo = II ? Macro->getArgumentNum(II) : -1;
				180	if (ArgNo == -1) {
				181	// This isn't an argument, just add it.
				182	ResultToks.push_back(CurTok);
				183
				184	if (NextTokGetsSpace) {
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	185	ResultToks.back().setFlag(Token::LeadingSpace);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	186	NextTokGetsSpace = false;
				187	}
				188	continue;
				189	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	190
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	191	// An argument is expanded somehow, the result is different than the
				192	// input.
				193	MadeChange = true;
				194
				195	// Otherwise, this is a use of the argument. Find out if there is a paste
				196	// (##) operator before or after the argument.
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	197	bool PasteBefore =
Argyrios Kyrtzidis	3582a6c	2011-07-07 18:04:47 +0000	[diff] [blame]	198	!ResultToks.empty() && ResultToks.back().is(tok::hashhash);
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	199	bool PasteAfter = i+1 != e && Tokens[i+1].is(tok::hashhash);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	200
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	201	// If it is not the LHS/RHS of a ## operator, we must pre-expand the
				202	// argument and substitute the expanded tokens into the result. This is
				203	// C99 6.10.3.1p1.
				204	if (!PasteBefore && !PasteAfter) {
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	205	const Token *ResultArgToks;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	206
				207	// Only preexpand the argument if it could possibly need it. This
				208	// avoids some work in common cases.
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	209	const Token *ArgTok = ActualArgs->getUnexpArgument(ArgNo);
Chris Lattner	cc1a875	2007-10-07 08:44:20 +0000	[diff] [blame]	210	if (ActualArgs->ArgNeedsPreexpansion(ArgTok, PP))
Chris Lattner	f5809a7	2009-12-28 06:17:16 +0000	[diff] [blame]	211	ResultArgToks = &ActualArgs->getPreExpArgument(ArgNo, Macro, PP)[0];
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	212	else
				213	ResultArgToks = ArgTok; // Use non-preexpanded tokens.
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	214
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	215	// If the arg token expanded into anything, append it.
Chris Lattner	22f6bbc	2007-10-09 18:02:16 +0000	[diff] [blame]	216	if (ResultArgToks->isNot(tok::eof)) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	217	unsigned FirstResult = ResultToks.size();
				218	unsigned NumToks = MacroArgs::getArgLength(ResultArgToks);
				219	ResultToks.append(ResultArgToks, ResultArgToks+NumToks);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	220
Argyrios Kyrtzidis	3582a6c	2011-07-07 18:04:47 +0000	[diff] [blame]	221	// If the '##' came from expanding an argument, turn it into 'unknown'
				222	// to avoid pasting.
				223	for (unsigned i = FirstResult, e = ResultToks.size(); i != e; ++i) {
				224	Token &Tok = ResultToks[i];
				225	if (Tok.is(tok::hashhash))
				226	Tok.setKind(tok::unknown);
				227	}
				228
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	229	if(ExpandLocStart.isValid()) {
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	230	updateLocForMacroArgTokens(CurTok.getLocation(),
				231	ResultToks.begin()+FirstResult,
				232	ResultToks.end());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	233	}
				234
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	235	// If any tokens were substituted from the argument, the whitespace
				236	// before the first token should match the whitespace of the arg
				237	// identifier.
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	238	ResultToks[FirstResult].setFlagValue(Token::LeadingSpace,
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	239	CurTok.hasLeadingSpace() \|\|
				240	NextTokGetsSpace);
				241	NextTokGetsSpace = false;
				242	} else {
				243	// If this is an empty argument, and if there was whitespace before the
				244	// formal token, make sure the next token gets whitespace before it.
				245	NextTokGetsSpace = CurTok.hasLeadingSpace();
				246	}
				247	continue;
				248	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	249
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	250	// Okay, we have a token that is either the LHS or RHS of a paste (##)
				251	// argument. It gets substituted as its non-pre-expanded tokens.
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	252	const Token *ArgToks = ActualArgs->getUnexpArgument(ArgNo);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	253	unsigned NumToks = MacroArgs::getArgLength(ArgToks);
				254	if (NumToks) { // Not an empty argument?
Richard Smith	9f728cd	2012-06-22 23:59:08 +0000	[diff] [blame^]	255	// If this is the GNU ", ## __VA_ARGS__" extension, and we just learned
				256	// that __VA_ARGS__ expands to multiple tokens, avoid a pasting error when
				257	// the expander trys to paste ',' with the first token of the __VA_ARGS__
Chris Lattner	71a3a8d	2008-01-29 07:54:23 +0000	[diff] [blame]	258	// expansion.
				259	if (PasteBefore && ResultToks.size() >= 2 &&
				260	ResultToks[ResultToks.size()-2].is(tok::comma) &&
				261	(unsigned)ArgNo == Macro->getNumArgs()-1 &&
				262	Macro->isVariadic()) {
				263	// Remove the paste operator, report use of the extension.
				264	PP.Diag(ResultToks.back().getLocation(), diag::ext_paste_comma);
				265	ResultToks.pop_back();
				266	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	267
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	268	ResultToks.append(ArgToks, ArgToks+NumToks);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	269
Argyrios Kyrtzidis	3582a6c	2011-07-07 18:04:47 +0000	[diff] [blame]	270	// If the '##' came from expanding an argument, turn it into 'unknown'
				271	// to avoid pasting.
				272	for (unsigned i = ResultToks.size() - NumToks, e = ResultToks.size();
				273	i != e; ++i) {
				274	Token &Tok = ResultToks[i];
				275	if (Tok.is(tok::hashhash))
				276	Tok.setKind(tok::unknown);
				277	}
				278
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	279	if (ExpandLocStart.isValid()) {
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	280	updateLocForMacroArgTokens(CurTok.getLocation(),
				281	ResultToks.end()-NumToks, ResultToks.end());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	282	}
				283
Chris Lattner	442a661	2009-05-25 16:23:08 +0000	[diff] [blame]	284	// If this token (the macro argument) was supposed to get leading
				285	// whitespace, transfer this information onto the first token of the
				286	// expansion.
				287	//
				288	// Do not do this if the paste operator occurs before the macro argument,
				289	// as in "A ## MACROARG". In valid code, the first token will get
				290	// smooshed onto the preceding one anyway (forming AMACROARG). In
				291	// assembler-with-cpp mode, invalid pastes are allowed through: in this
				292	// case, we do not want the extra whitespace to be added. For example,
				293	// we want ". ## foo" -> ".foo" not ". foo".
				294	if ((CurTok.hasLeadingSpace() \|\| NextTokGetsSpace) &&
				295	!PasteBefore)
				296	ResultToks[ResultToks.size()-NumToks].setFlag(Token::LeadingSpace);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	297
Chris Lattner	442a661	2009-05-25 16:23:08 +0000	[diff] [blame]	298	NextTokGetsSpace = false;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	299	continue;
				300	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	301
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	302	// If an empty argument is on the LHS or RHS of a paste, the standard (C99
				303	// 6.10.3.3p2,3) calls for a bunch of placemarker stuff to occur. We
				304	// implement this by eating ## operators when a LHS or RHS expands to
				305	// empty.
				306	NextTokGetsSpace \|= CurTok.hasLeadingSpace();
				307	if (PasteAfter) {
				308	// Discard the argument token and skip (don't copy to the expansion
				309	// buffer) the paste operator after it.
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	310	NextTokGetsSpace \|= Tokens[i+1].hasLeadingSpace();
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	311	++i;
				312	continue;
				313	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	314
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	315	// If this is on the RHS of a paste operator, we've already copied the
				316	// paste operator to the ResultToks list. Remove it.
Chris Lattner	22f6bbc	2007-10-09 18:02:16 +0000	[diff] [blame]	317	assert(PasteBefore && ResultToks.back().is(tok::hashhash));
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	318	NextTokGetsSpace \|= ResultToks.back().hasLeadingSpace();
				319	ResultToks.pop_back();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	320
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	321	// If this is the __VA_ARGS__ token, and if the argument wasn't provided,
				322	// and if the macro had at least one real argument, and if the token before
				323	// the ## was a comma, remove the comma.
				324	if ((unsigned)ArgNo == Macro->getNumArgs()-1 && // is __VA_ARGS__
				325	ActualArgs->isVarargsElidedUse() && // Argument elided.
Chris Lattner	22f6bbc	2007-10-09 18:02:16 +0000	[diff] [blame]	326	!ResultToks.empty() && ResultToks.back().is(tok::comma)) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	327	// Never add a space, even if the comma, ##, or arg had a space.
				328	NextTokGetsSpace = false;
Chris Lattner	71a3a8d	2008-01-29 07:54:23 +0000	[diff] [blame]	329	// Remove the paste operator, report use of the extension.
				330	PP.Diag(ResultToks.back().getLocation(), diag::ext_paste_comma);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	331	ResultToks.pop_back();
Chris Lattner	496af57	2010-08-21 00:27:00 +0000	[diff] [blame]	332
				333	// If the comma was right after another paste (e.g. "X##,##__VA_ARGS__"),
				334	// then removal of the comma should produce a placemarker token (in C99
				335	// terms) which we model by popping off the previous ##, giving us a plain
				336	// "X" when __VA_ARGS__ is empty.
				337	if (!ResultToks.empty() && ResultToks.back().is(tok::hashhash))
				338	ResultToks.pop_back();
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	339	}
				340	continue;
				341	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	342
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	343	// If anything changed, install this as the new Tokens list.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	344	if (MadeChange) {
Chris Lattner	32fca72	2009-03-04 06:50:57 +0000	[diff] [blame]	345	assert(!OwnsTokens && "This would leak if we already own the token list");
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	346	// This is deleted in the dtor.
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	347	NumTokens = ResultToks.size();
Argyrios Kyrtzidis	5b3284a	2011-06-29 22:20:11 +0000	[diff] [blame]	348	// The tokens will be added to Preprocessor's cache and will be removed
				349	// when this TokenLexer finishes lexing them.
				350	Tokens = PP.cacheMacroExpandedTokens(this, ResultToks);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	351
Argyrios Kyrtzidis	5b3284a	2011-06-29 22:20:11 +0000	[diff] [blame]	352	// The preprocessor cache of macro expanded tokens owns these tokens,not us.
Chris Lattner	32fca72	2009-03-04 06:50:57 +0000	[diff] [blame]	353	OwnsTokens = false;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	354	}
				355	}
				356
				357	/// Lex - Lex and return a token from this macro stream.
				358	///
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	359	void TokenLexer::Lex(Token &Tok) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	360	// Lexing off the end of the macro, pop this macro off the expansion stack.
				361	if (isAtEnd()) {
				362	// If this is a macro (not a token stream), mark the macro enabled now
				363	// that it is no longer being expanded.
				364	if (Macro) Macro->EnableMacro();
				365
				366	// Pop this context off the preprocessors lexer stack and get the next
				367	// token. This will delete "this" so remember the PP instance var.
				368	Preprocessor &PPCache = PP;
Chris Lattner	fde2bf9	2008-03-09 03:04:16 +0000	[diff] [blame]	369	if (PP.HandleEndOfTokenLexer(Tok))
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	370	return;
				371
Chris Lattner	fde2bf9	2008-03-09 03:04:16 +0000	[diff] [blame]	372	// HandleEndOfTokenLexer may not return a token. If it doesn't, lex
				373	// whatever is next.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	374	return PPCache.Lex(Tok);
				375	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	376
Argyrios Kyrtzidis	0fd9c48	2011-07-07 03:40:37 +0000	[diff] [blame]	377	SourceManager &SM = PP.getSourceManager();
				378
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	379	// If this is the first token of the expanded result, we inherit spacing
				380	// properties later.
				381	bool isFirstToken = CurToken == 0;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	382
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	383	// Get the next token to return.
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	384	Tok = Tokens[CurToken++];
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	385
Chris Lattner	332ee08	2009-04-19 20:29:42 +0000	[diff] [blame]	386	bool TokenIsFromPaste = false;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	387
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	388	// If this token is followed by a token paste (##) operator, paste the tokens!
Chris Lattner	b11e43c	2011-06-14 18:19:37 +0000	[diff] [blame]	389	// Note that ## is a normal token when not expanding a macro.
Argyrios Kyrtzidis	3582a6c	2011-07-07 18:04:47 +0000	[diff] [blame]	390	if (!isAtEnd() && Tokens[CurToken].is(tok::hashhash) && Macro) {
Chris Lattner	04f2bd8	2009-12-04 06:14:03 +0000	[diff] [blame]	391	// When handling the microsoft /##/ extension, the final token is
				392	// returned by PasteTokens, not the pasted token.
				393	if (PasteTokens(Tok))
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	394	return;
Kovarththanan Rajaratnam	65cc1e8	2010-03-13 08:53:33 +0000	[diff] [blame]	395
Chris Lattner	04f2bd8	2009-12-04 06:14:03 +0000	[diff] [blame]	396	TokenIsFromPaste = true;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	397	}
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	398
				399	// The token's current location indicate where the token was lexed from. We
				400	// need this information to compute the spelling of the token, but any
				401	// diagnostics for the expanded token should appear as if they came from
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	402	// ExpansionLoc. Pull this information together into a new SourceLocation
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	403	// that captures all of this.
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	404	if (ExpandLocStart.isValid() && // Don't do this for token streams.
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	405	// Check that the token's location was not already set properly.
Argyrios Kyrtzidis	5d579e7	2011-08-23 21:02:35 +0000	[diff] [blame]	406	SM.isBeforeInSLocAddrSpace(Tok.getLocation(), MacroStartSLocOffset)) {
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	407	SourceLocation instLoc;
				408	if (Tok.is(tok::comment)) {
Chandler Carruth	bf340e4	2011-07-26 03:03:05 +0000	[diff] [blame]	409	instLoc = SM.createExpansionLoc(Tok.getLocation(),
				410	ExpandLocStart,
				411	ExpandLocEnd,
				412	Tok.getLength());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	413	} else {
Argyrios Kyrtzidis	ec3b538	2011-08-19 22:34:14 +0000	[diff] [blame]	414	instLoc = getExpansionLocForMacroDefLoc(Tok.getLocation());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	415	}
				416
				417	Tok.setLocation(instLoc);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	418	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	419
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	420	// If this is the first token, set the lexical properties of the token to
				421	// match the lexical properties of the macro identifier.
				422	if (isFirstToken) {
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	423	Tok.setFlagValue(Token::StartOfLine , AtStartOfLine);
				424	Tok.setFlagValue(Token::LeadingSpace, HasLeadingSpace);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	425	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	426
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	427	// Handle recursive expansion!
Argyrios Kyrtzidis	6f421f9	2009-05-22 21:09:31 +0000	[diff] [blame]	428	if (!Tok.isAnnotation() && Tok.getIdentifierInfo() != 0) {
Chris Lattner	863c486	2009-01-23 18:35:48 +0000	[diff] [blame]	429	// Change the kind of this identifier to the appropriate token kind, e.g.
				430	// turning "for" into a keyword.
Argyrios Kyrtzidis	6f421f9	2009-05-22 21:09:31 +0000	[diff] [blame]	431	IdentifierInfo *II = Tok.getIdentifierInfo();
Chris Lattner	863c486	2009-01-23 18:35:48 +0000	[diff] [blame]	432	Tok.setKind(II->getTokenID());
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	433
Chris Lattner	332ee08	2009-04-19 20:29:42 +0000	[diff] [blame]	434	// If this identifier was poisoned and from a paste, emit an error. This
				435	// won't be handled by Preprocessor::HandleIdentifier because this is coming
				436	// from a macro expansion.
				437	if (II->isPoisoned() && TokenIsFromPaste) {
John Wiegley	28bbe4b	2011-04-28 01:08:34 +0000	[diff] [blame]	438	PP.HandlePoisonedIdentifier(Tok);
Chris Lattner	332ee08	2009-04-19 20:29:42 +0000	[diff] [blame]	439	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	440
Chris Lattner	863c486	2009-01-23 18:35:48 +0000	[diff] [blame]	441	if (!DisableMacroExpansion && II->isHandleIdentifierCase())
				442	PP.HandleIdentifier(Tok);
				443	}
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	444
				445	// Otherwise, return a normal token.
				446	}
				447
				448	/// PasteTokens - Tok is the LHS of a ## operator, and CurToken is the ##
				449	/// operator. Read the ## and RHS, and paste the LHS/RHS together. If there
Nico Weber	48002c8	2008-09-29 00:25:48 +0000	[diff] [blame]	450	/// are more ## after it, chomp them iteratively. Return the result as Tok.
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	451	/// If this returns true, the caller should immediately return the token.
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	452	bool TokenLexer::PasteTokens(Token &Tok) {
Dylan Noblesmith	f7ccbad	2012-02-05 02:13:05 +0000	[diff] [blame]	453	SmallString<128> Buffer;
Chris Lattner	47246be	2009-01-26 19:29:26 +0000	[diff] [blame]	454	const char *ResultTokStrPtr = 0;
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	455	SourceLocation StartLoc = Tok.getLocation();
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	456	SourceLocation PasteOpLoc;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	457	do {
				458	// Consume the ## operator.
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	459	PasteOpLoc = Tokens[CurToken].getLocation();
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	460	++CurToken;
				461	assert(!isAtEnd() && "No token on the RHS of a paste operator!");
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	462
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	463	// Get the RHS token.
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	464	const Token &RHS = Tokens[CurToken];
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	465
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	466	// Allocate space for the result token. This is guaranteed to be enough for
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	467	// the two tokens.
				468	Buffer.resize(Tok.getLength() + RHS.getLength());
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	469
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	470	// Get the spelling of the LHS token in Buffer.
				471	const char *BufPtr = &Buffer[0];
Douglas Gregor	453091c	2010-03-16 22:30:13 +0000	[diff] [blame]	472	bool Invalid = false;
				473	unsigned LHSLen = PP.getSpelling(Tok, BufPtr, &Invalid);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	474	if (BufPtr != &Buffer[0]) // Really, we want the chars in Buffer!
				475	memcpy(&Buffer[0], BufPtr, LHSLen);
Douglas Gregor	453091c	2010-03-16 22:30:13 +0000	[diff] [blame]	476	if (Invalid)
				477	return true;
				478
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	479	BufPtr = &Buffer[LHSLen];
Douglas Gregor	453091c	2010-03-16 22:30:13 +0000	[diff] [blame]	480	unsigned RHSLen = PP.getSpelling(RHS, BufPtr, &Invalid);
				481	if (Invalid)
				482	return true;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	483	if (BufPtr != &Buffer[LHSLen]) // Really, we want the chars in Buffer!
				484	memcpy(&Buffer[LHSLen], BufPtr, RHSLen);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	485
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	486	// Trim excess space.
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	487	Buffer.resize(LHSLen+RHSLen);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	488
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	489	// Plop the pasted result (including the trailing newline and null) into a
				490	// scratch buffer where we can lex it.
Chris Lattner	47246be	2009-01-26 19:29:26 +0000	[diff] [blame]	491	Token ResultTokTmp;
				492	ResultTokTmp.startToken();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	493
Chris Lattner	47246be	2009-01-26 19:29:26 +0000	[diff] [blame]	494	// Claim that the tmp token is a string_literal so that we can get the
Chris Lattner	917f143	2009-12-23 21:29:53 +0000	[diff] [blame]	495	// character pointer back from CreateString in getLiteralData().
Chris Lattner	47246be	2009-01-26 19:29:26 +0000	[diff] [blame]	496	ResultTokTmp.setKind(tok::string_literal);
				497	PP.CreateString(&Buffer[0], Buffer.size(), ResultTokTmp);
				498	SourceLocation ResultTokLoc = ResultTokTmp.getLocation();
				499	ResultTokStrPtr = ResultTokTmp.getLiteralData();
				500
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	501	// Lex the resultant pasted token into Result.
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	502	Token Result;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	503
Abramo Bagnara	c4bf2b9	2010-12-22 08:23:18 +0000	[diff] [blame]	504	if (Tok.isAnyIdentifier() && RHS.isAnyIdentifier()) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	505	// Common paste case: identifier+identifier = identifier. Avoid creating
				506	// a lexer and other overhead.
				507	PP.IncrementPasteCounter(true);
				508	Result.startToken();
Abramo Bagnara	c4bf2b9	2010-12-22 08:23:18 +0000	[diff] [blame]	509	Result.setKind(tok::raw_identifier);
				510	Result.setRawIdentifierData(ResultTokStrPtr);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	511	Result.setLocation(ResultTokLoc);
				512	Result.setLength(LHSLen+RHSLen);
				513	} else {
				514	PP.IncrementPasteCounter(false);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	515
Chris Lattner	bcc2a67	2009-01-19 06:46:35 +0000	[diff] [blame]	516	assert(ResultTokLoc.isFileID() &&
				517	"Should be a raw location into scratch buffer");
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	518	SourceManager &SourceMgr = PP.getSourceManager();
Chris Lattner	47246be	2009-01-26 19:29:26 +0000	[diff] [blame]	519	FileID LocFileID = SourceMgr.getFileID(ResultTokLoc);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	520
Douglas Gregor	f715ca1	2010-03-16 00:06:06 +0000	[diff] [blame]	521	bool Invalid = false;
Douglas Gregor	aea67db	2010-03-15 22:54:52 +0000	[diff] [blame]	522	const char *ScratchBufStart
Benjamin Kramer	f6ac97b	2010-03-16 14:14:31 +0000	[diff] [blame]	523	= SourceMgr.getBufferData(LocFileID, &Invalid).data();
Douglas Gregor	f715ca1	2010-03-16 00:06:06 +0000	[diff] [blame]	524	if (Invalid)
Douglas Gregor	aea67db	2010-03-15 22:54:52 +0000	[diff] [blame]	525	return false;
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	526
Chris Lattner	bcc2a67	2009-01-19 06:46:35 +0000	[diff] [blame]	527	// Make a lexer to lex this string from. Lex just this one token.
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	528	// Make a lexer object so that we lex and expand the paste result.
Chris Lattner	47246be	2009-01-26 19:29:26 +0000	[diff] [blame]	529	Lexer TL(SourceMgr.getLocForStartOfFile(LocFileID),
David Blaikie	4e4d084	2012-03-11 07:00:24 +0000	[diff] [blame]	530	PP.getLangOpts(), ScratchBufStart,
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	531	ResultTokStrPtr, ResultTokStrPtr+LHSLen+RHSLen);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	532
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	533	// Lex a token in raw mode. This way it won't look up identifiers
				534	// automatically, lexing off the end will return an eof token, and
				535	// warnings are disabled. This returns true if the result token is the
				536	// entire buffer.
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	537	bool isInvalid = !TL.LexFromRawLexer(Result);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	538
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	539	// If we got an EOF token, we didn't form even ONE token. For example, we
				540	// did "/ ## /" to get "//".
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	541	isInvalid \|= Result.is(tok::eof);
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	542
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	543	// If pasting the two tokens didn't form a full new token, this is an
				544	// error. This occurs with "x ## +" and other stuff. Return with Tok
				545	// unmodified and with RHS as the next token to lex.
				546	if (isInvalid) {
				547	// Test for the Microsoft extension of /##/ turning into // here on the
				548	// error path.
David Blaikie	4e4d084	2012-03-11 07:00:24 +0000	[diff] [blame]	549	if (PP.getLangOpts().MicrosoftExt && Tok.is(tok::slash) &&
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	550	RHS.is(tok::slash)) {
				551	HandleMicrosoftCommentPaste(Tok);
				552	return true;
				553	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	554
Chris Lattner	920bf45	2010-07-17 16:24:30 +0000	[diff] [blame]	555	// Do not emit the error when preprocessing assembler code.
David Blaikie	4e4d084	2012-03-11 07:00:24 +0000	[diff] [blame]	556	if (!PP.getLangOpts().AsmPreprocessor) {
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	557	// Explicitly convert the token location to have proper expansion
Chris Lattner	3c17b8a	2009-05-28 05:39:39 +0000	[diff] [blame]	558	// information so that the user knows where it came from.
				559	SourceManager &SM = PP.getSourceManager();
Chris Lattner	b11e43c	2011-06-14 18:19:37 +0000	[diff] [blame]	560	SourceLocation Loc =
Chandler Carruth	bf340e4	2011-07-26 03:03:05 +0000	[diff] [blame]	561	SM.createExpansionLoc(PasteOpLoc, ExpandLocStart, ExpandLocEnd, 2);
Chris Lattner	920bf45	2010-07-17 16:24:30 +0000	[diff] [blame]	562	// If we're in microsoft extensions mode, downgrade this from a hard
				563	// error to a warning that defaults to an error. This allows
				564	// disabling it.
				565	PP.Diag(Loc,
David Blaikie	4e4d084	2012-03-11 07:00:24 +0000	[diff] [blame]	566	PP.getLangOpts().MicrosoftExt ? diag::err_pp_bad_paste_ms
Francois Pichet	62ec1f2	2011-09-17 17:15:52 +0000	[diff] [blame]	567	: diag::err_pp_bad_paste)
Benjamin Kramer	476d8b8	2010-08-11 14:47:12 +0000	[diff] [blame]	568	<< Buffer.str();
Chris Lattner	3c17b8a	2009-05-28 05:39:39 +0000	[diff] [blame]	569	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	570
Richard Smith	c5f7459	2012-06-13 19:02:56 +0000	[diff] [blame]	571	// An error has occurred so exit loop.
				572	break;
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	573	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	574
Chris Lattner	1fa4953	2009-03-08 08:08:45 +0000	[diff] [blame]	575	// Turn ## into 'unknown' to avoid # ## # from looking like a paste
				576	// operator.
				577	if (Result.is(tok::hashhash))
				578	Result.setKind(tok::unknown);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	579	}
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	580
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	581	// Transfer properties of the LHS over the the Result.
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	582	Result.setFlagValue(Token::StartOfLine , Tok.isAtStartOfLine());
				583	Result.setFlagValue(Token::LeadingSpace, Tok.hasLeadingSpace());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	584
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	585	// Finally, replace LHS with the result, consume the RHS, and iterate.
				586	++CurToken;
				587	Tok = Result;
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	588	} while (!isAtEnd() && Tokens[CurToken].is(tok::hashhash));
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	589
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	590	SourceLocation EndLoc = Tokens[CurToken - 1].getLocation();
				591
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	592	// The token's current location indicate where the token was lexed from. We
				593	// need this information to compute the spelling of the token, but any
				594	// diagnostics for the expanded token should appear as if the token was
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	595	// expanded from the full ## expression. Pull this information together into
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	596	// a new SourceLocation that captures all of this.
Argyrios Kyrtzidis	c0069d8	2011-08-23 21:02:32 +0000	[diff] [blame]	597	SourceManager &SM = PP.getSourceManager();
Abramo Bagnara	a08529c	2011-10-03 18:39:03 +0000	[diff] [blame]	598	if (StartLoc.isFileID())
				599	StartLoc = getExpansionLocForMacroDefLoc(StartLoc);
				600	if (EndLoc.isFileID())
				601	EndLoc = getExpansionLocForMacroDefLoc(EndLoc);
				602	Tok.setLocation(SM.createExpansionLoc(Tok.getLocation(), StartLoc, EndLoc,
Argyrios Kyrtzidis	c0069d8	2011-08-23 21:02:32 +0000	[diff] [blame]	603	Tok.getLength()));
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	604
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	605	// Now that we got the result token, it will be subject to expansion. Since
				606	// token pasting re-lexes the result token in raw mode, identifier information
				607	// isn't looked up. As such, if the result is an identifier, look up id info.
Abramo Bagnara	c4bf2b9	2010-12-22 08:23:18 +0000	[diff] [blame]	608	if (Tok.is(tok::raw_identifier)) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	609	// Look up the identifier info for the token. We disabled identifier lookup
				610	// by saying we're skipping contents, so we need to do this manually.
Abramo Bagnara	c4bf2b9	2010-12-22 08:23:18 +0000	[diff] [blame]	611	PP.LookUpIdentifierInfo(Tok);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	612	}
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	613	return false;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	614	}
				615
				616	/// isNextTokenLParen - If the next token lexed will pop this macro off the
				617	/// expansion stack, return 2. If the next unexpanded token is a '(', return
				618	/// 1, otherwise return 0.
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	619	unsigned TokenLexer::isNextTokenLParen() const {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	620	// Out of tokens?
				621	if (isAtEnd())
				622	return 2;
Chris Lattner	8d89643	2008-03-09 02:07:49 +0000	[diff] [blame]	623	return Tokens[CurToken].is(tok::l_paren);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	624	}
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	625
Peter Collingbourne	b2eb53d	2011-02-22 13:49:00 +0000	[diff] [blame]	626	/// isParsingPreprocessorDirective - Return true if we are in the middle of a
				627	/// preprocessor directive.
				628	bool TokenLexer::isParsingPreprocessorDirective() const {
Peter Collingbourne	8402155	2011-02-28 02:37:51 +0000	[diff] [blame]	629	return Tokens[NumTokens-1].is(tok::eod) && !isAtEnd();
Peter Collingbourne	b2eb53d	2011-02-22 13:49:00 +0000	[diff] [blame]	630	}
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	631
				632	/// HandleMicrosoftCommentPaste - In microsoft compatibility mode, /##/ pastes
				633	/// together to form a comment that comments out everything in the current
				634	/// macro, other active macros, and anything left on the current physical
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	635	/// source line of the expanded buffer. Handle this by returning the
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	636	/// first token on the next line.
Chris Lattner	1543e9c	2008-03-09 02:18:51 +0000	[diff] [blame]	637	void TokenLexer::HandleMicrosoftCommentPaste(Token &Tok) {
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	638	// We 'comment out' the rest of this macro by just ignoring the rest of the
				639	// tokens that have not been lexed yet, if any.
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	640
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	641	// Since this must be a macro, mark the macro enabled now that it is no longer
				642	// being expanded.
				643	assert(Macro && "Token streams can't paste comments");
				644	Macro->EnableMacro();
Mike Stump	1eb4433	2009-09-09 15:08:12 +0000	[diff] [blame]	645
Chris Lattner	3f1cc83	2008-02-07 06:03:59 +0000	[diff] [blame]	646	PP.HandleMicrosoftCommentPaste(Tok);
				647	}
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	648
Argyrios Kyrtzidis	ec3b538	2011-08-19 22:34:14 +0000	[diff] [blame]	649	/// \brief If \arg loc is a file ID and points inside the current macro
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	650	/// definition, returns the appropriate source location pointing at the
Argyrios Kyrtzidis	ec3b538	2011-08-19 22:34:14 +0000	[diff] [blame]	651	/// macro expansion source location entry, otherwise it returns an invalid
				652	/// SourceLocation.
				653	SourceLocation
				654	TokenLexer::getExpansionLocForMacroDefLoc(SourceLocation loc) const {
Chandler Carruth	d0f5e44	2011-07-14 08:20:34 +0000	[diff] [blame]	655	assert(ExpandLocStart.isValid() && MacroExpansionStart.isValid() &&
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	656	"Not appropriate for token streams");
Argyrios Kyrtzidis	c0069d8	2011-08-23 21:02:32 +0000	[diff] [blame]	657	assert(loc.isValid() && loc.isFileID());
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	658
				659	SourceManager &SM = PP.getSourceManager();
Argyrios Kyrtzidis	499ea55	2011-08-23 21:02:38 +0000	[diff] [blame]	660	assert(SM.isInSLocAddrSpace(loc, MacroDefStart, MacroDefLength) &&
				661	"Expected loc to come from the macro definition");
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	662
Argyrios Kyrtzidis	499ea55	2011-08-23 21:02:38 +0000	[diff] [blame]	663	unsigned relativeOffset = 0;
				664	SM.isInSLocAddrSpace(loc, MacroDefStart, MacroDefLength, &relativeOffset);
Argyrios Kyrtzidis	a64ccef	2011-09-19 20:40:19 +0000	[diff] [blame]	665	return MacroExpansionStart.getLocWithOffset(relativeOffset);
Argyrios Kyrtzidis	b73377e	2011-07-07 03:40:34 +0000	[diff] [blame]	666	}
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	667
				668	/// \brief Finds the tokens that are consecutive (from the same FileID)
				669	/// creates a single SLocEntry, and assigns SourceLocations to each token that
				670	/// point to that SLocEntry. e.g for
				671	/// assert(foo == bar);
				672	/// There will be a single SLocEntry for the "foo == bar" chunk and locations
				673	/// for the 'foo', '==', 'bar' tokens will point inside that chunk.
				674	///
				675	/// \arg begin_tokens will be updated to a position past all the found
				676	/// consecutive tokens.
				677	static void updateConsecutiveMacroArgTokens(SourceManager &SM,
				678	SourceLocation InstLoc,
				679	Token *&begin_tokens,
				680	Token * end_tokens) {
				681	assert(begin_tokens < end_tokens);
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	682
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	683	SourceLocation FirstLoc = begin_tokens->getLocation();
				684	SourceLocation CurLoc = FirstLoc;
				685
				686	// Compare the source location offset of tokens and group together tokens that
				687	// are close, even if their locations point to different FileIDs. e.g.
				688	//
				689	// \|bar \| foo \| cake \| (3 tokens from 3 consecutive FileIDs)
				690	// ^ ^
				691	// \|bar foo cake\| (one SLocEntry chunk for all tokens)
				692	//
				693	// we can perform this "merge" since the token's spelling location depends
				694	// on the relative offset.
				695
				696	Token *NextTok = begin_tokens + 1;
				697	for (; NextTok < end_tokens; ++NextTok) {
				698	int RelOffs;
				699	if (!SM.isInSameSLocAddrSpace(CurLoc, NextTok->getLocation(), &RelOffs))
				700	break; // Token from different local/loaded location.
				701	// Check that token is not before the previous token or more than 50
				702	// "characters" away.
				703	if (RelOffs < 0 \|\| RelOffs > 50)
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	704	break;
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	705	CurLoc = NextTok->getLocation();
				706	}
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	707
				708	// For the consecutive tokens, find the length of the SLocEntry to contain
				709	// all of them.
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	710	Token &LastConsecutiveTok = *(NextTok-1);
Argyrios Kyrtzidis	c4b5582	2011-08-24 20:33:05 +0000	[diff] [blame]	711	int LastRelOffs = 0;
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	712	SM.isInSameSLocAddrSpace(FirstLoc, LastConsecutiveTok.getLocation(),
				713	&LastRelOffs);
				714	unsigned FullLength = LastRelOffs + LastConsecutiveTok.getLength();
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	715
				716	// Create a macro expansion SLocEntry that will "contain" all of the tokens.
				717	SourceLocation Expansion =
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	718	SM.createMacroArgExpansionLoc(FirstLoc, InstLoc,FullLength);
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	719
				720	// Change the location of the tokens from the spelling location to the new
				721	// expanded location.
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	722	for (; begin_tokens < NextTok; ++begin_tokens) {
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	723	Token &Tok = *begin_tokens;
Argyrios Kyrtzidis	c4b5582	2011-08-24 20:33:05 +0000	[diff] [blame]	724	int RelOffs = 0;
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	725	SM.isInSameSLocAddrSpace(FirstLoc, Tok.getLocation(), &RelOffs);
Argyrios Kyrtzidis	a64ccef	2011-09-19 20:40:19 +0000	[diff] [blame]	726	Tok.setLocation(Expansion.getLocWithOffset(RelOffs));
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	727	}
				728	}
				729
				730	/// \brief Creates SLocEntries and updates the locations of macro argument
				731	/// tokens to their new expanded locations.
				732	///
				733	/// \param ArgIdDefLoc the location of the macro argument id inside the macro
				734	/// definition.
				735	/// \param Tokens the macro argument tokens to update.
				736	void TokenLexer::updateLocForMacroArgTokens(SourceLocation ArgIdSpellLoc,
				737	Token *begin_tokens,
				738	Token *end_tokens) {
				739	SourceManager &SM = PP.getSourceManager();
				740
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	741	SourceLocation InstLoc =
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	742	getExpansionLocForMacroDefLoc(ArgIdSpellLoc);
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	743
Argyrios Kyrtzidis	b6c465e	2011-08-23 21:02:41 +0000	[diff] [blame]	744	while (begin_tokens < end_tokens) {
				745	// If there's only one token just create a SLocEntry for it.
				746	if (end_tokens - begin_tokens == 1) {
				747	Token &Tok = *begin_tokens;
				748	Tok.setLocation(SM.createMacroArgExpansionLoc(Tok.getLocation(),
				749	InstLoc,
				750	Tok.getLength()));
				751	return;
				752	}
				753
				754	updateConsecutiveMacroArgTokens(SM, InstLoc, begin_tokens, end_tokens);
				755	}
Argyrios Kyrtzidis	d60a34a	2011-08-19 22:34:17 +0000	[diff] [blame]	756	}