Blame - lib/Lex/PPLexerChange.cpp - platform/external/clang

blob: 0b26ccbecbab7812f47ff3f9130f03634dcd56af [file] [log] [blame]

Shih-wei Liao	f8fd82b	2010-02-10 11:10:31 -0800	[diff] [blame^]	1	//===--- PPLexerChange.cpp - Handle changing lexers in the preprocessor ---===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	// This file implements pieces of the Preprocessor interface that manage the
				11	// current lexer stack.
				12	//
				13	//===----------------------------------------------------------------------===//
				14
				15	#include "clang/Lex/Preprocessor.h"
				16	#include "clang/Lex/HeaderSearch.h"
				17	#include "clang/Lex/MacroInfo.h"
				18	#include "clang/Lex/LexDiagnostic.h"
				19	#include "clang/Basic/SourceManager.h"
				20	#include "llvm/Support/MemoryBuffer.h"
				21	using namespace clang;
				22
				// Out-of-line definition of the PPCallbacks destructor; the body is empty.
				// NOTE(review): presumably defined here so the class has a home translation
				// unit -- confirm against the class declaration.
				23	PPCallbacks::~PPCallbacks() {}
				24
				25	//===----------------------------------------------------------------------===//
				26	// Miscellaneous Methods.
				27	//===----------------------------------------------------------------------===//
				28
				29	/// isInPrimaryFile - Return true if we're in the top-level file, not in a
				30	/// #include. This looks through macro expansions and active _Pragma lexers.
				31	bool Preprocessor::isInPrimaryFile() const {
				32	if (IsFileLexer())
				33	return IncludeMacroStack.empty();
				34
				35	// If there are any stacked lexers, we're in a #include.
				36	assert(IsFileLexer(IncludeMacroStack[0]) &&
				37	"Top level include stack isn't our primary lexer?");
				38	for (unsigned i = 1, e = IncludeMacroStack.size(); i != e; ++i)
				39	if (IsFileLexer(IncludeMacroStack[i]))
				40	return false;
				41	return true;
				42	}
				43
				44	/// getCurrentLexer - Return the current file lexer being lexed from. Note
				45	/// that this ignores any potentially active macro expansions and _Pragma
				46	/// expansions going on at the time.
				47	PreprocessorLexer *Preprocessor::getCurrentFileLexer() const {
				48	if (IsFileLexer())
				49	return CurPPLexer;
				50
				51	// Look for a stacked lexer.
				52	for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
				53	const IncludeStackInfo& ISI = IncludeMacroStack[i-1];
				54	if (IsFileLexer(ISI))
				55	return ISI.ThePPLexer;
				56	}
				57	return 0;
				58	}
				59
				60
				61	//===----------------------------------------------------------------------===//
				62	// Methods for Entering and Callbacks for leaving various contexts
				63	//===----------------------------------------------------------------------===//
				64
				65	/// EnterSourceFile - Add a source file to the top of the include stack and
				66	/// start lexing tokens from it instead of the current buffer.
				67	bool Preprocessor::EnterSourceFile(FileID FID, const DirectoryLookup *CurDir,
				68	std::string &ErrorStr) {
				69	assert(CurTokenLexer == 0 && "Cannot #include a file inside a macro!");
				70	++NumEnteredSourceFiles;
				71
				72	if (MaxIncludeStackDepth < IncludeMacroStack.size())
				73	MaxIncludeStackDepth = IncludeMacroStack.size();
				74
				75	if (PTH) {
				76	if (PTHLexer *PL = PTH->CreateLexer(FID)) {
				77	EnterSourceFileWithPTH(PL, CurDir);
				78	return false;
				79	}
				80	}
				81
				82	// Get the MemoryBuffer for this FID, if it fails, we fail.
				83	const llvm::MemoryBuffer *InputFile =
				84	getSourceManager().getBuffer(FID, &ErrorStr);
				85	if (!ErrorStr.empty())
				86	return true;
				87
				88	EnterSourceFileWithLexer(new Lexer(FID, InputFile, *this), CurDir);
				89	return false;
				90	}
				91
				92	/// EnterSourceFileWithLexer - Add a source file to the top of the include stack
				93	/// and start lexing tokens from it instead of the current buffer.
				94	void Preprocessor::EnterSourceFileWithLexer(Lexer *TheLexer,
				95	const DirectoryLookup *CurDir) {
				96
				97	// Add the current lexer to the include stack.
				98	if (CurPPLexer \|\| CurTokenLexer)
				99	PushIncludeMacroStack();
				100
				101	CurLexer.reset(TheLexer);
				102	CurPPLexer = TheLexer;
				103	CurDirLookup = CurDir;
				104
				105	// Notify the client, if desired, that we are in a new source file.
				106	if (Callbacks && !CurLexer->Is_PragmaLexer) {
				107	SrcMgr::CharacteristicKind FileType =
				108	SourceMgr.getFileCharacteristic(CurLexer->getFileLoc());
				109
				110	Callbacks->FileChanged(CurLexer->getFileLoc(),
				111	PPCallbacks::EnterFile, FileType);
				112	}
				113	}
				114
				115	/// EnterSourceFileWithPTH - Add a source file to the top of the include stack
				116	/// and start getting tokens from it using the PTH cache.
				117	void Preprocessor::EnterSourceFileWithPTH(PTHLexer *PL,
				118	const DirectoryLookup *CurDir) {
				119
				120	if (CurPPLexer \|\| CurTokenLexer)
				121	PushIncludeMacroStack();
				122
				123	CurDirLookup = CurDir;
				124	CurPTHLexer.reset(PL);
				125	CurPPLexer = CurPTHLexer.get();
				126
				127	// Notify the client, if desired, that we are in a new source file.
				128	if (Callbacks) {
				129	FileID FID = CurPPLexer->getFileID();
				130	SourceLocation EnterLoc = SourceMgr.getLocForStartOfFile(FID);
				131	SrcMgr::CharacteristicKind FileType =
				132	SourceMgr.getFileCharacteristic(EnterLoc);
				133	Callbacks->FileChanged(EnterLoc, PPCallbacks::EnterFile, FileType);
				134	}
				135	}
				136
				137	/// EnterMacro - Add a Macro to the top of the include stack and start lexing
				138	/// tokens from it instead of the current buffer.
				139	void Preprocessor::EnterMacro(Token &Tok, SourceLocation ILEnd,
				140	MacroArgs *Args) {
				141	PushIncludeMacroStack();
				142	CurDirLookup = 0;
				143
				144	if (NumCachedTokenLexers == 0) {
				145	CurTokenLexer.reset(new TokenLexer(Tok, ILEnd, Args, *this));
				146	} else {
				147	CurTokenLexer.reset(TokenLexerCache[--NumCachedTokenLexers]);
				148	CurTokenLexer->Init(Tok, ILEnd, Args);
				149	}
				150	}
				151
				152	/// EnterTokenStream - Add a "macro" context to the top of the include stack,
				153	/// which will cause the lexer to start returning the specified tokens.
				154	///
				155	/// If DisableMacroExpansion is true, tokens lexed from the token stream will
				156	/// not be subject to further macro expansion. Otherwise, these tokens will
				157	/// be re-macro-expanded when/if expansion is enabled.
				158	///
				159	/// If OwnsTokens is false, this method assumes that the specified stream of
				160	/// tokens has a permanent owner somewhere, so they do not need to be copied.
				161	/// If it is true, it assumes the array of tokens is allocated with new[] and
				162	/// must be freed.
				163	///
				164	void Preprocessor::EnterTokenStream(const Token *Toks, unsigned NumToks,
				165	bool DisableMacroExpansion,
				166	bool OwnsTokens) {
				167	// Save our current state.
				168	PushIncludeMacroStack();
				169	CurDirLookup = 0;
				170
				171	// Create a macro expander to expand from the specified token stream.
				172	if (NumCachedTokenLexers == 0) {
				173	CurTokenLexer.reset(new TokenLexer(Toks, NumToks, DisableMacroExpansion,
				174	OwnsTokens, *this));
				175	} else {
				176	CurTokenLexer.reset(TokenLexerCache[--NumCachedTokenLexers]);
				177	CurTokenLexer->Init(Toks, NumToks, DisableMacroExpansion, OwnsTokens);
				178	}
				179	}
				180
				181	/// HandleEndOfFile - This callback is invoked when the lexer hits the end of
				182	/// the current file. This either returns the EOF token or pops a level off
				183	/// the include stack and keeps going.
				184	bool Preprocessor::HandleEndOfFile(Token &Result, bool isEndOfMacro) {
				185	assert(!CurTokenLexer &&
				186	"Ending a file when currently in a macro!");
				187
				188	// See if this file had a controlling macro.
				189	if (CurPPLexer) { // Not ending a macro, ignore it.
				190	if (const IdentifierInfo *ControllingMacro =
				191	CurPPLexer->MIOpt.GetControllingMacroAtEndOfFile()) {
				192	// Okay, this has a controlling macro, remember in HeaderFileInfo.
				193	if (const FileEntry *FE =
				194	SourceMgr.getFileEntryForID(CurPPLexer->getFileID()))
				195	HeaderInfo.SetFileControllingMacro(FE, ControllingMacro);
				196	}
				197	}
				198
				199	// If this is a #include'd file, pop it off the include stack and continue
				200	// lexing the #includer file.
				201	if (!IncludeMacroStack.empty()) {
				202	// We're done with the #included file.
				203	RemoveTopOfLexerStack();
				204
				205	// Notify the client, if desired, that we are in a new source file.
				206	if (Callbacks && !isEndOfMacro && CurPPLexer) {
				207	SrcMgr::CharacteristicKind FileType =
				208	SourceMgr.getFileCharacteristic(CurPPLexer->getSourceLocation());
				209	Callbacks->FileChanged(CurPPLexer->getSourceLocation(),
				210	PPCallbacks::ExitFile, FileType);
				211	}
				212
				213	// Client should lex another token.
				214	return false;
				215	}
				216
				217	// If the file ends with a newline, form the EOF token on the newline itself,
				218	// rather than "on the line following it", which doesn't exist. This makes
				219	// diagnostics relating to the end of file include the last file that the user
				220	// actually typed, which is goodness.
				221	if (CurLexer) {
				222	const char *EndPos = CurLexer->BufferEnd;
				223	if (EndPos != CurLexer->BufferStart &&
				224	(EndPos[-1] == '\n' \|\| EndPos[-1] == '\r')) {
				225	--EndPos;
				226
				227	// Handle \n\r and \r\n:
				228	if (EndPos != CurLexer->BufferStart &&
				229	(EndPos[-1] == '\n' \|\| EndPos[-1] == '\r') &&
				230	EndPos[-1] != EndPos[0])
				231	--EndPos;
				232	}
				233
				234	Result.startToken();
				235	CurLexer->BufferPtr = EndPos;
				236	CurLexer->FormTokenWithChars(Result, EndPos, tok::eof);
				237
				238	// We're done with the #included file.
				239	CurLexer.reset();
				240	} else {
				241	assert(CurPTHLexer && "Got EOF but no current lexer set!");
				242	CurPTHLexer->getEOF(Result);
				243	CurPTHLexer.reset();
				244	}
				245
				246	CurPPLexer = 0;
				247
				248	// This is the end of the top-level file. If the diag::pp_macro_not_used
				249	// diagnostic is enabled, look for macros that have not been used.
				250	if (getDiagnostics().getDiagnosticLevel(diag::pp_macro_not_used) !=
				251	Diagnostic::Ignored) {
				252	for (macro_iterator I = macro_begin(false), E = macro_end(false);
				253	I != E; ++I)
				254	if (!I->second->isUsed())
				255	Diag(I->second->getDefinitionLoc(), diag::pp_macro_not_used);
				256	}
				257	return true;
				258	}
				259
				260	/// HandleEndOfTokenLexer - This callback is invoked when the current TokenLexer
				261	/// hits the end of its token stream.
				262	bool Preprocessor::HandleEndOfTokenLexer(Token &Result) {
				263	assert(CurTokenLexer && !CurPPLexer &&
				264	"Ending a macro when currently in a #include file!");
				265
				266	// Delete or cache the now-dead macro expander.
				267	if (NumCachedTokenLexers == TokenLexerCacheSize)
				268	CurTokenLexer.reset();
				269	else
				270	TokenLexerCache[NumCachedTokenLexers++] = CurTokenLexer.take();
				271
				272	// Handle this like a #include file being popped off the stack.
				273	return HandleEndOfFile(Result, true);
				274	}
				275
				276	/// RemoveTopOfLexerStack - Pop the current lexer/macro exp off the top of the
				277	/// lexer stack. This should only be used in situations where the current
				278	/// state of the top-of-stack lexer is unknown.
				279	void Preprocessor::RemoveTopOfLexerStack() {
				280	assert(!IncludeMacroStack.empty() && "Ran out of stack entries to load");
				281
				282	if (CurTokenLexer) {
				283	// Delete or cache the now-dead macro expander.
				284	if (NumCachedTokenLexers == TokenLexerCacheSize)
				285	CurTokenLexer.reset();
				286	else
				287	TokenLexerCache[NumCachedTokenLexers++] = CurTokenLexer.take();
				288	}
				289
				290	PopIncludeMacroStack();
				291	}
				292
				293	/// HandleMicrosoftCommentPaste - When the macro expander pastes together a
				294	/// comment (/##/) in microsoft mode, this method handles updating the current
				295	/// state, returning the token on the next source line.
				296	void Preprocessor::HandleMicrosoftCommentPaste(Token &Tok) {
				297	assert(CurTokenLexer && !CurPPLexer &&
				298	"Pasted comment can only be formed from macro");
				299
				300	// We handle this by scanning for the closest real lexer, switching it to
				301	// raw mode and preprocessor mode. This will cause it to return \n as an
				302	// explicit EOM token.
				303	PreprocessorLexer *FoundLexer = 0;
				304	bool LexerWasInPPMode = false;
				305	for (unsigned i = 0, e = IncludeMacroStack.size(); i != e; ++i) {
				306	IncludeStackInfo &ISI = *(IncludeMacroStack.end()-i-1);
				307	if (ISI.ThePPLexer == 0) continue; // Scan for a real lexer.
				308
				309	// Once we find a real lexer, mark it as raw mode (disabling macro
				310	// expansions) and preprocessor mode (return EOM). We know that the lexer
				311	// was not in raw mode before, because the macro that the comment came
				312	// from was expanded. However, it could have already been in preprocessor
				313	// mode (#if COMMENT) in which case we have to return it to that mode and
				314	// return EOM.
				315	FoundLexer = ISI.ThePPLexer;
				316	FoundLexer->LexingRawMode = true;
				317	LexerWasInPPMode = FoundLexer->ParsingPreprocessorDirective;
				318	FoundLexer->ParsingPreprocessorDirective = true;
				319	break;
				320	}
				321
				322	// Okay, we either found and switched over the lexer, or we didn't find a
				323	// lexer. In either case, finish off the macro the comment came from, getting
				324	// the next token.
				325	if (!HandleEndOfTokenLexer(Tok)) Lex(Tok);
				326
				327	// Discarding comments as long as we don't have EOF or EOM. This 'comments
				328	// out' the rest of the line, including any tokens that came from other macros
				329	// that were active, as in:
				330	// #define submacro a COMMENT b
				331	// submacro c
				332	// which should lex to 'a' only: 'b' and 'c' should be removed.
				333	while (Tok.isNot(tok::eom) && Tok.isNot(tok::eof))
				334	Lex(Tok);
				335
				336	// If we got an eom token, then we successfully found the end of the line.
				337	if (Tok.is(tok::eom)) {
				338	assert(FoundLexer && "Can't get end of line without an active lexer");
				339	// Restore the lexer back to normal mode instead of raw mode.
				340	FoundLexer->LexingRawMode = false;
				341
				342	// If the lexer was already in preprocessor mode, just return the EOM token
				343	// to finish the preprocessor line.
				344	if (LexerWasInPPMode) return;
				345
				346	// Otherwise, switch out of PP mode and return the next lexed token.
				347	FoundLexer->ParsingPreprocessorDirective = false;
				348	return Lex(Tok);
				349	}
				350
				351	// If we got an EOF token, then we reached the end of the token stream but
				352	// didn't find an explicit \n. This can only happen if there was no lexer
				353	// active (an active lexer would return EOM at EOF if there was no \n in
				354	// preprocessor directive mode), so just return EOF as our token.
				355	assert(!FoundLexer && "Lexer should return EOM before EOF in PP mode");
				356	}