Blame - Driver/PrintPreprocessedOutput.cpp - platform/external/clang

blob: d1f1cef9855fdbbc156c967b53f7c38abc04369b [file] [log] [blame]

Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	1	//===--- PrintPreprocessedOutput.cpp - Implement the -E mode --------------===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file was developed by Chris Lattner and is distributed under
				6	// the University of Illinois Open Source License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	// This code simply runs the preprocessor on the input file and prints out the
				11	// result. This is the traditional behavior of the -E option.
				12	//
				13	//===----------------------------------------------------------------------===//
				14
				15	#include "clang.h"
				16	#include "clang/Lex/PPCallbacks.h"
				17	#include "clang/Lex/Preprocessor.h"
				18	#include "clang/Lex/Pragma.h"
				19	#include "clang/Basic/SourceManager.h"
				20	#include "llvm/Support/CommandLine.h"
				21	#include "llvm/ADT/StringExtras.h"
				22	#include "llvm/Config/config.h"
				23	#include <cstdio>
				24	using namespace clang;
				25
				26	//===----------------------------------------------------------------------===//
				27	// Simple buffered I/O
				28	//===----------------------------------------------------------------------===//
				29	//
				30	// Empirically, iostream is over 30% slower than stdio for this workload, and
				31	// stdio itself isn't very well suited. The problem with stdio is use of
				32	// putchar_unlocked. We have many newline characters that need to be emitted,
				33	// but stdio needs to do extra checks to handle line buffering mode. These
				34	// extra checks make putchar_unlocked fall off its inlined code path, hitting
				35	// slow system code. In practice, using 'write' directly makes 'clang -E -P'
				36	// about 10% faster than using the stdio path on darwin.
				37
				38	#ifdef HAVE_UNISTD_H
				39	#include <unistd.h>
				40	#else
				41	#define USE_STDIO 1
				42	#endif
				43
				44	static char OutBufStart = 0, OutBufEnd, *OutBufCur;
				45
				46	/// InitOutputBuffer - Initialize our output buffer.
				47	///
				48	static void InitOutputBuffer() {
				49	#ifndef USE_STDIO
				50	OutBufStart = new char[64*1024];
				51	OutBufEnd = OutBufStart+64*1024;
				52	OutBufCur = OutBufStart;
				53	#endif
				54	}
				55
				56	/// FlushBuffer - Write the accumulated bytes to the output stream.
				57	///
				58	static void FlushBuffer() {
				59	#ifndef USE_STDIO
				60	write(STDOUT_FILENO, OutBufStart, OutBufCur-OutBufStart);
				61	OutBufCur = OutBufStart;
				62	#endif
				63	}
				64
				65	/// CleanupOutputBuffer - Finish up output.
				66	///
				67	static void CleanupOutputBuffer() {
				68	#ifndef USE_STDIO
				69	FlushBuffer();
				70	delete [] OutBufStart;
				71	#endif
				72	}
				73
				74	static void OutputChar(char c) {
				75	#ifdef USE_STDIO
				76	putchar_unlocked(c);
				77	#else
				78	if (OutBufCur >= OutBufEnd)
				79	FlushBuffer();
				80	*OutBufCur++ = c;
				81	#endif
				82	}
				83
				84	static void OutputString(const char *Ptr, unsigned Size) {
				85	#ifdef USE_STDIO
				86	fwrite(Ptr, Size, 1, stdout);
				87	#else
				88	if (OutBufCur+Size >= OutBufEnd)
				89	FlushBuffer();
				90	memcpy(OutBufCur, Ptr, Size);
				91	OutBufCur += Size;
				92	#endif
				93	}
				94
				95
				96	//===----------------------------------------------------------------------===//
				97	// Preprocessed token printer
				98	//===----------------------------------------------------------------------===//
				99
				100	static llvm::cl::opt<bool>
				101	DisableLineMarkers("P", llvm::cl::desc("Disable linemarker output in -E mode"));
				102	static llvm::cl::opt<bool>
				103	EnableCommentOutput("C", llvm::cl::desc("Enable comment output in -E mode"));
				104	static llvm::cl::opt<bool>
				105	EnableMacroCommentOutput("CC",
				106	llvm::cl::desc("Enable comment output in -E mode, "
				107	"even from macro expansions"));
				108
				109	namespace {
				110	class PrintPPOutputPPCallbacks : public PPCallbacks {
				111	Preprocessor &PP;
				112	unsigned CurLine;
				113	std::string CurFilename;
				114	bool EmittedTokensOnThisLine;
				115	DirectoryLookup::DirType FileType;
				116	public:
				117	PrintPPOutputPPCallbacks(Preprocessor &pp) : PP(pp) {
				118	CurLine = 0;
Chris Lattner	0cbc4b5	2007-07-22 06:38:50 +0000	[diff] [blame]	119	CurFilename = "<uninit>";
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	120	EmittedTokensOnThisLine = false;
				121	FileType = DirectoryLookup::NormalHeaderDir;
				122	}
				123
				124	void SetEmittedTokensOnThisLine() { EmittedTokensOnThisLine = true; }
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	125	bool hasEmittedTokensOnThisLine() const { return EmittedTokensOnThisLine; }
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	126
				127	virtual void FileChanged(SourceLocation Loc, FileChangeReason Reason,
				128	DirectoryLookup::DirType FileType);
				129	virtual void Ident(SourceLocation Loc, const std::string &str);
				130
				131
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	132	void HandleFirstTokOnLine(Token &Tok);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	133	void MoveToLine(SourceLocation Loc);
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	134	bool AvoidConcat(const Token &PrevTok, const Token &Tok);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	135	};
				136	}
				137
				138	/// MoveToLine - Move the output to the source line specified by the location
				139	/// object. We can do this by emitting some number of \n's, or be emitting a
				140	/// #line directive.
				141	void PrintPPOutputPPCallbacks::MoveToLine(SourceLocation Loc) {
				142	if (DisableLineMarkers) {
				143	if (EmittedTokensOnThisLine) {
				144	OutputChar('\n');
				145	EmittedTokensOnThisLine = false;
				146	}
				147	return;
				148	}
				149
Chris Lattner	9dc1f53	2007-07-20 16:37:10 +0000	[diff] [blame]	150	unsigned LineNo = PP.getSourceManager().getLogicalLineNumber(Loc);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	151
				152	// If this line is "close enough" to the original line, just print newlines,
				153	// otherwise print a #line directive.
				154	if (LineNo-CurLine < 8) {
Chris Lattner	822f940	2007-07-23 05:14:05 +0000	[diff] [blame]	155	if (LineNo-CurLine == 1)
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	156	OutputChar('\n');
Chris Lattner	822f940	2007-07-23 05:14:05 +0000	[diff] [blame]	157	else {
				158	const char *NewLines = "\n\n\n\n\n\n\n\n";
				159	OutputString(NewLines, LineNo-CurLine);
				160	CurLine = LineNo;
				161	}
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	162	} else {
				163	if (EmittedTokensOnThisLine) {
				164	OutputChar('\n');
				165	EmittedTokensOnThisLine = false;
				166	}
				167
				168	CurLine = LineNo;
				169
				170	OutputChar('#');
				171	OutputChar(' ');
				172	std::string Num = llvm::utostr_32(LineNo);
				173	OutputString(&Num[0], Num.size());
				174	OutputChar(' ');
Chris Lattner	0cbc4b5	2007-07-22 06:38:50 +0000	[diff] [blame]	175	OutputChar('"');
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	176	OutputString(&CurFilename[0], CurFilename.size());
Chris Lattner	0cbc4b5	2007-07-22 06:38:50 +0000	[diff] [blame]	177	OutputChar('"');
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	178
				179	if (FileType == DirectoryLookup::SystemHeaderDir)
				180	OutputString(" 3", 2);
				181	else if (FileType == DirectoryLookup::ExternCSystemHeaderDir)
				182	OutputString(" 3 4", 4);
				183	OutputChar('\n');
				184	}
				185	}
				186
				187
				188	/// FileChanged - Whenever the preprocessor enters or exits a #include file
				189	/// it invokes this handler. Update our conception of the current source
				190	/// position.
				191	void PrintPPOutputPPCallbacks::FileChanged(SourceLocation Loc,
				192	FileChangeReason Reason,
				193	DirectoryLookup::DirType FileType) {
				194	if (DisableLineMarkers) return;
				195
				196	// Unless we are exiting a #include, make sure to skip ahead to the line the
				197	// #include directive was at.
				198	SourceManager &SourceMgr = PP.getSourceManager();
				199	if (Reason == PPCallbacks::EnterFile) {
Chris Lattner	9dc1f53	2007-07-20 16:37:10 +0000	[diff] [blame]	200	MoveToLine(SourceMgr.getIncludeLoc(Loc));
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	201	} else if (Reason == PPCallbacks::SystemHeaderPragma) {
				202	MoveToLine(Loc);
				203
				204	// TODO GCC emits the # directive for this directive on the line AFTER the
				205	// directive and emits a bunch of spaces that aren't needed. Emulate this
				206	// strange behavior.
				207	}
				208
Chris Lattner	9dc1f53	2007-07-20 16:37:10 +0000	[diff] [blame]	209	Loc = SourceMgr.getLogicalLoc(Loc);
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	210	CurLine = SourceMgr.getLineNumber(Loc);
Chris Lattner	0cbc4b5	2007-07-22 06:38:50 +0000	[diff] [blame]	211	CurFilename = Lexer::Stringify(SourceMgr.getSourceName(Loc));
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	212	FileType = FileType;
				213
				214	if (EmittedTokensOnThisLine) {
				215	OutputChar('\n');
				216	EmittedTokensOnThisLine = false;
				217	}
				218
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	219	OutputChar('#');
				220	OutputChar(' ');
				221	std::string Num = llvm::utostr_32(CurLine);
				222	OutputString(&Num[0], Num.size());
				223	OutputChar(' ');
Chris Lattner	0cbc4b5	2007-07-22 06:38:50 +0000	[diff] [blame]	224	OutputChar('"');
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	225	OutputString(&CurFilename[0], CurFilename.size());
Chris Lattner	0cbc4b5	2007-07-22 06:38:50 +0000	[diff] [blame]	226	OutputChar('"');
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	227
				228	switch (Reason) {
				229	case PPCallbacks::EnterFile:
				230	OutputString(" 1", 2);
				231	break;
				232	case PPCallbacks::ExitFile:
				233	OutputString(" 2", 2);
				234	break;
				235	case PPCallbacks::SystemHeaderPragma: break;
				236	case PPCallbacks::RenameFile: break;
				237	}
				238
				239	if (FileType == DirectoryLookup::SystemHeaderDir)
				240	OutputString(" 3", 2);
				241	else if (FileType == DirectoryLookup::ExternCSystemHeaderDir)
				242	OutputString(" 3 4", 4);
				243
				244	OutputChar('\n');
				245	}
				246
				247	/// HandleIdent - Handle #ident directives when read by the preprocessor.
				248	///
				249	void PrintPPOutputPPCallbacks::Ident(SourceLocation Loc, const std::string &S) {
				250	MoveToLine(Loc);
				251
				252	OutputString("#ident ", strlen("#ident "));
				253	OutputString(&S[0], S.size());
				254	EmittedTokensOnThisLine = true;
				255	}
				256
				257	/// HandleFirstTokOnLine - When emitting a preprocessed file in -E mode, this
				258	/// is called for the first token on each new line.
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	259	void PrintPPOutputPPCallbacks::HandleFirstTokOnLine(Token &Tok) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	260	// Figure out what line we went to and insert the appropriate number of
				261	// newline characters.
				262	MoveToLine(Tok.getLocation());
				263
				264	// Print out space characters so that the first token on a line is
				265	// indented for easy reading.
Chris Lattner	9dc1f53	2007-07-20 16:37:10 +0000	[diff] [blame]	266	const SourceManager &SourceMgr = PP.getSourceManager();
				267	unsigned ColNo = SourceMgr.getLogicalColumnNumber(Tok.getLocation());
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	268
				269	// This hack prevents stuff like:
				270	// #define HASH #
				271	// HASH define foo bar
				272	// From having the # character end up at column 1, which makes it so it
				273	// is not handled as a #define next time through the preprocessor if in
				274	// -fpreprocessed mode.
				275	if (ColNo <= 1 && Tok.getKind() == tok::hash)
				276	OutputChar(' ');
				277
				278	// Otherwise, indent the appropriate number of spaces.
				279	for (; ColNo > 1; --ColNo)
				280	OutputChar(' ');
				281	}
				282
				283	namespace {
				284	struct UnknownPragmaHandler : public PragmaHandler {
				285	const char *Prefix;
				286	PrintPPOutputPPCallbacks *Callbacks;
				287
				288	UnknownPragmaHandler(const char prefix, PrintPPOutputPPCallbacks callbacks)
				289	: PragmaHandler(0), Prefix(prefix), Callbacks(callbacks) {}
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	290	virtual void HandlePragma(Preprocessor &PP, Token &PragmaTok) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	291	// Figure out what line we went to and insert the appropriate number of
				292	// newline characters.
				293	Callbacks->MoveToLine(PragmaTok.getLocation());
				294	OutputString(Prefix, strlen(Prefix));
				295
				296	// Read and print all of the pragma tokens.
				297	while (PragmaTok.getKind() != tok::eom) {
				298	if (PragmaTok.hasLeadingSpace())
				299	OutputChar(' ');
				300	std::string TokSpell = PP.getSpelling(PragmaTok);
				301	OutputString(&TokSpell[0], TokSpell.size());
				302	PP.LexUnexpandedToken(PragmaTok);
				303	}
				304	OutputChar('\n');
				305	}
				306	};
				307	} // end anonymous namespace
				308
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	309
				310	enum AvoidConcatInfo {
				311	/// By default, a token never needs to avoid concatenation. Most tokens (e.g.
				312	/// ',', ')', etc) don't cause a problem when concatenated.
				313	aci_never_avoid_concat = 0,
				314
				315	/// aci_custom_firstchar - AvoidConcat contains custom code to handle this
				316	/// token's requirements, and it needs to know the first character of the
				317	/// token.
				318	aci_custom_firstchar = 1,
				319
				320	/// aci_custom - AvoidConcat contains custom code to handle this token's
				321	/// requirements, but it doesn't need to know the first character of the
				322	/// token.
				323	aci_custom = 2,
				324
				325	/// aci_avoid_equal - Many tokens cannot be safely followed by an '='
				326	/// character. For example, "<<" turns into "<<=" when followed by an =.
				327	aci_avoid_equal = 4
				328	};
				329
				330	/// This array contains information for each token on what action to take when
				331	/// avoiding concatenation of tokens in the AvoidConcat method.
				332	static char TokenInfo[tok::NUM_TOKENS];
				333
				334	/// InitAvoidConcatTokenInfo - Tokens that must avoid concatenation should be
				335	/// marked by this function.
				336	static void InitAvoidConcatTokenInfo() {
				337	// These tokens have custom code in AvoidConcat.
				338	TokenInfo[tok::identifier ] \|= aci_custom;
				339	TokenInfo[tok::numeric_constant] \|= aci_custom_firstchar;
				340	TokenInfo[tok::period ] \|= aci_custom_firstchar;
				341	TokenInfo[tok::amp ] \|= aci_custom_firstchar;
				342	TokenInfo[tok::plus ] \|= aci_custom_firstchar;
				343	TokenInfo[tok::minus ] \|= aci_custom_firstchar;
				344	TokenInfo[tok::slash ] \|= aci_custom_firstchar;
				345	TokenInfo[tok::less ] \|= aci_custom_firstchar;
				346	TokenInfo[tok::greater ] \|= aci_custom_firstchar;
				347	TokenInfo[tok::pipe ] \|= aci_custom_firstchar;
				348	TokenInfo[tok::percent ] \|= aci_custom_firstchar;
				349	TokenInfo[tok::colon ] \|= aci_custom_firstchar;
				350	TokenInfo[tok::hash ] \|= aci_custom_firstchar;
				351	TokenInfo[tok::arrow ] \|= aci_custom_firstchar;
				352
				353	// These tokens change behavior if followed by an '='.
				354	TokenInfo[tok::amp ] \|= aci_avoid_equal; // &=
				355	TokenInfo[tok::plus ] \|= aci_avoid_equal; // +=
				356	TokenInfo[tok::minus ] \|= aci_avoid_equal; // -=
				357	TokenInfo[tok::slash ] \|= aci_avoid_equal; // /=
				358	TokenInfo[tok::less ] \|= aci_avoid_equal; // <=
				359	TokenInfo[tok::greater ] \|= aci_avoid_equal; // >=
				360	TokenInfo[tok::pipe ] \|= aci_avoid_equal; // \|=
				361	TokenInfo[tok::percent ] \|= aci_avoid_equal; // %=
				362	TokenInfo[tok::star ] \|= aci_avoid_equal; // *=
				363	TokenInfo[tok::exclaim ] \|= aci_avoid_equal; // !=
				364	TokenInfo[tok::lessless ] \|= aci_avoid_equal; // <<=
				365	TokenInfo[tok::greaterequal] \|= aci_avoid_equal; // >>=
				366	TokenInfo[tok::caret ] \|= aci_avoid_equal; // ^=
				367	TokenInfo[tok::equal ] \|= aci_avoid_equal; // ==
				368	}
				369
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	370	/// AvoidConcat - If printing PrevTok immediately followed by Tok would cause
				371	/// the two individual tokens to be lexed as a single token, return true (which
				372	/// causes a space to be printed between them). This allows the output of -E
				373	/// mode to be lexed to the same token stream as lexing the input directly
				374	/// would.
				375	///
				376	/// This code must conservatively return true if it doesn't want to be 100%
				377	/// accurate. This will cause the output to include extra space characters, but
				378	/// the resulting output won't have incorrect concatenations going on. Examples
				379	/// include "..", which we print with a space between, because we don't want to
				380	/// track enough to tell "x.." from "...".
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	381	bool PrintPPOutputPPCallbacks::AvoidConcat(const Token &PrevTok,
				382	const Token &Tok) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	383	char Buffer[256];
				384
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	385	tok::TokenKind PrevKind = PrevTok.getKind();
				386	if (PrevTok.getIdentifierInfo()) // Language keyword or named operator.
				387	PrevKind = tok::identifier;
				388
				389	// Look up information on when we should avoid concatenation with prevtok.
				390	unsigned ConcatInfo = TokenInfo[PrevKind];
				391
				392	// If prevtok never causes a problem for anything after it, return quickly.
				393	if (ConcatInfo == 0) return false;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	394
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	395	if (ConcatInfo & aci_avoid_equal) {
				396	// If the next token is '=' or '==', avoid concatenation.
				397	if (Tok.getKind() == tok::equal \|\|
				398	Tok.getKind() == tok::equalequal)
				399	return true;
				400	ConcatInfo &= ~ConcatInfo;
				401	}
				402
				403	if (ConcatInfo == 0) return false;
				404
				405
				406
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	407	// Basic algorithm: we look at the first character of the second token, and
				408	// determine whether it, if appended to the first token, would form (or would
				409	// contribute) to a larger token if concatenated.
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	410	char FirstChar = 0;
				411	if (ConcatInfo & aci_custom) {
				412	// If the token does not need to know the first character, don't get it.
				413	} else if (IdentifierInfo *II = Tok.getIdentifierInfo()) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	414	// Avoid spelling identifiers, the most common form of token.
				415	FirstChar = II->getName()[0];
Chris Lattner	b19f5e8	2007-07-23 05:18:42 +0000	[diff] [blame]	416	} else if (!Tok.needsCleaning()) {
				417	SourceManager &SrcMgr = PP.getSourceManager();
				418	FirstChar =
				419	*SrcMgr.getCharacterData(SrcMgr.getPhysicalLoc(Tok.getLocation()));
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	420	} else if (Tok.getLength() < 256) {
				421	const char *TokPtr = Buffer;
				422	PP.getSpelling(Tok, TokPtr);
				423	FirstChar = TokPtr[0];
				424	} else {
				425	FirstChar = PP.getSpelling(Tok)[0];
				426	}
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	427
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	428	switch (PrevKind) {
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	429	default: assert(0 && "InitAvoidConcatTokenInfo built wrong");
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	430	case tok::identifier: // id+id or id+number or id+L"foo".
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	431	if (Tok.getKind() == tok::numeric_constant \|\| Tok.getIdentifierInfo() \|\|
				432	Tok.getKind() == tok::wide_string_literal /* \|\|
				433	Tok.getKind() == tok::wide_char_literal*/)
				434	return true;
				435	if (Tok.getKind() != tok::char_constant)
				436	return false;
				437
				438	// FIXME: need a wide_char_constant!
				439	if (!Tok.needsCleaning()) {
				440	SourceManager &SrcMgr = PP.getSourceManager();
				441	return *SrcMgr.getCharacterData(SrcMgr.getPhysicalLoc(Tok.getLocation()))
				442	== 'L';
				443	} else if (Tok.getLength() < 256) {
				444	const char *TokPtr = Buffer;
				445	PP.getSpelling(Tok, TokPtr);
				446	return TokPtr[0] == 'L';
				447	} else {
				448	return PP.getSpelling(Tok)[0] == 'L';
				449	}
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	450	case tok::numeric_constant:
				451	return isalnum(FirstChar) \|\| Tok.getKind() == tok::numeric_constant \|\|
				452	FirstChar == '+' \|\| FirstChar == '-' \|\| FirstChar == '.';
				453	case tok::period: // ..., .*, .1234
				454	return FirstChar == '.' \|\| FirstChar == '*' \|\| isdigit(FirstChar);
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	455	case tok::amp: // &&
				456	return FirstChar == '&';
				457	case tok::plus: // ++
				458	return FirstChar == '+';
				459	case tok::minus: // --, ->, ->*
				460	return FirstChar == '-' \|\| FirstChar == '>';
				461	case tok::slash: //, /*, //
				462	return FirstChar == '*' \|\| FirstChar == '/';
				463	case tok::less: // <<, <<=, <:, <%
				464	return FirstChar == '<' \|\| FirstChar == ':' \|\| FirstChar == '%';
				465	case tok::greater: // >>, >>=
				466	return FirstChar == '>';
				467	case tok::pipe: // \|\|
				468	return FirstChar == '\|';
				469	case tok::percent: // %>, %:
				470	return FirstChar == '>' \|\| FirstChar == ':';
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	471	case tok::colon: // ::, :>
				472	return FirstChar == ':' \|\| FirstChar == '>';
				473	case tok::hash: // ##, #@, %:%:
				474	return FirstChar == '#' \|\| FirstChar == '@' \|\| FirstChar == '%';
				475	case tok::arrow: // ->*
				476	return FirstChar == '*';
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	477	}
				478	}
				479
				480	/// DoPrintPreprocessedInput - This implements -E mode.
				481	///
				482	void clang::DoPrintPreprocessedInput(unsigned MainFileID, Preprocessor &PP,
				483	const LangOptions &Options) {
				484	// Inform the preprocessor whether we want it to retain comments or not, due
				485	// to -C or -CC.
				486	PP.SetCommentRetentionState(EnableCommentOutput, EnableMacroCommentOutput);
				487
				488	InitOutputBuffer();
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	489	InitAvoidConcatTokenInfo();
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	490
Chris Lattner	d217773	2007-07-20 16:59:19 +0000	[diff] [blame]	491	Token Tok, PrevTok;
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	492	char Buffer[256];
				493	PrintPPOutputPPCallbacks *Callbacks = new PrintPPOutputPPCallbacks(PP);
				494	PP.setPPCallbacks(Callbacks);
				495
				496	PP.AddPragmaHandler(0, new UnknownPragmaHandler("#pragma", Callbacks));
				497	PP.AddPragmaHandler("GCC", new UnknownPragmaHandler("#pragma GCC",Callbacks));
				498
				499	// After we have configured the preprocessor, enter the main file.
				500
				501	// Start parsing the specified input file.
				502	PP.EnterSourceFile(MainFileID, 0, true);
				503
				504	do {
				505	PrevTok = Tok;
				506	PP.Lex(Tok);
				507
				508	// If this token is at the start of a line, emit newlines if needed.
				509	if (Tok.isAtStartOfLine()) {
				510	Callbacks->HandleFirstTokOnLine(Tok);
				511	} else if (Tok.hasLeadingSpace() \|\|
Chris Lattner	f0f2b29	2007-07-23 06:09:34 +0000	[diff] [blame]	512	// If we haven't emitted a token on this line yet, PrevTok isn't
				513	// useful to look at and no concatenation could happen anyway.
				514	(!Callbacks->hasEmittedTokensOnThisLine() &&
				515	// Don't print "-" next to "-", it would form "--".
				516	Callbacks->AvoidConcat(PrevTok, Tok))) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	517	OutputChar(' ');
				518	}
				519
Chris Lattner	2933f41	2007-07-23 06:14:36 +0000	[diff] [blame^]	520	if (IdentifierInfo *II = Tok.getIdentifierInfo()) {
				521	const char *Str = II->getName();
				522	unsigned Len = Tok.needsCleaning() ? strlen(Str) : Tok.getLength();
				523	OutputString(Str, Len);
				524	} else if (Tok.getLength() < 256) {
Reid Spencer	5f016e2	2007-07-11 17:01:13 +0000	[diff] [blame]	525	const char *TokPtr = Buffer;
				526	unsigned Len = PP.getSpelling(Tok, TokPtr);
				527	OutputString(TokPtr, Len);
				528	} else {
				529	std::string S = PP.getSpelling(Tok);
				530	OutputString(&S[0], S.size());
				531	}
				532	Callbacks->SetEmittedTokensOnThisLine();
				533	} while (Tok.getKind() != tok::eof);
				534	OutputChar('\n');
				535
				536	CleanupOutputBuffer();
				537	}
				538