blob: a73757f1b59e09c75a387e98a276f1f1517cdec7 [file] [log] [blame]
Chris Lattner4b009652007-07-25 00:24:17 +00001//===--- Preprocess.cpp - C Language Family Preprocessor Implementation ---===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner959e5be2007-12-29 19:59:25 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattner4b009652007-07-25 00:24:17 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the Preprocessor interface.
11//
12//===----------------------------------------------------------------------===//
13//
14// Options to support:
15// -H - Print the name of each header file used.
16// -d[MDNI] - Dump various things.
17// -fworking-directory - #line's with preprocessor's working dir.
18// -fpreprocessed
19// -dependency-file,-M,-MM,-MF,-MG,-MP,-MT,-MQ,-MD,-MMD
20// -W*
21// -w
22//
23// Messages to emit:
24// "Multiple include guards may be useful for:\n"
25//
26//===----------------------------------------------------------------------===//
27
28#include "clang/Lex/Preprocessor.h"
29#include "clang/Lex/HeaderSearch.h"
30#include "clang/Lex/MacroInfo.h"
31#include "clang/Lex/PPCallbacks.h"
32#include "clang/Lex/Pragma.h"
33#include "clang/Lex/ScratchBuffer.h"
34#include "clang/Basic/Diagnostic.h"
35#include "clang/Basic/FileManager.h"
36#include "clang/Basic/SourceManager.h"
37#include "clang/Basic/TargetInfo.h"
38#include "llvm/ADT/SmallVector.h"
39#include "llvm/Support/MemoryBuffer.h"
Ted Kremenekce4c64e2008-01-14 16:44:48 +000040#include "llvm/Support/Streams.h"
Chris Lattner1b023182007-09-03 18:30:32 +000041#include <ctime>
Chris Lattner4b009652007-07-25 00:24:17 +000042using namespace clang;
43
44//===----------------------------------------------------------------------===//
45
46Preprocessor::Preprocessor(Diagnostic &diags, const LangOptions &opts,
47 TargetInfo &target, SourceManager &SM,
48 HeaderSearch &Headers)
49 : Diags(diags), Features(opts), Target(target), FileMgr(Headers.getFileMgr()),
50 SourceMgr(SM), HeaderInfo(Headers), Identifiers(opts),
51 CurLexer(0), CurDirLookup(0), CurMacroExpander(0), Callbacks(0) {
52 ScratchBuf = new ScratchBuffer(SourceMgr);
53
54 // Clear stats.
55 NumDirectives = NumDefined = NumUndefined = NumPragma = 0;
56 NumIf = NumElse = NumEndif = 0;
57 NumEnteredSourceFiles = 0;
58 NumMacroExpanded = NumFnMacroExpanded = NumBuiltinMacroExpanded = 0;
59 NumFastMacroExpanded = NumTokenPaste = NumFastTokenPaste = 0;
60 MaxIncludeStackDepth = 0;
61 NumSkipped = 0;
62
63 // Default to discarding comments.
64 KeepComments = false;
65 KeepMacroComments = false;
66
67 // Macro expansion is enabled.
68 DisableMacroExpansion = false;
69 InMacroArgs = false;
70 NumCachedMacroExpanders = 0;
71
72 // "Poison" __VA_ARGS__, which can only appear in the expansion of a macro.
73 // This gets unpoisoned where it is allowed.
74 (Ident__VA_ARGS__ = getIdentifierInfo("__VA_ARGS__"))->setIsPoisoned();
75
Chris Lattnerd1f21e12007-10-09 22:10:18 +000076 Predefines = 0;
77
Chris Lattner4b009652007-07-25 00:24:17 +000078 // Initialize the pragma handlers.
79 PragmaHandlers = new PragmaNamespace(0);
80 RegisterBuiltinPragmas();
81
82 // Initialize builtin macros like __LINE__ and friends.
83 RegisterBuiltinMacros();
84}
85
86Preprocessor::~Preprocessor() {
87 // Free any active lexers.
88 delete CurLexer;
89
90 while (!IncludeMacroStack.empty()) {
91 delete IncludeMacroStack.back().TheLexer;
92 delete IncludeMacroStack.back().TheMacroExpander;
93 IncludeMacroStack.pop_back();
94 }
Chris Lattner7a1b0882007-10-07 08:44:20 +000095
96 // Free any macro definitions.
97 for (llvm::DenseMap<IdentifierInfo*, MacroInfo*>::iterator I =
98 Macros.begin(), E = Macros.end(); I != E; ++I) {
99 // Free the macro definition.
100 delete I->second;
101 I->second = 0;
102 I->first->setHasMacroDefinition(false);
103 }
Chris Lattner4b009652007-07-25 00:24:17 +0000104
105 // Free any cached macro expanders.
106 for (unsigned i = 0, e = NumCachedMacroExpanders; i != e; ++i)
107 delete MacroExpanderCache[i];
108
109 // Release pragma information.
110 delete PragmaHandlers;
111
112 // Delete the scratch buffer info.
113 delete ScratchBuf;
114}
115
116PPCallbacks::~PPCallbacks() {
117}
118
119/// Diag - Forwarding function for diagnostics. This emits a diagnostic at
120/// the specified Token's location, translating the token's start
121/// position in the current buffer into a SourcePosition object for rendering.
122void Preprocessor::Diag(SourceLocation Loc, unsigned DiagID) {
Ted Kremenekd7f64cd2007-12-12 22:39:36 +0000123 Diags.Report(getFullLoc(Loc), DiagID);
Chris Lattner4b009652007-07-25 00:24:17 +0000124}
125
126void Preprocessor::Diag(SourceLocation Loc, unsigned DiagID,
127 const std::string &Msg) {
Ted Kremenekd7f64cd2007-12-12 22:39:36 +0000128 Diags.Report(getFullLoc(Loc), DiagID, &Msg, 1);
Chris Lattner4b009652007-07-25 00:24:17 +0000129}
130
131void Preprocessor::DumpToken(const Token &Tok, bool DumpFlags) const {
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000132 llvm::cerr << tok::getTokenName(Tok.getKind()) << " '"
133 << getSpelling(Tok) << "'";
Chris Lattner4b009652007-07-25 00:24:17 +0000134
135 if (!DumpFlags) return;
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000136
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000137 llvm::cerr << "\t";
Chris Lattner4b009652007-07-25 00:24:17 +0000138 if (Tok.isAtStartOfLine())
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000139 llvm::cerr << " [StartOfLine]";
Chris Lattner4b009652007-07-25 00:24:17 +0000140 if (Tok.hasLeadingSpace())
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000141 llvm::cerr << " [LeadingSpace]";
Chris Lattner4b009652007-07-25 00:24:17 +0000142 if (Tok.isExpandDisabled())
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000143 llvm::cerr << " [ExpandDisabled]";
Chris Lattner4b009652007-07-25 00:24:17 +0000144 if (Tok.needsCleaning()) {
145 const char *Start = SourceMgr.getCharacterData(Tok.getLocation());
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000146 llvm::cerr << " [UnClean='" << std::string(Start, Start+Tok.getLength())
147 << "']";
Chris Lattner4b009652007-07-25 00:24:17 +0000148 }
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000149
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000150 llvm::cerr << "\tLoc=<";
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000151 DumpLocation(Tok.getLocation());
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000152 llvm::cerr << ">";
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000153}
154
155void Preprocessor::DumpLocation(SourceLocation Loc) const {
156 SourceLocation LogLoc = SourceMgr.getLogicalLoc(Loc);
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000157 llvm::cerr << SourceMgr.getSourceName(LogLoc) << ':'
158 << SourceMgr.getLineNumber(LogLoc) << ':'
159 << SourceMgr.getLineNumber(LogLoc);
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000160
161 SourceLocation PhysLoc = SourceMgr.getPhysicalLoc(Loc);
162 if (PhysLoc != LogLoc) {
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000163 llvm::cerr << " <PhysLoc=";
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000164 DumpLocation(PhysLoc);
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000165 llvm::cerr << ">";
Chris Lattnerc0f7c512007-12-09 20:31:55 +0000166 }
Chris Lattner4b009652007-07-25 00:24:17 +0000167}
168
169void Preprocessor::DumpMacro(const MacroInfo &MI) const {
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000170 llvm::cerr << "MACRO: ";
Chris Lattner4b009652007-07-25 00:24:17 +0000171 for (unsigned i = 0, e = MI.getNumTokens(); i != e; ++i) {
172 DumpToken(MI.getReplacementToken(i));
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000173 llvm::cerr << " ";
Chris Lattner4b009652007-07-25 00:24:17 +0000174 }
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000175 llvm::cerr << "\n";
Chris Lattner4b009652007-07-25 00:24:17 +0000176}
177
178void Preprocessor::PrintStats() {
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000179 llvm::cerr << "\n*** Preprocessor Stats:\n";
180 llvm::cerr << NumDirectives << " directives found:\n";
181 llvm::cerr << " " << NumDefined << " #define.\n";
182 llvm::cerr << " " << NumUndefined << " #undef.\n";
183 llvm::cerr << " #include/#include_next/#import:\n";
184 llvm::cerr << " " << NumEnteredSourceFiles << " source files entered.\n";
185 llvm::cerr << " " << MaxIncludeStackDepth << " max include stack depth\n";
186 llvm::cerr << " " << NumIf << " #if/#ifndef/#ifdef.\n";
187 llvm::cerr << " " << NumElse << " #else/#elif.\n";
188 llvm::cerr << " " << NumEndif << " #endif.\n";
189 llvm::cerr << " " << NumPragma << " #pragma.\n";
190 llvm::cerr << NumSkipped << " #if/#ifndef#ifdef regions skipped\n";
Chris Lattner4b009652007-07-25 00:24:17 +0000191
Ted Kremenekce4c64e2008-01-14 16:44:48 +0000192 llvm::cerr << NumMacroExpanded << "/" << NumFnMacroExpanded << "/"
193 << NumBuiltinMacroExpanded << " obj/fn/builtin macros expanded, "
194 << NumFastMacroExpanded << " on the fast path.\n";
195 llvm::cerr << (NumFastTokenPaste+NumTokenPaste)
196 << " token paste (##) operations performed, "
197 << NumFastTokenPaste << " on the fast path.\n";
Chris Lattner4b009652007-07-25 00:24:17 +0000198}
199
200//===----------------------------------------------------------------------===//
201// Token Spelling
202//===----------------------------------------------------------------------===//
203
204
205/// getSpelling() - Return the 'spelling' of this token. The spelling of a
206/// token are the characters used to represent the token in the source file
207/// after trigraph expansion and escaped-newline folding. In particular, this
208/// wants to get the true, uncanonicalized, spelling of things like digraphs
209/// UCNs, etc.
210std::string Preprocessor::getSpelling(const Token &Tok) const {
211 assert((int)Tok.getLength() >= 0 && "Token character range is bogus!");
212
213 // If this token contains nothing interesting, return it directly.
214 const char *TokStart = SourceMgr.getCharacterData(Tok.getLocation());
215 if (!Tok.needsCleaning())
216 return std::string(TokStart, TokStart+Tok.getLength());
217
218 std::string Result;
219 Result.reserve(Tok.getLength());
220
221 // Otherwise, hard case, relex the characters into the string.
222 for (const char *Ptr = TokStart, *End = TokStart+Tok.getLength();
223 Ptr != End; ) {
224 unsigned CharSize;
225 Result.push_back(Lexer::getCharAndSizeNoWarn(Ptr, CharSize, Features));
226 Ptr += CharSize;
227 }
228 assert(Result.size() != unsigned(Tok.getLength()) &&
229 "NeedsCleaning flag set on something that didn't need cleaning!");
230 return Result;
231}
232
233/// getSpelling - This method is used to get the spelling of a token into a
234/// preallocated buffer, instead of as an std::string. The caller is required
235/// to allocate enough space for the token, which is guaranteed to be at least
236/// Tok.getLength() bytes long. The actual length of the token is returned.
237///
238/// Note that this method may do two possible things: it may either fill in
239/// the buffer specified with characters, or it may *change the input pointer*
240/// to point to a constant buffer with the data already in it (avoiding a
241/// copy). The caller is not allowed to modify the returned buffer pointer
242/// if an internal buffer is returned.
243unsigned Preprocessor::getSpelling(const Token &Tok,
244 const char *&Buffer) const {
245 assert((int)Tok.getLength() >= 0 && "Token character range is bogus!");
246
247 // If this token is an identifier, just return the string from the identifier
248 // table, which is very quick.
249 if (const IdentifierInfo *II = Tok.getIdentifierInfo()) {
250 Buffer = II->getName();
251
252 // Return the length of the token. If the token needed cleaning, don't
253 // include the size of the newlines or trigraphs in it.
254 if (!Tok.needsCleaning())
255 return Tok.getLength();
256 else
257 return strlen(Buffer);
258 }
259
260 // Otherwise, compute the start of the token in the input lexer buffer.
261 const char *TokStart = SourceMgr.getCharacterData(Tok.getLocation());
262
263 // If this token contains nothing interesting, return it directly.
264 if (!Tok.needsCleaning()) {
265 Buffer = TokStart;
266 return Tok.getLength();
267 }
268 // Otherwise, hard case, relex the characters into the string.
269 char *OutBuf = const_cast<char*>(Buffer);
270 for (const char *Ptr = TokStart, *End = TokStart+Tok.getLength();
271 Ptr != End; ) {
272 unsigned CharSize;
273 *OutBuf++ = Lexer::getCharAndSizeNoWarn(Ptr, CharSize, Features);
274 Ptr += CharSize;
275 }
276 assert(unsigned(OutBuf-Buffer) != Tok.getLength() &&
277 "NeedsCleaning flag set on something that didn't need cleaning!");
278
279 return OutBuf-Buffer;
280}
281
282
283/// CreateString - Plop the specified string into a scratch buffer and return a
284/// location for it. If specified, the source location provides a source
285/// location for the token.
286SourceLocation Preprocessor::
287CreateString(const char *Buf, unsigned Len, SourceLocation SLoc) {
288 if (SLoc.isValid())
289 return ScratchBuf->getToken(Buf, Len, SLoc);
290 return ScratchBuf->getToken(Buf, Len);
291}
292
293
294/// AdvanceToTokenCharacter - Given a location that specifies the start of a
295/// token, return a new location that specifies a character within the token.
296SourceLocation Preprocessor::AdvanceToTokenCharacter(SourceLocation TokStart,
297 unsigned CharNo) {
298 // If they request the first char of the token, we're trivially done. If this
299 // is a macro expansion, it doesn't make sense to point to a character within
300 // the instantiation point (the name). We could point to the source
301 // character, but without also pointing to instantiation info, this is
302 // confusing.
303 if (CharNo == 0 || TokStart.isMacroID()) return TokStart;
304
305 // Figure out how many physical characters away the specified logical
306 // character is. This needs to take into consideration newlines and
307 // trigraphs.
308 const char *TokPtr = SourceMgr.getCharacterData(TokStart);
309 unsigned PhysOffset = 0;
310
311 // The usual case is that tokens don't contain anything interesting. Skip
312 // over the uninteresting characters. If a token only consists of simple
313 // chars, this method is extremely fast.
314 while (CharNo && Lexer::isObviouslySimpleCharacter(*TokPtr))
315 ++TokPtr, --CharNo, ++PhysOffset;
316
317 // If we have a character that may be a trigraph or escaped newline, create a
318 // lexer to parse it correctly.
319 if (CharNo != 0) {
320 // Create a lexer starting at this token position.
321 Lexer TheLexer(TokStart, *this, TokPtr);
322 Token Tok;
323 // Skip over characters the remaining characters.
324 const char *TokStartPtr = TokPtr;
325 for (; CharNo; --CharNo)
326 TheLexer.getAndAdvanceChar(TokPtr, Tok);
327
328 PhysOffset += TokPtr-TokStartPtr;
329 }
330
331 return TokStart.getFileLocWithOffset(PhysOffset);
332}
333
334
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000335//===----------------------------------------------------------------------===//
336// Preprocessor Initialization Methods
337//===----------------------------------------------------------------------===//
338
/// DefineBuiltinMacro - Append one directive line for Macro to Buf.  The line
/// starts with Command ("#define " by default).  Macro is either "XXX", which
/// produces "XXX 1", or "XXX=Y z W", which produces "XXX Y z W" (only the
/// first '=' is replaced by a space).  "XXX=" yields a macro with no value.
/// The line is terminated with a newline.
static void DefineBuiltinMacro(std::vector<char> &Buf, const char *Macro,
                               const char *Command = "#define ") {
  const char *const MacroEnd = Macro+strlen(Macro);

  // Directive keyword first.
  Buf.insert(Buf.end(), Command, Command+strlen(Command));

  const char *Eq = strchr(Macro, '=');
  if (Eq == 0) {
    // No explicit value: emit "macroname 1".
    Buf.insert(Buf.end(), Macro, MacroEnd);
    Buf.push_back(' ');
    Buf.push_back('1');
  } else {
    // Emit the name, a space in place of the '=', then the value.
    Buf.insert(Buf.end(), Macro, Eq);
    Buf.push_back(' ');
    Buf.insert(Buf.end(), Eq+1, MacroEnd);
  }

  Buf.push_back('\n');
}
358
359
360static void InitializePredefinedMacros(Preprocessor &PP,
361 std::vector<char> &Buf) {
362 // FIXME: Implement magic like cpp_init_builtins for things like __STDC__
363 // and __DATE__ etc.
364#if 0
365 /* __STDC__ has the value 1 under normal circumstances.
366 However, if (a) we are in a system header, (b) the option
367 stdc_0_in_system_headers is true (set by target config), and
368 (c) we are not in strictly conforming mode, then it has the
369 value 0. (b) and (c) are already checked in cpp_init_builtins. */
370 //case BT_STDC:
371 if (cpp_in_system_header (pfile))
372 number = 0;
373 else
374 number = 1;
375 break;
376#endif
377 // These should all be defined in the preprocessor according to the
378 // current language configuration.
379 DefineBuiltinMacro(Buf, "__STDC__=1");
380 //DefineBuiltinMacro(Buf, "__ASSEMBLER__=1");
381 if (PP.getLangOptions().C99 && !PP.getLangOptions().CPlusPlus)
382 DefineBuiltinMacro(Buf, "__STDC_VERSION__=199901L");
383 else if (0) // STDC94 ?
384 DefineBuiltinMacro(Buf, "__STDC_VERSION__=199409L");
385
386 DefineBuiltinMacro(Buf, "__STDC_HOSTED__=1");
387 if (PP.getLangOptions().ObjC1)
388 DefineBuiltinMacro(Buf, "__OBJC__=1");
389 if (PP.getLangOptions().ObjC2)
390 DefineBuiltinMacro(Buf, "__OBJC2__=1");
Steve Naroffae84af82007-10-31 18:42:27 +0000391
Chris Lattner77cec472007-10-10 17:48:53 +0000392 // Add __builtin_va_list typedef.
393 {
394 const char *VAList = PP.getTargetInfo().getVAListDeclaration();
395 Buf.insert(Buf.end(), VAList, VAList+strlen(VAList));
396 Buf.push_back('\n');
397 }
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000398
399 // Get the target #defines.
400 PP.getTargetInfo().getTargetDefines(Buf);
401
402 // Compiler set macros.
403 DefineBuiltinMacro(Buf, "__APPLE_CC__=5250");
Steve Naroffb5a086e2007-11-10 18:06:36 +0000404 DefineBuiltinMacro(Buf, "__ENVIRONMENT_MAC_OS_X_VERSION_MIN_REQUIRED__=1050");
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000405 DefineBuiltinMacro(Buf, "__GNUC_MINOR__=0");
406 DefineBuiltinMacro(Buf, "__GNUC_PATCHLEVEL__=1");
407 DefineBuiltinMacro(Buf, "__GNUC__=4");
408 DefineBuiltinMacro(Buf, "__GXX_ABI_VERSION=1002");
409 DefineBuiltinMacro(Buf, "__VERSION__=\"4.0.1 (Apple Computer, Inc. "
410 "build 5250)\"");
411
412 // Build configuration options.
413 DefineBuiltinMacro(Buf, "__DYNAMIC__=1");
414 DefineBuiltinMacro(Buf, "__FINITE_MATH_ONLY__=0");
415 DefineBuiltinMacro(Buf, "__NO_INLINE__=1");
416 DefineBuiltinMacro(Buf, "__PIC__=1");
417
418
419 if (PP.getLangOptions().CPlusPlus) {
420 DefineBuiltinMacro(Buf, "__DEPRECATED=1");
421 DefineBuiltinMacro(Buf, "__EXCEPTIONS=1");
422 DefineBuiltinMacro(Buf, "__GNUG__=4");
423 DefineBuiltinMacro(Buf, "__GXX_WEAK__=1");
424 DefineBuiltinMacro(Buf, "__cplusplus=1");
425 DefineBuiltinMacro(Buf, "__private_extern__=extern");
426 }
427
428 // FIXME: Should emit a #line directive here.
429}
430
431
432/// EnterMainSourceFile - Enter the specified FileID as the main source file,
Nate Begeman886bf132008-01-07 04:01:26 +0000433/// which implicitly adds the builtin defines etc.
Ted Kremenek17861c52007-12-19 22:51:13 +0000434void Preprocessor::EnterMainSourceFile() {
435
436 unsigned MainFileID = SourceMgr.getMainFileID();
437
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000438 // Enter the main file source buffer.
439 EnterSourceFile(MainFileID, 0);
440
Chris Lattnerb45f05c2007-11-15 19:07:47 +0000441 // Tell the header info that the main file was entered. If the file is later
442 // #imported, it won't be re-entered.
443 if (const FileEntry *FE =
444 SourceMgr.getFileEntryForLoc(SourceLocation::getFileLoc(MainFileID, 0)))
445 HeaderInfo.IncrementIncludeCount(FE);
446
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000447 std::vector<char> PrologFile;
448 PrologFile.reserve(4080);
449
450 // Install things like __POWERPC__, __GNUC__, etc into the macro table.
451 InitializePredefinedMacros(*this, PrologFile);
452
453 // Add on the predefines from the driver.
454 PrologFile.insert(PrologFile.end(), Predefines,Predefines+strlen(Predefines));
455
456 // Memory buffer must end with a null byte!
457 PrologFile.push_back(0);
458
459 // Now that we have emitted the predefined macros, #includes, etc into
460 // PrologFile, preprocess it to populate the initial preprocessor state.
461 llvm::MemoryBuffer *SB =
462 llvm::MemoryBuffer::getMemBufferCopy(&PrologFile.front(),&PrologFile.back(),
463 "<predefines>");
464 assert(SB && "Cannot fail to create predefined source buffer");
465 unsigned FileID = SourceMgr.createFileIDForMemBuffer(SB);
466 assert(FileID && "Could not create FileID for predefines?");
467
468 // Start parsing the predefines.
469 EnterSourceFile(FileID, 0);
470}
Chris Lattner4b009652007-07-25 00:24:17 +0000471
472//===----------------------------------------------------------------------===//
473// Source File Location Methods.
474//===----------------------------------------------------------------------===//
475
476/// LookupFile - Given a "foo" or <foo> reference, look up the indicated file,
477/// return null on failure. isAngled indicates whether the file reference is
478/// for system #include's or not (i.e. using <> instead of "").
479const FileEntry *Preprocessor::LookupFile(const char *FilenameStart,
480 const char *FilenameEnd,
481 bool isAngled,
482 const DirectoryLookup *FromDir,
483 const DirectoryLookup *&CurDir) {
484 // If the header lookup mechanism may be relative to the current file, pass in
485 // info about where the current file is.
486 const FileEntry *CurFileEnt = 0;
487 if (!FromDir) {
488 SourceLocation FileLoc = getCurrentFileLexer()->getFileLoc();
489 CurFileEnt = SourceMgr.getFileEntryForLoc(FileLoc);
490 }
491
492 // Do a standard file entry lookup.
493 CurDir = CurDirLookup;
494 const FileEntry *FE =
495 HeaderInfo.LookupFile(FilenameStart, FilenameEnd,
496 isAngled, FromDir, CurDir, CurFileEnt);
497 if (FE) return FE;
498
499 // Otherwise, see if this is a subframework header. If so, this is relative
500 // to one of the headers on the #include stack. Walk the list of the current
501 // headers on the #include stack and pass them to HeaderInfo.
502 if (CurLexer && !CurLexer->Is_PragmaLexer) {
Chris Lattner017d65b2008-02-01 05:34:02 +0000503 if ((CurFileEnt = SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc())))
504 if ((FE = HeaderInfo.LookupSubframeworkHeader(FilenameStart, FilenameEnd,
505 CurFileEnt)))
506 return FE;
Chris Lattner4b009652007-07-25 00:24:17 +0000507 }
508
509 for (unsigned i = 0, e = IncludeMacroStack.size(); i != e; ++i) {
510 IncludeStackInfo &ISEntry = IncludeMacroStack[e-i-1];
511 if (ISEntry.TheLexer && !ISEntry.TheLexer->Is_PragmaLexer) {
Chris Lattner017d65b2008-02-01 05:34:02 +0000512 if ((CurFileEnt =
513 SourceMgr.getFileEntryForLoc(ISEntry.TheLexer->getFileLoc())))
514 if ((FE = HeaderInfo.LookupSubframeworkHeader(FilenameStart,
515 FilenameEnd, CurFileEnt)))
516 return FE;
Chris Lattner4b009652007-07-25 00:24:17 +0000517 }
518 }
519
520 // Otherwise, we really couldn't find the file.
521 return 0;
522}
523
524/// isInPrimaryFile - Return true if we're in the top-level file, not in a
525/// #include.
526bool Preprocessor::isInPrimaryFile() const {
527 if (CurLexer && !CurLexer->Is_PragmaLexer)
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000528 return IncludeMacroStack.empty();
Chris Lattner4b009652007-07-25 00:24:17 +0000529
530 // If there are any stacked lexers, we're in a #include.
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000531 assert(IncludeMacroStack[0].TheLexer &&
532 !IncludeMacroStack[0].TheLexer->Is_PragmaLexer &&
533 "Top level include stack isn't our primary lexer?");
534 for (unsigned i = 1, e = IncludeMacroStack.size(); i != e; ++i)
Chris Lattner4b009652007-07-25 00:24:17 +0000535 if (IncludeMacroStack[i].TheLexer &&
536 !IncludeMacroStack[i].TheLexer->Is_PragmaLexer)
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000537 return false;
538 return true;
Chris Lattner4b009652007-07-25 00:24:17 +0000539}
540
541/// getCurrentLexer - Return the current file lexer being lexed from. Note
542/// that this ignores any potentially active macro expansions and _Pragma
543/// expansions going on at the time.
544Lexer *Preprocessor::getCurrentFileLexer() const {
545 if (CurLexer && !CurLexer->Is_PragmaLexer) return CurLexer;
546
547 // Look for a stacked lexer.
548 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
549 Lexer *L = IncludeMacroStack[i-1].TheLexer;
550 if (L && !L->Is_PragmaLexer) // Ignore macro & _Pragma expansions.
551 return L;
552 }
553 return 0;
554}
555
556
557/// EnterSourceFile - Add a source file to the top of the include stack and
558/// start lexing tokens from it instead of the current buffer. Return true
559/// on failure.
560void Preprocessor::EnterSourceFile(unsigned FileID,
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000561 const DirectoryLookup *CurDir) {
Chris Lattner4b009652007-07-25 00:24:17 +0000562 assert(CurMacroExpander == 0 && "Cannot #include a file inside a macro!");
563 ++NumEnteredSourceFiles;
564
565 if (MaxIncludeStackDepth < IncludeMacroStack.size())
566 MaxIncludeStackDepth = IncludeMacroStack.size();
567
568 Lexer *TheLexer = new Lexer(SourceLocation::getFileLoc(FileID, 0), *this);
Chris Lattner4b009652007-07-25 00:24:17 +0000569 EnterSourceFileWithLexer(TheLexer, CurDir);
570}
571
572/// EnterSourceFile - Add a source file to the top of the include stack and
573/// start lexing tokens from it instead of the current buffer.
574void Preprocessor::EnterSourceFileWithLexer(Lexer *TheLexer,
575 const DirectoryLookup *CurDir) {
576
577 // Add the current lexer to the include stack.
578 if (CurLexer || CurMacroExpander)
579 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
580 CurMacroExpander));
581
582 CurLexer = TheLexer;
583 CurDirLookup = CurDir;
584 CurMacroExpander = 0;
585
586 // Notify the client, if desired, that we are in a new source file.
587 if (Callbacks && !CurLexer->Is_PragmaLexer) {
588 DirectoryLookup::DirType FileType = DirectoryLookup::NormalHeaderDir;
589
590 // Get the file entry for the current file.
591 if (const FileEntry *FE =
592 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
593 FileType = HeaderInfo.getFileDirFlavor(FE);
594
595 Callbacks->FileChanged(CurLexer->getFileLoc(),
596 PPCallbacks::EnterFile, FileType);
597 }
598}
599
600
601
602/// EnterMacro - Add a Macro to the top of the include stack and start lexing
603/// tokens from it instead of the current buffer.
604void Preprocessor::EnterMacro(Token &Tok, MacroArgs *Args) {
605 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
606 CurMacroExpander));
607 CurLexer = 0;
608 CurDirLookup = 0;
609
610 if (NumCachedMacroExpanders == 0) {
611 CurMacroExpander = new MacroExpander(Tok, Args, *this);
612 } else {
613 CurMacroExpander = MacroExpanderCache[--NumCachedMacroExpanders];
614 CurMacroExpander->Init(Tok, Args);
615 }
616}
617
618/// EnterTokenStream - Add a "macro" context to the top of the include stack,
619/// which will cause the lexer to start returning the specified tokens. Note
620/// that these tokens will be re-macro-expanded when/if expansion is enabled.
621/// This method assumes that the specified stream of tokens has a permanent
622/// owner somewhere, so they do not need to be copied.
623void Preprocessor::EnterTokenStream(const Token *Toks, unsigned NumToks) {
624 // Save our current state.
625 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
626 CurMacroExpander));
627 CurLexer = 0;
628 CurDirLookup = 0;
629
630 // Create a macro expander to expand from the specified token stream.
631 if (NumCachedMacroExpanders == 0) {
632 CurMacroExpander = new MacroExpander(Toks, NumToks, *this);
633 } else {
634 CurMacroExpander = MacroExpanderCache[--NumCachedMacroExpanders];
635 CurMacroExpander->Init(Toks, NumToks);
636 }
637}
638
639/// RemoveTopOfLexerStack - Pop the current lexer/macro exp off the top of the
640/// lexer stack. This should only be used in situations where the current
641/// state of the top-of-stack lexer is known.
642void Preprocessor::RemoveTopOfLexerStack() {
643 assert(!IncludeMacroStack.empty() && "Ran out of stack entries to load");
644
645 if (CurMacroExpander) {
646 // Delete or cache the now-dead macro expander.
647 if (NumCachedMacroExpanders == MacroExpanderCacheSize)
648 delete CurMacroExpander;
649 else
650 MacroExpanderCache[NumCachedMacroExpanders++] = CurMacroExpander;
651 } else {
652 delete CurLexer;
653 }
654 CurLexer = IncludeMacroStack.back().TheLexer;
655 CurDirLookup = IncludeMacroStack.back().TheDirLookup;
656 CurMacroExpander = IncludeMacroStack.back().TheMacroExpander;
657 IncludeMacroStack.pop_back();
658}
659
660//===----------------------------------------------------------------------===//
661// Macro Expansion Handling.
662//===----------------------------------------------------------------------===//
663
Chris Lattner7a1b0882007-10-07 08:44:20 +0000664/// setMacroInfo - Specify a macro for this identifier.
665///
666void Preprocessor::setMacroInfo(IdentifierInfo *II, MacroInfo *MI) {
667 if (MI == 0) {
668 if (II->hasMacroDefinition()) {
669 Macros.erase(II);
670 II->setHasMacroDefinition(false);
671 }
672 } else {
673 Macros[II] = MI;
674 II->setHasMacroDefinition(true);
675 }
676}
677
Chris Lattner4b009652007-07-25 00:24:17 +0000678/// RegisterBuiltinMacro - Register the specified identifier in the identifier
679/// table and mark it as a builtin macro to be expanded.
680IdentifierInfo *Preprocessor::RegisterBuiltinMacro(const char *Name) {
681 // Get the identifier.
682 IdentifierInfo *Id = getIdentifierInfo(Name);
683
684 // Mark it as being a macro that is builtin.
685 MacroInfo *MI = new MacroInfo(SourceLocation());
686 MI->setIsBuiltinMacro();
Chris Lattner7a1b0882007-10-07 08:44:20 +0000687 setMacroInfo(Id, MI);
Chris Lattner4b009652007-07-25 00:24:17 +0000688 return Id;
689}
690
691
692/// RegisterBuiltinMacros - Register builtin macros, such as __LINE__ with the
693/// identifier table.
694void Preprocessor::RegisterBuiltinMacros() {
695 Ident__LINE__ = RegisterBuiltinMacro("__LINE__");
696 Ident__FILE__ = RegisterBuiltinMacro("__FILE__");
697 Ident__DATE__ = RegisterBuiltinMacro("__DATE__");
698 Ident__TIME__ = RegisterBuiltinMacro("__TIME__");
699 Ident_Pragma = RegisterBuiltinMacro("_Pragma");
700
701 // GCC Extensions.
702 Ident__BASE_FILE__ = RegisterBuiltinMacro("__BASE_FILE__");
703 Ident__INCLUDE_LEVEL__ = RegisterBuiltinMacro("__INCLUDE_LEVEL__");
704 Ident__TIMESTAMP__ = RegisterBuiltinMacro("__TIMESTAMP__");
705}
706
707/// isTrivialSingleTokenExpansion - Return true if MI, which has a single token
708/// in its expansion, currently expands to that token literally.
709static bool isTrivialSingleTokenExpansion(const MacroInfo *MI,
Chris Lattner7a1b0882007-10-07 08:44:20 +0000710 const IdentifierInfo *MacroIdent,
711 Preprocessor &PP) {
Chris Lattner4b009652007-07-25 00:24:17 +0000712 IdentifierInfo *II = MI->getReplacementToken(0).getIdentifierInfo();
713
714 // If the token isn't an identifier, it's always literally expanded.
715 if (II == 0) return true;
716
717 // If the identifier is a macro, and if that macro is enabled, it may be
718 // expanded so it's not a trivial expansion.
Chris Lattner7a1b0882007-10-07 08:44:20 +0000719 if (II->hasMacroDefinition() && PP.getMacroInfo(II)->isEnabled() &&
Chris Lattner4b009652007-07-25 00:24:17 +0000720 // Fast expanding "#define X X" is ok, because X would be disabled.
721 II != MacroIdent)
722 return false;
723
724 // If this is an object-like macro invocation, it is safe to trivially expand
725 // it.
726 if (MI->isObjectLike()) return true;
727
728 // If this is a function-like macro invocation, it's safe to trivially expand
729 // as long as the identifier is not a macro argument.
730 for (MacroInfo::arg_iterator I = MI->arg_begin(), E = MI->arg_end();
731 I != E; ++I)
732 if (*I == II)
733 return false; // Identifier is a macro argument.
734
735 return true;
736}
737
738
739/// isNextPPTokenLParen - Determine whether the next preprocessor token to be
740/// lexed is a '('. If so, consume the token and return true, if not, this
741/// method should have no observable side-effect on the lexed tokens.
742bool Preprocessor::isNextPPTokenLParen() {
743 // Do some quick tests for rejection cases.
744 unsigned Val;
745 if (CurLexer)
746 Val = CurLexer->isNextPPTokenLParen();
747 else
748 Val = CurMacroExpander->isNextTokenLParen();
749
750 if (Val == 2) {
751 // We have run off the end. If it's a source file we don't
752 // examine enclosing ones (C99 5.1.1.2p4). Otherwise walk up the
753 // macro stack.
754 if (CurLexer)
755 return false;
756 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
757 IncludeStackInfo &Entry = IncludeMacroStack[i-1];
758 if (Entry.TheLexer)
759 Val = Entry.TheLexer->isNextPPTokenLParen();
760 else
761 Val = Entry.TheMacroExpander->isNextTokenLParen();
762
763 if (Val != 2)
764 break;
765
766 // Ran off the end of a source file?
767 if (Entry.TheLexer)
768 return false;
769 }
770 }
771
772 // Okay, if we know that the token is a '(', lex it and return. Otherwise we
773 // have found something that isn't a '(' or we found the end of the
774 // translation unit. In either case, return false.
775 if (Val != 1)
776 return false;
777
778 Token Tok;
779 LexUnexpandedToken(Tok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000780 assert(Tok.is(tok::l_paren) && "Error computing l-paren-ness?");
Chris Lattner4b009652007-07-25 00:24:17 +0000781 return true;
782}
783
784/// HandleMacroExpandedIdentifier - If an identifier token is read that is to be
785/// expanded as a macro, handle it and return the next token as 'Identifier'.
786bool Preprocessor::HandleMacroExpandedIdentifier(Token &Identifier,
787 MacroInfo *MI) {
Chris Lattnerc834ea62008-01-07 19:50:27 +0000788 // If this is a macro exapnsion in the "#if !defined(x)" line for the file,
789 // then the macro could expand to different things in other contexts, we need
790 // to disable the optimization in this case.
791 if (CurLexer) CurLexer->MIOpt.ExpandedMacro();
Chris Lattner4b009652007-07-25 00:24:17 +0000792
793 // If this is a builtin macro, like __LINE__ or _Pragma, handle it specially.
794 if (MI->isBuiltinMacro()) {
795 ExpandBuiltinMacro(Identifier);
796 return false;
797 }
798
799 // If this is the first use of a target-specific macro, warn about it.
800 if (MI->isTargetSpecific()) {
801 MI->setIsTargetSpecific(false); // Don't warn on second use.
Ted Kremenekd7f64cd2007-12-12 22:39:36 +0000802 getTargetInfo().DiagnoseNonPortability(getFullLoc(Identifier.getLocation()),
Chris Lattner4b009652007-07-25 00:24:17 +0000803 diag::port_target_macro_use);
804 }
805
806 /// Args - If this is a function-like macro expansion, this contains,
807 /// for each macro argument, the list of tokens that were provided to the
808 /// invocation.
809 MacroArgs *Args = 0;
810
811 // If this is a function-like macro, read the arguments.
812 if (MI->isFunctionLike()) {
813 // C99 6.10.3p10: If the preprocessing token immediately after the the macro
814 // name isn't a '(', this macro should not be expanded. Otherwise, consume
815 // it.
816 if (!isNextPPTokenLParen())
817 return true;
818
819 // Remember that we are now parsing the arguments to a macro invocation.
820 // Preprocessor directives used inside macro arguments are not portable, and
821 // this enables the warning.
822 InMacroArgs = true;
823 Args = ReadFunctionLikeMacroArgs(Identifier, MI);
824
825 // Finished parsing args.
826 InMacroArgs = false;
827
828 // If there was an error parsing the arguments, bail out.
829 if (Args == 0) return false;
830
831 ++NumFnMacroExpanded;
832 } else {
833 ++NumMacroExpanded;
834 }
835
836 // Notice that this macro has been used.
837 MI->setIsUsed(true);
838
839 // If we started lexing a macro, enter the macro expansion body.
840
841 // If this macro expands to no tokens, don't bother to push it onto the
842 // expansion stack, only to take it right back off.
843 if (MI->getNumTokens() == 0) {
844 // No need for arg info.
845 if (Args) Args->destroy();
846
847 // Ignore this macro use, just return the next token in the current
848 // buffer.
849 bool HadLeadingSpace = Identifier.hasLeadingSpace();
850 bool IsAtStartOfLine = Identifier.isAtStartOfLine();
851
852 Lex(Identifier);
853
854 // If the identifier isn't on some OTHER line, inherit the leading
855 // whitespace/first-on-a-line property of this token. This handles
856 // stuff like "! XX," -> "! ," and " XX," -> " ,", when XX is
857 // empty.
858 if (!Identifier.isAtStartOfLine()) {
859 if (IsAtStartOfLine) Identifier.setFlag(Token::StartOfLine);
860 if (HadLeadingSpace) Identifier.setFlag(Token::LeadingSpace);
861 }
862 ++NumFastMacroExpanded;
863 return false;
864
865 } else if (MI->getNumTokens() == 1 &&
Chris Lattner7a1b0882007-10-07 08:44:20 +0000866 isTrivialSingleTokenExpansion(MI, Identifier.getIdentifierInfo(),
867 *this)){
Chris Lattner4b009652007-07-25 00:24:17 +0000868 // Otherwise, if this macro expands into a single trivially-expanded
869 // token: expand it now. This handles common cases like
870 // "#define VAL 42".
871
872 // Propagate the isAtStartOfLine/hasLeadingSpace markers of the macro
873 // identifier to the expanded token.
874 bool isAtStartOfLine = Identifier.isAtStartOfLine();
875 bool hasLeadingSpace = Identifier.hasLeadingSpace();
876
877 // Remember where the token is instantiated.
878 SourceLocation InstantiateLoc = Identifier.getLocation();
879
880 // Replace the result token.
881 Identifier = MI->getReplacementToken(0);
882
883 // Restore the StartOfLine/LeadingSpace markers.
884 Identifier.setFlagValue(Token::StartOfLine , isAtStartOfLine);
885 Identifier.setFlagValue(Token::LeadingSpace, hasLeadingSpace);
886
887 // Update the tokens location to include both its logical and physical
888 // locations.
889 SourceLocation Loc =
890 SourceMgr.getInstantiationLoc(Identifier.getLocation(), InstantiateLoc);
891 Identifier.setLocation(Loc);
892
893 // If this is #define X X, we must mark the result as unexpandible.
894 if (IdentifierInfo *NewII = Identifier.getIdentifierInfo())
Chris Lattner7a1b0882007-10-07 08:44:20 +0000895 if (getMacroInfo(NewII) == MI)
Chris Lattner4b009652007-07-25 00:24:17 +0000896 Identifier.setFlag(Token::DisableExpand);
897
898 // Since this is not an identifier token, it can't be macro expanded, so
899 // we're done.
900 ++NumFastMacroExpanded;
901 return false;
902 }
903
904 // Start expanding the macro.
905 EnterMacro(Identifier, Args);
906
907 // Now that the macro is at the top of the include stack, ask the
908 // preprocessor to read the next token from it.
909 Lex(Identifier);
910 return false;
911}
912
913/// ReadFunctionLikeMacroArgs - After reading "MACRO(", this method is
914/// invoked to read all of the actual arguments specified for the macro
915/// invocation. This returns null on error.
916MacroArgs *Preprocessor::ReadFunctionLikeMacroArgs(Token &MacroName,
917 MacroInfo *MI) {
918 // The number of fixed arguments to parse.
919 unsigned NumFixedArgsLeft = MI->getNumArgs();
920 bool isVariadic = MI->isVariadic();
921
922 // Outer loop, while there are more arguments, keep reading them.
923 Token Tok;
924 Tok.setKind(tok::comma);
925 --NumFixedArgsLeft; // Start reading the first arg.
926
927 // ArgTokens - Build up a list of tokens that make up each argument. Each
928 // argument is separated by an EOF token. Use a SmallVector so we can avoid
929 // heap allocations in the common case.
930 llvm::SmallVector<Token, 64> ArgTokens;
931
932 unsigned NumActuals = 0;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000933 while (Tok.is(tok::comma)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000934 // C99 6.10.3p11: Keep track of the number of l_parens we have seen. Note
935 // that we already consumed the first one.
936 unsigned NumParens = 0;
937
938 while (1) {
939 // Read arguments as unexpanded tokens. This avoids issues, e.g., where
940 // an argument value in a macro could expand to ',' or '(' or ')'.
941 LexUnexpandedToken(Tok);
942
Chris Lattnerecdf4f02008-01-22 19:34:51 +0000943 if (Tok.is(tok::eof) || Tok.is(tok::eom)) { // "#if f(<eof>" & "#if f(\n"
Chris Lattner4b009652007-07-25 00:24:17 +0000944 Diag(MacroName, diag::err_unterm_macro_invoc);
Chris Lattnerecdf4f02008-01-22 19:34:51 +0000945 // Do not lose the EOF/EOM. Return it to the client.
Chris Lattner4b009652007-07-25 00:24:17 +0000946 MacroName = Tok;
947 return 0;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000948 } else if (Tok.is(tok::r_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000949 // If we found the ) token, the macro arg list is done.
950 if (NumParens-- == 0)
951 break;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000952 } else if (Tok.is(tok::l_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000953 ++NumParens;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000954 } else if (Tok.is(tok::comma) && NumParens == 0) {
Chris Lattner4b009652007-07-25 00:24:17 +0000955 // Comma ends this argument if there are more fixed arguments expected.
956 if (NumFixedArgsLeft)
957 break;
958
959 // If this is not a variadic macro, too many args were specified.
960 if (!isVariadic) {
961 // Emit the diagnostic at the macro name in case there is a missing ).
962 // Emitting it at the , could be far away from the macro name.
963 Diag(MacroName, diag::err_too_many_args_in_macro_invoc);
964 return 0;
965 }
966 // Otherwise, continue to add the tokens to this variable argument.
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000967 } else if (Tok.is(tok::comment) && !KeepMacroComments) {
Chris Lattner4b009652007-07-25 00:24:17 +0000968 // If this is a comment token in the argument list and we're just in
969 // -C mode (not -CC mode), discard the comment.
970 continue;
Chris Lattnere373b052007-11-23 06:50:21 +0000971 } else if (Tok.is(tok::identifier)) {
972 // Reading macro arguments can cause macros that we are currently
973 // expanding from to be popped off the expansion stack. Doing so causes
974 // them to be reenabled for expansion. Here we record whether any
975 // identifiers we lex as macro arguments correspond to disabled macros.
976 // If so, we mark the token as noexpand. This is a subtle aspect of
977 // C99 6.10.3.4p2.
978 if (MacroInfo *MI = getMacroInfo(Tok.getIdentifierInfo()))
979 if (!MI->isEnabled())
980 Tok.setFlag(Token::DisableExpand);
Chris Lattner4b009652007-07-25 00:24:17 +0000981 }
982
983 ArgTokens.push_back(Tok);
984 }
985
986 // Empty arguments are standard in C99 and supported as an extension in
987 // other modes.
988 if (ArgTokens.empty() && !Features.C99)
989 Diag(Tok, diag::ext_empty_fnmacro_arg);
990
991 // Add a marker EOF token to the end of the token list for this argument.
992 Token EOFTok;
993 EOFTok.startToken();
994 EOFTok.setKind(tok::eof);
995 EOFTok.setLocation(Tok.getLocation());
996 EOFTok.setLength(0);
997 ArgTokens.push_back(EOFTok);
998 ++NumActuals;
999 --NumFixedArgsLeft;
1000 };
1001
1002 // Okay, we either found the r_paren. Check to see if we parsed too few
1003 // arguments.
1004 unsigned MinArgsExpected = MI->getNumArgs();
1005
1006 // See MacroArgs instance var for description of this.
1007 bool isVarargsElided = false;
1008
1009 if (NumActuals < MinArgsExpected) {
1010 // There are several cases where too few arguments is ok, handle them now.
1011 if (NumActuals+1 == MinArgsExpected && MI->isVariadic()) {
1012 // Varargs where the named vararg parameter is missing: ok as extension.
1013 // #define A(x, ...)
1014 // A("blah")
1015 Diag(Tok, diag::ext_missing_varargs_arg);
1016
1017 // Remember this occurred if this is a C99 macro invocation with at least
1018 // one actual argument.
1019 isVarargsElided = MI->isC99Varargs() && MI->getNumArgs() > 1;
1020 } else if (MI->getNumArgs() == 1) {
1021 // #define A(x)
1022 // A()
1023 // is ok because it is an empty argument.
1024
1025 // Empty arguments are standard in C99 and supported as an extension in
1026 // other modes.
1027 if (ArgTokens.empty() && !Features.C99)
1028 Diag(Tok, diag::ext_empty_fnmacro_arg);
1029 } else {
1030 // Otherwise, emit the error.
1031 Diag(Tok, diag::err_too_few_args_in_macro_invoc);
1032 return 0;
1033 }
1034
1035 // Add a marker EOF token to the end of the token list for this argument.
1036 SourceLocation EndLoc = Tok.getLocation();
1037 Tok.startToken();
1038 Tok.setKind(tok::eof);
1039 Tok.setLocation(EndLoc);
1040 Tok.setLength(0);
1041 ArgTokens.push_back(Tok);
1042 }
1043
1044 return MacroArgs::create(MI, &ArgTokens[0], ArgTokens.size(),isVarargsElided);
1045}
1046
1047/// ComputeDATE_TIME - Compute the current time, enter it into the specified
1048/// scratch buffer, then return DATELoc/TIMELoc locations with the position of
1049/// the identifier tokens inserted.
1050static void ComputeDATE_TIME(SourceLocation &DATELoc, SourceLocation &TIMELoc,
1051 Preprocessor &PP) {
1052 time_t TT = time(0);
1053 struct tm *TM = localtime(&TT);
1054
1055 static const char * const Months[] = {
1056 "Jan","Feb","Mar","Apr","May","Jun","Jul","Aug","Sep","Oct","Nov","Dec"
1057 };
1058
1059 char TmpBuffer[100];
1060 sprintf(TmpBuffer, "\"%s %2d %4d\"", Months[TM->tm_mon], TM->tm_mday,
1061 TM->tm_year+1900);
1062 DATELoc = PP.CreateString(TmpBuffer, strlen(TmpBuffer));
1063
1064 sprintf(TmpBuffer, "\"%02d:%02d:%02d\"", TM->tm_hour, TM->tm_min, TM->tm_sec);
1065 TIMELoc = PP.CreateString(TmpBuffer, strlen(TmpBuffer));
1066}
1067
1068/// ExpandBuiltinMacro - If an identifier token is read that is to be expanded
1069/// as a builtin macro, handle it and return the next token as 'Tok'.
1070void Preprocessor::ExpandBuiltinMacro(Token &Tok) {
1071 // Figure out which token this is.
1072 IdentifierInfo *II = Tok.getIdentifierInfo();
1073 assert(II && "Can't be a macro without id info!");
1074
1075 // If this is an _Pragma directive, expand it, invoke the pragma handler, then
1076 // lex the token after it.
1077 if (II == Ident_Pragma)
1078 return Handle_Pragma(Tok);
1079
1080 ++NumBuiltinMacroExpanded;
1081
1082 char TmpBuffer[100];
1083
1084 // Set up the return result.
1085 Tok.setIdentifierInfo(0);
1086 Tok.clearFlag(Token::NeedsCleaning);
1087
1088 if (II == Ident__LINE__) {
1089 // __LINE__ expands to a simple numeric value.
1090 sprintf(TmpBuffer, "%u", SourceMgr.getLogicalLineNumber(Tok.getLocation()));
1091 unsigned Length = strlen(TmpBuffer);
1092 Tok.setKind(tok::numeric_constant);
1093 Tok.setLength(Length);
1094 Tok.setLocation(CreateString(TmpBuffer, Length, Tok.getLocation()));
1095 } else if (II == Ident__FILE__ || II == Ident__BASE_FILE__) {
1096 SourceLocation Loc = Tok.getLocation();
1097 if (II == Ident__BASE_FILE__) {
1098 Diag(Tok, diag::ext_pp_base_file);
1099 SourceLocation NextLoc = SourceMgr.getIncludeLoc(Loc);
1100 while (NextLoc.isValid()) {
1101 Loc = NextLoc;
1102 NextLoc = SourceMgr.getIncludeLoc(Loc);
1103 }
1104 }
1105
1106 // Escape this filename. Turn '\' -> '\\' '"' -> '\"'
1107 std::string FN = SourceMgr.getSourceName(SourceMgr.getLogicalLoc(Loc));
1108 FN = '"' + Lexer::Stringify(FN) + '"';
1109 Tok.setKind(tok::string_literal);
1110 Tok.setLength(FN.size());
1111 Tok.setLocation(CreateString(&FN[0], FN.size(), Tok.getLocation()));
1112 } else if (II == Ident__DATE__) {
1113 if (!DATELoc.isValid())
1114 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1115 Tok.setKind(tok::string_literal);
1116 Tok.setLength(strlen("\"Mmm dd yyyy\""));
1117 Tok.setLocation(SourceMgr.getInstantiationLoc(DATELoc, Tok.getLocation()));
1118 } else if (II == Ident__TIME__) {
1119 if (!TIMELoc.isValid())
1120 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1121 Tok.setKind(tok::string_literal);
1122 Tok.setLength(strlen("\"hh:mm:ss\""));
1123 Tok.setLocation(SourceMgr.getInstantiationLoc(TIMELoc, Tok.getLocation()));
1124 } else if (II == Ident__INCLUDE_LEVEL__) {
1125 Diag(Tok, diag::ext_pp_include_level);
1126
1127 // Compute the include depth of this token.
1128 unsigned Depth = 0;
1129 SourceLocation Loc = SourceMgr.getIncludeLoc(Tok.getLocation());
1130 for (; Loc.isValid(); ++Depth)
1131 Loc = SourceMgr.getIncludeLoc(Loc);
1132
1133 // __INCLUDE_LEVEL__ expands to a simple numeric value.
1134 sprintf(TmpBuffer, "%u", Depth);
1135 unsigned Length = strlen(TmpBuffer);
1136 Tok.setKind(tok::numeric_constant);
1137 Tok.setLength(Length);
1138 Tok.setLocation(CreateString(TmpBuffer, Length, Tok.getLocation()));
1139 } else if (II == Ident__TIMESTAMP__) {
1140 // MSVC, ICC, GCC, VisualAge C++ extension. The generated string should be
1141 // of the form "Ddd Mmm dd hh::mm::ss yyyy", which is returned by asctime.
1142 Diag(Tok, diag::ext_pp_timestamp);
1143
1144 // Get the file that we are lexing out of. If we're currently lexing from
1145 // a macro, dig into the include stack.
1146 const FileEntry *CurFile = 0;
1147 Lexer *TheLexer = getCurrentFileLexer();
1148
1149 if (TheLexer)
1150 CurFile = SourceMgr.getFileEntryForLoc(TheLexer->getFileLoc());
1151
1152 // If this file is older than the file it depends on, emit a diagnostic.
1153 const char *Result;
1154 if (CurFile) {
1155 time_t TT = CurFile->getModificationTime();
1156 struct tm *TM = localtime(&TT);
1157 Result = asctime(TM);
1158 } else {
1159 Result = "??? ??? ?? ??:??:?? ????\n";
1160 }
1161 TmpBuffer[0] = '"';
1162 strcpy(TmpBuffer+1, Result);
1163 unsigned Len = strlen(TmpBuffer);
1164 TmpBuffer[Len-1] = '"'; // Replace the newline with a quote.
1165 Tok.setKind(tok::string_literal);
1166 Tok.setLength(Len);
1167 Tok.setLocation(CreateString(TmpBuffer, Len, Tok.getLocation()));
1168 } else {
1169 assert(0 && "Unknown identifier!");
Chris Lattnerc0f7c512007-12-09 20:31:55 +00001170 }
Chris Lattner4b009652007-07-25 00:24:17 +00001171}
1172
1173//===----------------------------------------------------------------------===//
1174// Lexer Event Handling.
1175//===----------------------------------------------------------------------===//
1176
1177/// LookUpIdentifierInfo - Given a tok::identifier token, look up the
1178/// identifier information for the token and install it into the token.
1179IdentifierInfo *Preprocessor::LookUpIdentifierInfo(Token &Identifier,
1180 const char *BufPtr) {
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001181 assert(Identifier.is(tok::identifier) && "Not an identifier!");
Chris Lattner4b009652007-07-25 00:24:17 +00001182 assert(Identifier.getIdentifierInfo() == 0 && "Identinfo already exists!");
1183
1184 // Look up this token, see if it is a macro, or if it is a language keyword.
1185 IdentifierInfo *II;
1186 if (BufPtr && !Identifier.needsCleaning()) {
1187 // No cleaning needed, just use the characters from the lexed buffer.
1188 II = getIdentifierInfo(BufPtr, BufPtr+Identifier.getLength());
1189 } else {
1190 // Cleaning needed, alloca a buffer, clean into it, then use the buffer.
1191 llvm::SmallVector<char, 64> IdentifierBuffer;
1192 IdentifierBuffer.resize(Identifier.getLength());
1193 const char *TmpBuf = &IdentifierBuffer[0];
1194 unsigned Size = getSpelling(Identifier, TmpBuf);
1195 II = getIdentifierInfo(TmpBuf, TmpBuf+Size);
1196 }
1197 Identifier.setIdentifierInfo(II);
1198 return II;
1199}
1200
1201
1202/// HandleIdentifier - This callback is invoked when the lexer reads an
1203/// identifier. This callback looks up the identifier in the map and/or
1204/// potentially macro expands it or turns it into a named token (like 'for').
1205void Preprocessor::HandleIdentifier(Token &Identifier) {
1206 assert(Identifier.getIdentifierInfo() &&
1207 "Can't handle identifiers without identifier info!");
1208
1209 IdentifierInfo &II = *Identifier.getIdentifierInfo();
1210
1211 // If this identifier was poisoned, and if it was not produced from a macro
1212 // expansion, emit an error.
1213 if (II.isPoisoned() && CurLexer) {
1214 if (&II != Ident__VA_ARGS__) // We warn about __VA_ARGS__ with poisoning.
1215 Diag(Identifier, diag::err_pp_used_poisoned_id);
1216 else
1217 Diag(Identifier, diag::ext_pp_bad_vaargs_use);
1218 }
1219
1220 // If this is a macro to be expanded, do it.
Chris Lattner7a1b0882007-10-07 08:44:20 +00001221 if (MacroInfo *MI = getMacroInfo(&II)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001222 if (!DisableMacroExpansion && !Identifier.isExpandDisabled()) {
1223 if (MI->isEnabled()) {
1224 if (!HandleMacroExpandedIdentifier(Identifier, MI))
1225 return;
1226 } else {
1227 // C99 6.10.3.4p2 says that a disabled macro may never again be
1228 // expanded, even if it's in a context where it could be expanded in the
1229 // future.
1230 Identifier.setFlag(Token::DisableExpand);
1231 }
1232 }
1233 } else if (II.isOtherTargetMacro() && !DisableMacroExpansion) {
1234 // If this identifier is a macro on some other target, emit a diagnostic.
1235 // This diagnosic is only emitted when macro expansion is enabled, because
1236 // the macro would not have been expanded for the other target either.
1237 II.setIsOtherTargetMacro(false); // Don't warn on second use.
Ted Kremenekd7f64cd2007-12-12 22:39:36 +00001238 getTargetInfo().DiagnoseNonPortability(getFullLoc(Identifier.getLocation()),
Chris Lattner4b009652007-07-25 00:24:17 +00001239 diag::port_target_macro_use);
1240
1241 }
1242
1243 // C++ 2.11p2: If this is an alternative representation of a C++ operator,
1244 // then we act as if it is the actual operator and not the textual
1245 // representation of it.
1246 if (II.isCPlusPlusOperatorKeyword())
1247 Identifier.setIdentifierInfo(0);
1248
1249 // Change the kind of this identifier to the appropriate token kind, e.g.
1250 // turning "for" into a keyword.
1251 Identifier.setKind(II.getTokenID());
1252
1253 // If this is an extension token, diagnose its use.
1254 // FIXME: tried (unsuccesfully) to shut this up when compiling with gnu99
1255 // For now, I'm just commenting it out (while I work on attributes).
1256 if (II.isExtensionToken() && Features.C99)
1257 Diag(Identifier, diag::ext_token_used);
1258}
1259
1260/// HandleEndOfFile - This callback is invoked when the lexer hits the end of
1261/// the current file. This either returns the EOF token or pops a level off
1262/// the include stack and keeps going.
1263bool Preprocessor::HandleEndOfFile(Token &Result, bool isEndOfMacro) {
1264 assert(!CurMacroExpander &&
1265 "Ending a file when currently in a macro!");
1266
1267 // See if this file had a controlling macro.
1268 if (CurLexer) { // Not ending a macro, ignore it.
1269 if (const IdentifierInfo *ControllingMacro =
1270 CurLexer->MIOpt.GetControllingMacroAtEndOfFile()) {
1271 // Okay, this has a controlling macro, remember in PerFileInfo.
1272 if (const FileEntry *FE =
1273 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
1274 HeaderInfo.SetFileControllingMacro(FE, ControllingMacro);
1275 }
1276 }
1277
1278 // If this is a #include'd file, pop it off the include stack and continue
1279 // lexing the #includer file.
1280 if (!IncludeMacroStack.empty()) {
1281 // We're done with the #included file.
1282 RemoveTopOfLexerStack();
1283
1284 // Notify the client, if desired, that we are in a new source file.
1285 if (Callbacks && !isEndOfMacro && CurLexer) {
1286 DirectoryLookup::DirType FileType = DirectoryLookup::NormalHeaderDir;
1287
1288 // Get the file entry for the current file.
1289 if (const FileEntry *FE =
1290 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
1291 FileType = HeaderInfo.getFileDirFlavor(FE);
1292
1293 Callbacks->FileChanged(CurLexer->getSourceLocation(CurLexer->BufferPtr),
1294 PPCallbacks::ExitFile, FileType);
1295 }
1296
1297 // Client should lex another token.
1298 return false;
1299 }
Chris Lattner1d34a7c2008-01-25 00:00:30 +00001300
1301 // If the file ends with a newline, form the EOF token on the newline itself,
1302 // rather than "on the line following it", which doesn't exist. This makes
1303 // diagnostics relating to the end of file include the last file that the user
1304 // actually typed, which is goodness.
1305 const char *EndPos = CurLexer->BufferEnd;
1306 if (EndPos != CurLexer->BufferStart &&
1307 (EndPos[-1] == '\n' || EndPos[-1] == '\r')) {
1308 --EndPos;
1309
1310 // Handle \n\r and \r\n:
1311 if (EndPos != CurLexer->BufferStart &&
1312 (EndPos[-1] == '\n' || EndPos[-1] == '\r') &&
1313 EndPos[-1] != EndPos[0])
1314 --EndPos;
1315 }
Chris Lattner4b009652007-07-25 00:24:17 +00001316
1317 Result.startToken();
Chris Lattner1d34a7c2008-01-25 00:00:30 +00001318 CurLexer->BufferPtr = EndPos;
1319 CurLexer->FormTokenWithChars(Result, EndPos);
Chris Lattner4b009652007-07-25 00:24:17 +00001320 Result.setKind(tok::eof);
1321
1322 // We're done with the #included file.
1323 delete CurLexer;
1324 CurLexer = 0;
1325
1326 // This is the end of the top-level file. If the diag::pp_macro_not_used
Chris Lattner7a1b0882007-10-07 08:44:20 +00001327 // diagnostic is enabled, look for macros that have not been used.
Chris Lattner4b009652007-07-25 00:24:17 +00001328 if (Diags.getDiagnosticLevel(diag::pp_macro_not_used) != Diagnostic::Ignored){
Chris Lattner7a1b0882007-10-07 08:44:20 +00001329 for (llvm::DenseMap<IdentifierInfo*, MacroInfo*>::iterator I =
1330 Macros.begin(), E = Macros.end(); I != E; ++I) {
1331 if (!I->second->isUsed())
1332 Diag(I->second->getDefinitionLoc(), diag::pp_macro_not_used);
Chris Lattner4b009652007-07-25 00:24:17 +00001333 }
1334 }
Chris Lattner4b009652007-07-25 00:24:17 +00001335 return true;
1336}
1337
1338/// HandleEndOfMacro - This callback is invoked when the lexer hits the end of
1339/// the current macro expansion or token stream expansion.
1340bool Preprocessor::HandleEndOfMacro(Token &Result) {
1341 assert(CurMacroExpander && !CurLexer &&
1342 "Ending a macro when currently in a #include file!");
1343
1344 // Delete or cache the now-dead macro expander.
1345 if (NumCachedMacroExpanders == MacroExpanderCacheSize)
1346 delete CurMacroExpander;
1347 else
1348 MacroExpanderCache[NumCachedMacroExpanders++] = CurMacroExpander;
1349
1350 // Handle this like a #include file being popped off the stack.
1351 CurMacroExpander = 0;
1352 return HandleEndOfFile(Result, true);
1353}
1354
1355
1356//===----------------------------------------------------------------------===//
1357// Utility Methods for Preprocessor Directive Handling.
1358//===----------------------------------------------------------------------===//
1359
1360/// DiscardUntilEndOfDirective - Read and discard all tokens remaining on the
1361/// current line until the tok::eom token is found.
1362void Preprocessor::DiscardUntilEndOfDirective() {
1363 Token Tmp;
1364 do {
1365 LexUnexpandedToken(Tmp);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001366 } while (Tmp.isNot(tok::eom));
Chris Lattner4b009652007-07-25 00:24:17 +00001367}
1368
/// isCXXNamedOperator - Returns "true" if Spelling is one of the C++
/// alternative tokens that are spelled like identifiers: and, and_eq, bitand,
/// bitor, compl, not, not_eq, or, or_eq, xor and xor_eq.  The comparison is
/// exact and case-sensitive.
static bool isCXXNamedOperator(const std::string &Spelling) {
  // The full set of identifier-like alternative tokens, including the
  // compound-assignment forms and_eq, or_eq and xor_eq.
  static const char * const NamedOperators[] = {
    "and", "and_eq", "bitand", "bitor", "compl", "not", "not_eq",
    "or", "or_eq", "xor", "xor_eq"
  };
  const unsigned NumNamedOperators =
    sizeof(NamedOperators) / sizeof(NamedOperators[0]);

  for (unsigned i = 0; i != NumNamedOperators; ++i)
    if (Spelling == NamedOperators[i])
      return true;
  return false;
}
1375
1376/// ReadMacroName - Lex and validate a macro name, which occurs after a
1377/// #define or #undef. This sets the token kind to eom and discards the rest
1378/// of the macro line if the macro name is invalid. isDefineUndef is 1 if
1379/// this is due to a a #define, 2 if #undef directive, 0 if it is something
1380/// else (e.g. #ifdef).
1381void Preprocessor::ReadMacroName(Token &MacroNameTok, char isDefineUndef) {
1382 // Read the token, don't allow macro expansion on it.
1383 LexUnexpandedToken(MacroNameTok);
1384
1385 // Missing macro name?
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001386 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00001387 return Diag(MacroNameTok, diag::err_pp_missing_macro_name);
1388
1389 IdentifierInfo *II = MacroNameTok.getIdentifierInfo();
1390 if (II == 0) {
1391 std::string Spelling = getSpelling(MacroNameTok);
1392 if (isCXXNamedOperator(Spelling))
1393 // C++ 2.5p2: Alternative tokens behave the same as its primary token
1394 // except for their spellings.
1395 Diag(MacroNameTok, diag::err_pp_operator_used_as_macro_name, Spelling);
1396 else
1397 Diag(MacroNameTok, diag::err_pp_macro_not_identifier);
1398 // Fall through on error.
1399 } else if (isDefineUndef && II->getPPKeywordID() == tok::pp_defined) {
1400 // Error if defining "defined": C99 6.10.8.4.
1401 Diag(MacroNameTok, diag::err_defined_macro_name);
Chris Lattner3b56a012007-10-07 08:04:56 +00001402 } else if (isDefineUndef && II->hasMacroDefinition() &&
Chris Lattner7a1b0882007-10-07 08:44:20 +00001403 getMacroInfo(II)->isBuiltinMacro()) {
Chris Lattner4b009652007-07-25 00:24:17 +00001404 // Error if defining "__LINE__" and other builtins: C99 6.10.8.4.
1405 if (isDefineUndef == 1)
1406 Diag(MacroNameTok, diag::pp_redef_builtin_macro);
1407 else
1408 Diag(MacroNameTok, diag::pp_undef_builtin_macro);
1409 } else {
1410 // Okay, we got a good identifier node. Return it.
1411 return;
1412 }
1413
1414 // Invalid macro name, read and discard the rest of the line. Then set the
1415 // token kind to tok::eom.
1416 MacroNameTok.setKind(tok::eom);
1417 return DiscardUntilEndOfDirective();
1418}
1419
1420/// CheckEndOfDirective - Ensure that the next token is a tok::eom token. If
1421/// not, emit a diagnostic and consume up until the eom.
1422void Preprocessor::CheckEndOfDirective(const char *DirType) {
1423 Token Tmp;
1424 Lex(Tmp);
1425 // There should be no tokens after the directive, but we allow them as an
1426 // extension.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001427 while (Tmp.is(tok::comment)) // Skip comments in -C mode.
Chris Lattner4b009652007-07-25 00:24:17 +00001428 Lex(Tmp);
1429
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001430 if (Tmp.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001431 Diag(Tmp, diag::ext_pp_extra_tokens_at_eol, DirType);
1432 DiscardUntilEndOfDirective();
1433 }
1434}
1435
1436
1437
1438/// SkipExcludedConditionalBlock - We just read a #if or related directive and
1439/// decided that the subsequent tokens are in the #if'd out portion of the
1440/// file. Lex the rest of the file, until we see an #endif. If
1441/// FoundNonSkipPortion is true, then we have already emitted code for part of
1442/// this #if directive, so #else/#elif blocks should never be entered. If ElseOk
1443/// is true, then #else directives are ok, if not, then we have already seen one
1444/// so a #else directive is a duplicate. When this returns, the caller can lex
1445/// the first valid token.
1446void Preprocessor::SkipExcludedConditionalBlock(SourceLocation IfTokenLoc,
1447 bool FoundNonSkipPortion,
1448 bool FoundElse) {
1449 ++NumSkipped;
1450 assert(CurMacroExpander == 0 && CurLexer &&
1451 "Lexing a macro, not a file?");
1452
1453 CurLexer->pushConditionalLevel(IfTokenLoc, /*isSkipping*/false,
1454 FoundNonSkipPortion, FoundElse);
1455
1456 // Enter raw mode to disable identifier lookup (and thus macro expansion),
1457 // disabling warnings, etc.
1458 CurLexer->LexingRawMode = true;
1459 Token Tok;
1460 while (1) {
1461 CurLexer->Lex(Tok);
1462
1463 // If this is the end of the buffer, we have an error.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001464 if (Tok.is(tok::eof)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001465 // Emit errors for each unterminated conditional on the stack, including
1466 // the current one.
1467 while (!CurLexer->ConditionalStack.empty()) {
1468 Diag(CurLexer->ConditionalStack.back().IfLoc,
1469 diag::err_pp_unterminated_conditional);
1470 CurLexer->ConditionalStack.pop_back();
1471 }
1472
1473 // Just return and let the caller lex after this #include.
1474 break;
1475 }
1476
1477 // If this token is not a preprocessor directive, just skip it.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001478 if (Tok.isNot(tok::hash) || !Tok.isAtStartOfLine())
Chris Lattner4b009652007-07-25 00:24:17 +00001479 continue;
1480
1481 // We just parsed a # character at the start of a line, so we're in
1482 // directive mode. Tell the lexer this so any newlines we see will be
1483 // converted into an EOM token (this terminates the macro).
1484 CurLexer->ParsingPreprocessorDirective = true;
1485 CurLexer->KeepCommentMode = false;
1486
1487
1488 // Read the next token, the directive flavor.
1489 LexUnexpandedToken(Tok);
1490
1491 // If this isn't an identifier directive (e.g. is "# 1\n" or "#\n", or
1492 // something bogus), skip it.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001493 if (Tok.isNot(tok::identifier)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001494 CurLexer->ParsingPreprocessorDirective = false;
1495 // Restore comment saving mode.
1496 CurLexer->KeepCommentMode = KeepComments;
1497 continue;
1498 }
1499
1500 // If the first letter isn't i or e, it isn't intesting to us. We know that
1501 // this is safe in the face of spelling differences, because there is no way
1502 // to spell an i/e in a strange way that is another letter. Skipping this
1503 // allows us to avoid looking up the identifier info for #define/#undef and
1504 // other common directives.
1505 const char *RawCharData = SourceMgr.getCharacterData(Tok.getLocation());
1506 char FirstChar = RawCharData[0];
1507 if (FirstChar >= 'a' && FirstChar <= 'z' &&
1508 FirstChar != 'i' && FirstChar != 'e') {
1509 CurLexer->ParsingPreprocessorDirective = false;
1510 // Restore comment saving mode.
1511 CurLexer->KeepCommentMode = KeepComments;
1512 continue;
1513 }
1514
1515 // Get the identifier name without trigraphs or embedded newlines. Note
1516 // that we can't use Tok.getIdentifierInfo() because its lookup is disabled
1517 // when skipping.
1518 // TODO: could do this with zero copies in the no-clean case by using
1519 // strncmp below.
1520 char Directive[20];
1521 unsigned IdLen;
1522 if (!Tok.needsCleaning() && Tok.getLength() < 20) {
1523 IdLen = Tok.getLength();
1524 memcpy(Directive, RawCharData, IdLen);
1525 Directive[IdLen] = 0;
1526 } else {
1527 std::string DirectiveStr = getSpelling(Tok);
1528 IdLen = DirectiveStr.size();
1529 if (IdLen >= 20) {
1530 CurLexer->ParsingPreprocessorDirective = false;
1531 // Restore comment saving mode.
1532 CurLexer->KeepCommentMode = KeepComments;
1533 continue;
1534 }
1535 memcpy(Directive, &DirectiveStr[0], IdLen);
1536 Directive[IdLen] = 0;
1537 }
1538
1539 if (FirstChar == 'i' && Directive[1] == 'f') {
1540 if ((IdLen == 2) || // "if"
1541 (IdLen == 5 && !strcmp(Directive+2, "def")) || // "ifdef"
1542 (IdLen == 6 && !strcmp(Directive+2, "ndef"))) { // "ifndef"
1543 // We know the entire #if/#ifdef/#ifndef block will be skipped, don't
1544 // bother parsing the condition.
1545 DiscardUntilEndOfDirective();
1546 CurLexer->pushConditionalLevel(Tok.getLocation(), /*wasskipping*/true,
1547 /*foundnonskip*/false,
1548 /*fnddelse*/false);
1549 }
1550 } else if (FirstChar == 'e') {
1551 if (IdLen == 5 && !strcmp(Directive+1, "ndif")) { // "endif"
1552 CheckEndOfDirective("#endif");
1553 PPConditionalInfo CondInfo;
1554 CondInfo.WasSkipping = true; // Silence bogus warning.
1555 bool InCond = CurLexer->popConditionalLevel(CondInfo);
1556 InCond = InCond; // Silence warning in no-asserts mode.
1557 assert(!InCond && "Can't be skipping if not in a conditional!");
1558
1559 // If we popped the outermost skipping block, we're done skipping!
1560 if (!CondInfo.WasSkipping)
1561 break;
1562 } else if (IdLen == 4 && !strcmp(Directive+1, "lse")) { // "else".
1563 // #else directive in a skipping conditional. If not in some other
1564 // skipping conditional, and if #else hasn't already been seen, enter it
1565 // as a non-skipping conditional.
1566 CheckEndOfDirective("#else");
1567 PPConditionalInfo &CondInfo = CurLexer->peekConditionalLevel();
1568
1569 // If this is a #else with a #else before it, report the error.
1570 if (CondInfo.FoundElse) Diag(Tok, diag::pp_err_else_after_else);
1571
1572 // Note that we've seen a #else in this conditional.
1573 CondInfo.FoundElse = true;
1574
1575 // If the conditional is at the top level, and the #if block wasn't
1576 // entered, enter the #else block now.
1577 if (!CondInfo.WasSkipping && !CondInfo.FoundNonSkip) {
1578 CondInfo.FoundNonSkip = true;
1579 break;
1580 }
1581 } else if (IdLen == 4 && !strcmp(Directive+1, "lif")) { // "elif".
1582 PPConditionalInfo &CondInfo = CurLexer->peekConditionalLevel();
1583
1584 bool ShouldEnter;
1585 // If this is in a skipping block or if we're already handled this #if
1586 // block, don't bother parsing the condition.
1587 if (CondInfo.WasSkipping || CondInfo.FoundNonSkip) {
1588 DiscardUntilEndOfDirective();
1589 ShouldEnter = false;
1590 } else {
1591 // Restore the value of LexingRawMode so that identifiers are
1592 // looked up, etc, inside the #elif expression.
1593 assert(CurLexer->LexingRawMode && "We have to be skipping here!");
1594 CurLexer->LexingRawMode = false;
1595 IdentifierInfo *IfNDefMacro = 0;
1596 ShouldEnter = EvaluateDirectiveExpression(IfNDefMacro);
1597 CurLexer->LexingRawMode = true;
1598 }
1599
1600 // If this is a #elif with a #else before it, report the error.
1601 if (CondInfo.FoundElse) Diag(Tok, diag::pp_err_elif_after_else);
1602
1603 // If this condition is true, enter it!
1604 if (ShouldEnter) {
1605 CondInfo.FoundNonSkip = true;
1606 break;
1607 }
1608 }
1609 }
1610
1611 CurLexer->ParsingPreprocessorDirective = false;
1612 // Restore comment saving mode.
1613 CurLexer->KeepCommentMode = KeepComments;
1614 }
1615
1616 // Finally, if we are out of the conditional (saw an #endif or ran off the end
1617 // of the file, just stop skipping and return to lexing whatever came after
1618 // the #if block.
1619 CurLexer->LexingRawMode = false;
1620}
1621
1622//===----------------------------------------------------------------------===//
1623// Preprocessor Directive Handling.
1624//===----------------------------------------------------------------------===//
1625
1626/// HandleDirective - This callback is invoked when the lexer sees a # token
1627/// at the start of a line. This consumes the directive, modifies the
1628/// lexer/preprocessor state, and advances the lexer(s) so that the next token
1629/// read is the correct one.
1630void Preprocessor::HandleDirective(Token &Result) {
1631 // FIXME: Traditional: # with whitespace before it not recognized by K&R?
1632
1633 // We just parsed a # character at the start of a line, so we're in directive
1634 // mode. Tell the lexer this so any newlines we see will be converted into an
1635 // EOM token (which terminates the directive).
1636 CurLexer->ParsingPreprocessorDirective = true;
1637
1638 ++NumDirectives;
1639
1640 // We are about to read a token. For the multiple-include optimization FA to
1641 // work, we have to remember if we had read any tokens *before* this
1642 // pp-directive.
1643 bool ReadAnyTokensBeforeDirective = CurLexer->MIOpt.getHasReadAnyTokensVal();
1644
1645 // Read the next token, the directive flavor. This isn't expanded due to
1646 // C99 6.10.3p8.
1647 LexUnexpandedToken(Result);
1648
1649 // C99 6.10.3p11: Is this preprocessor directive in macro invocation? e.g.:
1650 // #define A(x) #x
1651 // A(abc
1652 // #warning blah
1653 // def)
1654 // If so, the user is relying on non-portable behavior, emit a diagnostic.
1655 if (InMacroArgs)
1656 Diag(Result, diag::ext_embedded_directive);
1657
1658TryAgain:
1659 switch (Result.getKind()) {
1660 case tok::eom:
1661 return; // null directive.
1662 case tok::comment:
1663 // Handle stuff like "# /*foo*/ define X" in -E -C mode.
1664 LexUnexpandedToken(Result);
1665 goto TryAgain;
1666
1667 case tok::numeric_constant:
1668 // FIXME: implement # 7 line numbers!
1669 DiscardUntilEndOfDirective();
1670 return;
1671 default:
1672 IdentifierInfo *II = Result.getIdentifierInfo();
1673 if (II == 0) break; // Not an identifier.
1674
1675 // Ask what the preprocessor keyword ID is.
1676 switch (II->getPPKeywordID()) {
1677 default: break;
1678 // C99 6.10.1 - Conditional Inclusion.
1679 case tok::pp_if:
1680 return HandleIfDirective(Result, ReadAnyTokensBeforeDirective);
1681 case tok::pp_ifdef:
1682 return HandleIfdefDirective(Result, false, true/*not valid for miopt*/);
1683 case tok::pp_ifndef:
1684 return HandleIfdefDirective(Result, true, ReadAnyTokensBeforeDirective);
1685 case tok::pp_elif:
1686 return HandleElifDirective(Result);
1687 case tok::pp_else:
1688 return HandleElseDirective(Result);
1689 case tok::pp_endif:
1690 return HandleEndifDirective(Result);
1691
1692 // C99 6.10.2 - Source File Inclusion.
1693 case tok::pp_include:
1694 return HandleIncludeDirective(Result); // Handle #include.
1695
1696 // C99 6.10.3 - Macro Replacement.
1697 case tok::pp_define:
1698 return HandleDefineDirective(Result, false);
1699 case tok::pp_undef:
1700 return HandleUndefDirective(Result);
1701
1702 // C99 6.10.4 - Line Control.
1703 case tok::pp_line:
1704 // FIXME: implement #line
1705 DiscardUntilEndOfDirective();
1706 return;
1707
1708 // C99 6.10.5 - Error Directive.
1709 case tok::pp_error:
1710 return HandleUserDiagnosticDirective(Result, false);
1711
1712 // C99 6.10.6 - Pragma Directive.
1713 case tok::pp_pragma:
1714 return HandlePragmaDirective();
1715
1716 // GNU Extensions.
1717 case tok::pp_import:
1718 return HandleImportDirective(Result);
1719 case tok::pp_include_next:
1720 return HandleIncludeNextDirective(Result);
1721
1722 case tok::pp_warning:
1723 Diag(Result, diag::ext_pp_warning_directive);
1724 return HandleUserDiagnosticDirective(Result, true);
1725 case tok::pp_ident:
1726 return HandleIdentSCCSDirective(Result);
1727 case tok::pp_sccs:
1728 return HandleIdentSCCSDirective(Result);
1729 case tok::pp_assert:
1730 //isExtension = true; // FIXME: implement #assert
1731 break;
1732 case tok::pp_unassert:
1733 //isExtension = true; // FIXME: implement #unassert
1734 break;
1735
1736 // clang extensions.
1737 case tok::pp_define_target:
1738 return HandleDefineDirective(Result, true);
1739 case tok::pp_define_other_target:
1740 return HandleDefineOtherTargetDirective(Result);
1741 }
1742 break;
1743 }
1744
1745 // If we reached here, the preprocessing token is not valid!
1746 Diag(Result, diag::err_pp_invalid_directive);
1747
1748 // Read the rest of the PP line.
1749 DiscardUntilEndOfDirective();
1750
1751 // Okay, we're done parsing the directive.
1752}
1753
1754void Preprocessor::HandleUserDiagnosticDirective(Token &Tok,
1755 bool isWarning) {
1756 // Read the rest of the line raw. We do this because we don't want macros
1757 // to be expanded and we don't require that the tokens be valid preprocessing
1758 // tokens. For example, this is allowed: "#warning ` 'foo". GCC does
1759 // collapse multiple consequtive white space between tokens, but this isn't
1760 // specified by the standard.
1761 std::string Message = CurLexer->ReadToEndOfLine();
1762
1763 unsigned DiagID = isWarning ? diag::pp_hash_warning : diag::err_pp_hash_error;
1764 return Diag(Tok, DiagID, Message);
1765}
1766
1767/// HandleIdentSCCSDirective - Handle a #ident/#sccs directive.
1768///
1769void Preprocessor::HandleIdentSCCSDirective(Token &Tok) {
1770 // Yes, this directive is an extension.
1771 Diag(Tok, diag::ext_pp_ident_directive);
1772
1773 // Read the string argument.
1774 Token StrTok;
1775 Lex(StrTok);
1776
1777 // If the token kind isn't a string, it's a malformed directive.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001778 if (StrTok.isNot(tok::string_literal) &&
1779 StrTok.isNot(tok::wide_string_literal))
Chris Lattner4b009652007-07-25 00:24:17 +00001780 return Diag(StrTok, diag::err_pp_malformed_ident);
1781
1782 // Verify that there is nothing after the string, other than EOM.
1783 CheckEndOfDirective("#ident");
1784
1785 if (Callbacks)
1786 Callbacks->Ident(Tok.getLocation(), getSpelling(StrTok));
1787}
1788
1789//===----------------------------------------------------------------------===//
1790// Preprocessor Include Directive Handling.
1791//===----------------------------------------------------------------------===//
1792
1793/// GetIncludeFilenameSpelling - Turn the specified lexer token into a fully
1794/// checked and spelled filename, e.g. as an operand of #include. This returns
1795/// true if the input filename was in <>'s or false if it were in ""'s. The
1796/// caller is expected to provide a buffer that is large enough to hold the
1797/// spelling of the filename, but is also expected to handle the case when
1798/// this method decides to use a different buffer.
1799bool Preprocessor::GetIncludeFilenameSpelling(SourceLocation Loc,
1800 const char *&BufStart,
1801 const char *&BufEnd) {
1802 // Get the text form of the filename.
1803 assert(BufStart != BufEnd && "Can't have tokens with empty spellings!");
1804
1805 // Make sure the filename is <x> or "x".
1806 bool isAngled;
1807 if (BufStart[0] == '<') {
1808 if (BufEnd[-1] != '>') {
1809 Diag(Loc, diag::err_pp_expects_filename);
1810 BufStart = 0;
1811 return true;
1812 }
1813 isAngled = true;
1814 } else if (BufStart[0] == '"') {
1815 if (BufEnd[-1] != '"') {
1816 Diag(Loc, diag::err_pp_expects_filename);
1817 BufStart = 0;
1818 return true;
1819 }
1820 isAngled = false;
1821 } else {
1822 Diag(Loc, diag::err_pp_expects_filename);
1823 BufStart = 0;
1824 return true;
1825 }
1826
1827 // Diagnose #include "" as invalid.
1828 if (BufEnd-BufStart <= 2) {
1829 Diag(Loc, diag::err_pp_empty_filename);
1830 BufStart = 0;
1831 return "";
1832 }
1833
1834 // Skip the brackets.
1835 ++BufStart;
1836 --BufEnd;
1837 return isAngled;
1838}
1839
1840/// ConcatenateIncludeName - Handle cases where the #include name is expanded
1841/// from a macro as multiple tokens, which need to be glued together. This
1842/// occurs for code like:
1843/// #define FOO <a/b.h>
1844/// #include FOO
1845/// because in this case, "<a/b.h>" is returned as 7 tokens, not one.
1846///
1847/// This code concatenates and consumes tokens up to the '>' token. It returns
1848/// false if the > was found, otherwise it returns true if it finds and consumes
1849/// the EOM marker.
1850static bool ConcatenateIncludeName(llvm::SmallVector<char, 128> &FilenameBuffer,
1851 Preprocessor &PP) {
1852 Token CurTok;
1853
1854 PP.Lex(CurTok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001855 while (CurTok.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001856 // Append the spelling of this token to the buffer. If there was a space
1857 // before it, add it now.
1858 if (CurTok.hasLeadingSpace())
1859 FilenameBuffer.push_back(' ');
1860
1861 // Get the spelling of the token, directly into FilenameBuffer if possible.
1862 unsigned PreAppendSize = FilenameBuffer.size();
1863 FilenameBuffer.resize(PreAppendSize+CurTok.getLength());
1864
1865 const char *BufPtr = &FilenameBuffer[PreAppendSize];
1866 unsigned ActualLen = PP.getSpelling(CurTok, BufPtr);
1867
1868 // If the token was spelled somewhere else, copy it into FilenameBuffer.
1869 if (BufPtr != &FilenameBuffer[PreAppendSize])
1870 memcpy(&FilenameBuffer[PreAppendSize], BufPtr, ActualLen);
1871
1872 // Resize FilenameBuffer to the correct size.
1873 if (CurTok.getLength() != ActualLen)
1874 FilenameBuffer.resize(PreAppendSize+ActualLen);
1875
1876 // If we found the '>' marker, return success.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001877 if (CurTok.is(tok::greater))
Chris Lattner4b009652007-07-25 00:24:17 +00001878 return false;
1879
1880 PP.Lex(CurTok);
1881 }
1882
1883 // If we hit the eom marker, emit an error and return true so that the caller
1884 // knows the EOM has been read.
1885 PP.Diag(CurTok.getLocation(), diag::err_pp_expects_filename);
1886 return true;
1887}
1888
1889/// HandleIncludeDirective - The "#include" tokens have just been read, read the
1890/// file to be included from the lexer, then include it! This is a common
1891/// routine with functionality shared between #include, #include_next and
1892/// #import.
1893void Preprocessor::HandleIncludeDirective(Token &IncludeTok,
1894 const DirectoryLookup *LookupFrom,
1895 bool isImport) {
1896
1897 Token FilenameTok;
1898 CurLexer->LexIncludeFilename(FilenameTok);
1899
1900 // Reserve a buffer to get the spelling.
1901 llvm::SmallVector<char, 128> FilenameBuffer;
1902 const char *FilenameStart, *FilenameEnd;
1903
1904 switch (FilenameTok.getKind()) {
1905 case tok::eom:
1906 // If the token kind is EOM, the error has already been diagnosed.
1907 return;
1908
1909 case tok::angle_string_literal:
1910 case tok::string_literal: {
1911 FilenameBuffer.resize(FilenameTok.getLength());
1912 FilenameStart = &FilenameBuffer[0];
1913 unsigned Len = getSpelling(FilenameTok, FilenameStart);
1914 FilenameEnd = FilenameStart+Len;
1915 break;
1916 }
1917
1918 case tok::less:
1919 // This could be a <foo/bar.h> file coming from a macro expansion. In this
1920 // case, glue the tokens together into FilenameBuffer and interpret those.
1921 FilenameBuffer.push_back('<');
1922 if (ConcatenateIncludeName(FilenameBuffer, *this))
1923 return; // Found <eom> but no ">"? Diagnostic already emitted.
1924 FilenameStart = &FilenameBuffer[0];
1925 FilenameEnd = &FilenameBuffer[FilenameBuffer.size()];
1926 break;
1927 default:
1928 Diag(FilenameTok.getLocation(), diag::err_pp_expects_filename);
1929 DiscardUntilEndOfDirective();
1930 return;
1931 }
1932
1933 bool isAngled = GetIncludeFilenameSpelling(FilenameTok.getLocation(),
1934 FilenameStart, FilenameEnd);
1935 // If GetIncludeFilenameSpelling set the start ptr to null, there was an
1936 // error.
1937 if (FilenameStart == 0) {
1938 DiscardUntilEndOfDirective();
1939 return;
1940 }
1941
1942 // Verify that there is nothing after the filename, other than EOM. Use the
1943 // preprocessor to lex this in case lexing the filename entered a macro.
1944 CheckEndOfDirective("#include");
1945
1946 // Check that we don't have infinite #include recursion.
1947 if (IncludeMacroStack.size() == MaxAllowedIncludeStackDepth-1)
1948 return Diag(FilenameTok, diag::err_pp_include_too_deep);
1949
1950 // Search include directories.
1951 const DirectoryLookup *CurDir;
1952 const FileEntry *File = LookupFile(FilenameStart, FilenameEnd,
1953 isAngled, LookupFrom, CurDir);
1954 if (File == 0)
1955 return Diag(FilenameTok, diag::err_pp_file_not_found,
1956 std::string(FilenameStart, FilenameEnd));
1957
1958 // Ask HeaderInfo if we should enter this #include file.
1959 if (!HeaderInfo.ShouldEnterIncludeFile(File, isImport)) {
1960 // If it returns true, #including this file will have no effect.
1961 return;
1962 }
1963
1964 // Look up the file, create a File ID for it.
1965 unsigned FileID = SourceMgr.createFileID(File, FilenameTok.getLocation());
1966 if (FileID == 0)
1967 return Diag(FilenameTok, diag::err_pp_file_not_found,
1968 std::string(FilenameStart, FilenameEnd));
1969
1970 // Finally, if all is good, enter the new file!
1971 EnterSourceFile(FileID, CurDir);
1972}
1973
1974/// HandleIncludeNextDirective - Implements #include_next.
1975///
1976void Preprocessor::HandleIncludeNextDirective(Token &IncludeNextTok) {
1977 Diag(IncludeNextTok, diag::ext_pp_include_next_directive);
1978
1979 // #include_next is like #include, except that we start searching after
1980 // the current found directory. If we can't do this, issue a
1981 // diagnostic.
1982 const DirectoryLookup *Lookup = CurDirLookup;
1983 if (isInPrimaryFile()) {
1984 Lookup = 0;
1985 Diag(IncludeNextTok, diag::pp_include_next_in_primary);
1986 } else if (Lookup == 0) {
1987 Diag(IncludeNextTok, diag::pp_include_next_absolute_path);
1988 } else {
1989 // Start looking up in the next directory.
1990 ++Lookup;
1991 }
1992
1993 return HandleIncludeDirective(IncludeNextTok, Lookup);
1994}
1995
1996/// HandleImportDirective - Implements #import.
1997///
1998void Preprocessor::HandleImportDirective(Token &ImportTok) {
1999 Diag(ImportTok, diag::ext_pp_import_directive);
2000
2001 return HandleIncludeDirective(ImportTok, 0, true);
2002}
2003
2004//===----------------------------------------------------------------------===//
2005// Preprocessor Macro Directive Handling.
2006//===----------------------------------------------------------------------===//
2007
2008/// ReadMacroDefinitionArgList - The ( starting an argument list of a macro
2009/// definition has just been read. Lex the rest of the arguments and the
2010/// closing ), updating MI with what we learn. Return true if an error occurs
2011/// parsing the arg list.
2012bool Preprocessor::ReadMacroDefinitionArgList(MacroInfo *MI) {
2013 llvm::SmallVector<IdentifierInfo*, 32> Arguments;
2014
2015 Token Tok;
2016 while (1) {
2017 LexUnexpandedToken(Tok);
2018 switch (Tok.getKind()) {
2019 case tok::r_paren:
2020 // Found the end of the argument list.
2021 if (Arguments.empty()) { // #define FOO()
2022 MI->setArgumentList(Arguments.begin(), Arguments.end());
2023 return false;
2024 }
2025 // Otherwise we have #define FOO(A,)
2026 Diag(Tok, diag::err_pp_expected_ident_in_arg_list);
2027 return true;
2028 case tok::ellipsis: // #define X(... -> C99 varargs
2029 // Warn if use of C99 feature in non-C99 mode.
2030 if (!Features.C99) Diag(Tok, diag::ext_variadic_macro);
2031
2032 // Lex the token after the identifier.
2033 LexUnexpandedToken(Tok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002034 if (Tok.isNot(tok::r_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002035 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2036 return true;
2037 }
2038 // Add the __VA_ARGS__ identifier as an argument.
2039 Arguments.push_back(Ident__VA_ARGS__);
2040 MI->setIsC99Varargs();
2041 MI->setArgumentList(Arguments.begin(), Arguments.end());
2042 return false;
2043 case tok::eom: // #define X(
2044 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2045 return true;
2046 default:
2047 // Handle keywords and identifiers here to accept things like
2048 // #define Foo(for) for.
2049 IdentifierInfo *II = Tok.getIdentifierInfo();
2050 if (II == 0) {
2051 // #define X(1
2052 Diag(Tok, diag::err_pp_invalid_tok_in_arg_list);
2053 return true;
2054 }
2055
2056 // If this is already used as an argument, it is used multiple times (e.g.
2057 // #define X(A,A.
2058 if (std::find(Arguments.begin(), Arguments.end(), II) !=
2059 Arguments.end()) { // C99 6.10.3p6
2060 Diag(Tok, diag::err_pp_duplicate_name_in_arg_list, II->getName());
2061 return true;
2062 }
2063
2064 // Add the argument to the macro info.
2065 Arguments.push_back(II);
2066
2067 // Lex the token after the identifier.
2068 LexUnexpandedToken(Tok);
2069
2070 switch (Tok.getKind()) {
2071 default: // #define X(A B
2072 Diag(Tok, diag::err_pp_expected_comma_in_arg_list);
2073 return true;
2074 case tok::r_paren: // #define X(A)
2075 MI->setArgumentList(Arguments.begin(), Arguments.end());
2076 return false;
2077 case tok::comma: // #define X(A,
2078 break;
2079 case tok::ellipsis: // #define X(A... -> GCC extension
2080 // Diagnose extension.
2081 Diag(Tok, diag::ext_named_variadic_macro);
2082
2083 // Lex the token after the identifier.
2084 LexUnexpandedToken(Tok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002085 if (Tok.isNot(tok::r_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002086 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2087 return true;
2088 }
2089
2090 MI->setIsGNUVarargs();
2091 MI->setArgumentList(Arguments.begin(), Arguments.end());
2092 return false;
2093 }
2094 }
2095 }
2096}
2097
2098/// HandleDefineDirective - Implements #define. This consumes the entire macro
2099/// line then lets the caller lex the next real token. If 'isTargetSpecific' is
2100/// true, then this is a "#define_target", otherwise this is a "#define".
2101///
2102void Preprocessor::HandleDefineDirective(Token &DefineTok,
2103 bool isTargetSpecific) {
2104 ++NumDefined;
2105
2106 Token MacroNameTok;
2107 ReadMacroName(MacroNameTok, 1);
2108
2109 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002110 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00002111 return;
2112
2113 // If we are supposed to keep comments in #defines, reenable comment saving
2114 // mode.
2115 CurLexer->KeepCommentMode = KeepMacroComments;
2116
2117 // Create the new macro.
2118 MacroInfo *MI = new MacroInfo(MacroNameTok.getLocation());
2119 if (isTargetSpecific) MI->setIsTargetSpecific();
2120
2121 // If the identifier is an 'other target' macro, clear this bit.
2122 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro(false);
2123
2124
2125 Token Tok;
2126 LexUnexpandedToken(Tok);
2127
2128 // If this is a function-like macro definition, parse the argument list,
2129 // marking each of the identifiers as being used as macro arguments. Also,
2130 // check other constraints on the first token of the macro body.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002131 if (Tok.is(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002132 // If there is no body to this macro, we have no special handling here.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002133 } else if (Tok.is(tok::l_paren) && !Tok.hasLeadingSpace()) {
Chris Lattner4b009652007-07-25 00:24:17 +00002134 // This is a function-like macro definition. Read the argument list.
2135 MI->setIsFunctionLike();
2136 if (ReadMacroDefinitionArgList(MI)) {
2137 // Forget about MI.
2138 delete MI;
2139 // Throw away the rest of the line.
2140 if (CurLexer->ParsingPreprocessorDirective)
2141 DiscardUntilEndOfDirective();
2142 return;
2143 }
2144
2145 // Read the first token after the arg list for down below.
2146 LexUnexpandedToken(Tok);
2147 } else if (!Tok.hasLeadingSpace()) {
2148 // C99 requires whitespace between the macro definition and the body. Emit
2149 // a diagnostic for something like "#define X+".
2150 if (Features.C99) {
2151 Diag(Tok, diag::ext_c99_whitespace_required_after_macro_name);
2152 } else {
2153 // FIXME: C90/C++ do not get this diagnostic, but it does get a similar
2154 // one in some cases!
2155 }
2156 } else {
2157 // This is a normal token with leading space. Clear the leading space
2158 // marker on the first token to get proper expansion.
2159 Tok.clearFlag(Token::LeadingSpace);
2160 }
2161
2162 // If this is a definition of a variadic C99 function-like macro, not using
2163 // the GNU named varargs extension, enabled __VA_ARGS__.
2164
2165 // "Poison" __VA_ARGS__, which can only appear in the expansion of a macro.
2166 // This gets unpoisoned where it is allowed.
2167 assert(Ident__VA_ARGS__->isPoisoned() && "__VA_ARGS__ should be poisoned!");
2168 if (MI->isC99Varargs())
2169 Ident__VA_ARGS__->setIsPoisoned(false);
2170
2171 // Read the rest of the macro body.
2172 if (MI->isObjectLike()) {
2173 // Object-like macros are very simple, just read their body.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002174 while (Tok.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002175 MI->AddTokenToBody(Tok);
2176 // Get the next token of the macro.
2177 LexUnexpandedToken(Tok);
2178 }
2179
2180 } else {
2181 // Otherwise, read the body of a function-like macro. This has to validate
2182 // the # (stringize) operator.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002183 while (Tok.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002184 MI->AddTokenToBody(Tok);
2185
2186 // Check C99 6.10.3.2p1: ensure that # operators are followed by macro
2187 // parameters in function-like macro expansions.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002188 if (Tok.isNot(tok::hash)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002189 // Get the next token of the macro.
2190 LexUnexpandedToken(Tok);
2191 continue;
2192 }
2193
2194 // Get the next token of the macro.
2195 LexUnexpandedToken(Tok);
2196
2197 // Not a macro arg identifier?
2198 if (!Tok.getIdentifierInfo() ||
2199 MI->getArgumentNum(Tok.getIdentifierInfo()) == -1) {
2200 Diag(Tok, diag::err_pp_stringize_not_parameter);
2201 delete MI;
2202
2203 // Disable __VA_ARGS__ again.
2204 Ident__VA_ARGS__->setIsPoisoned(true);
2205 return;
2206 }
2207
2208 // Things look ok, add the param name token to the macro.
2209 MI->AddTokenToBody(Tok);
2210
2211 // Get the next token of the macro.
2212 LexUnexpandedToken(Tok);
2213 }
2214 }
2215
2216
2217 // Disable __VA_ARGS__ again.
2218 Ident__VA_ARGS__->setIsPoisoned(true);
2219
2220 // Check that there is no paste (##) operator at the begining or end of the
2221 // replacement list.
2222 unsigned NumTokens = MI->getNumTokens();
2223 if (NumTokens != 0) {
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002224 if (MI->getReplacementToken(0).is(tok::hashhash)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002225 Diag(MI->getReplacementToken(0), diag::err_paste_at_start);
2226 delete MI;
2227 return;
2228 }
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002229 if (MI->getReplacementToken(NumTokens-1).is(tok::hashhash)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002230 Diag(MI->getReplacementToken(NumTokens-1), diag::err_paste_at_end);
2231 delete MI;
2232 return;
2233 }
2234 }
2235
2236 // If this is the primary source file, remember that this macro hasn't been
2237 // used yet.
2238 if (isInPrimaryFile())
2239 MI->setIsUsed(false);
2240
2241 // Finally, if this identifier already had a macro defined for it, verify that
2242 // the macro bodies are identical and free the old definition.
Chris Lattner7a1b0882007-10-07 08:44:20 +00002243 if (MacroInfo *OtherMI = getMacroInfo(MacroNameTok.getIdentifierInfo())) {
Chris Lattner4b009652007-07-25 00:24:17 +00002244 if (!OtherMI->isUsed())
2245 Diag(OtherMI->getDefinitionLoc(), diag::pp_macro_not_used);
2246
2247 // Macros must be identical. This means all tokes and whitespace separation
2248 // must be the same. C99 6.10.3.2.
2249 if (!MI->isIdenticalTo(*OtherMI, *this)) {
2250 Diag(MI->getDefinitionLoc(), diag::ext_pp_macro_redef,
2251 MacroNameTok.getIdentifierInfo()->getName());
2252 Diag(OtherMI->getDefinitionLoc(), diag::ext_pp_macro_redef2);
2253 }
2254 delete OtherMI;
2255 }
2256
Chris Lattner7a1b0882007-10-07 08:44:20 +00002257 setMacroInfo(MacroNameTok.getIdentifierInfo(), MI);
Chris Lattner4b009652007-07-25 00:24:17 +00002258}
2259
2260/// HandleDefineOtherTargetDirective - Implements #define_other_target.
2261void Preprocessor::HandleDefineOtherTargetDirective(Token &Tok) {
2262 Token MacroNameTok;
2263 ReadMacroName(MacroNameTok, 1);
2264
2265 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002266 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00002267 return;
2268
2269 // Check to see if this is the last token on the #undef line.
2270 CheckEndOfDirective("#define_other_target");
2271
2272 // If there is already a macro defined by this name, turn it into a
2273 // target-specific define.
Chris Lattner7a1b0882007-10-07 08:44:20 +00002274 if (MacroInfo *MI = getMacroInfo(MacroNameTok.getIdentifierInfo())) {
Chris Lattner4b009652007-07-25 00:24:17 +00002275 MI->setIsTargetSpecific(true);
2276 return;
2277 }
2278
2279 // Mark the identifier as being a macro on some other target.
2280 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro();
2281}
2282
2283
2284/// HandleUndefDirective - Implements #undef.
2285///
2286void Preprocessor::HandleUndefDirective(Token &UndefTok) {
2287 ++NumUndefined;
2288
2289 Token MacroNameTok;
2290 ReadMacroName(MacroNameTok, 2);
2291
2292 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002293 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00002294 return;
2295
2296 // Check to see if this is the last token on the #undef line.
2297 CheckEndOfDirective("#undef");
2298
2299 // Okay, we finally have a valid identifier to undef.
Chris Lattner7a1b0882007-10-07 08:44:20 +00002300 MacroInfo *MI = getMacroInfo(MacroNameTok.getIdentifierInfo());
Chris Lattner4b009652007-07-25 00:24:17 +00002301
2302 // #undef untaints an identifier if it were marked by define_other_target.
2303 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro(false);
2304
2305 // If the macro is not defined, this is a noop undef, just return.
2306 if (MI == 0) return;
2307
2308 if (!MI->isUsed())
2309 Diag(MI->getDefinitionLoc(), diag::pp_macro_not_used);
2310
2311 // Free macro definition.
2312 delete MI;
Chris Lattner7a1b0882007-10-07 08:44:20 +00002313 setMacroInfo(MacroNameTok.getIdentifierInfo(), 0);
Chris Lattner4b009652007-07-25 00:24:17 +00002314}
2315
2316
2317//===----------------------------------------------------------------------===//
2318// Preprocessor Conditional Directive Handling.
2319//===----------------------------------------------------------------------===//
2320
2321/// HandleIfdefDirective - Implements the #ifdef/#ifndef directive. isIfndef is
2322/// true when this is a #ifndef directive. ReadAnyTokensBeforeDirective is true
2323/// if any tokens have been returned or pp-directives activated before this
2324/// #ifndef has been lexed.
2325///
2326void Preprocessor::HandleIfdefDirective(Token &Result, bool isIfndef,
2327 bool ReadAnyTokensBeforeDirective) {
2328 ++NumIf;
2329 Token DirectiveTok = Result;
2330
2331 Token MacroNameTok;
2332 ReadMacroName(MacroNameTok);
2333
2334 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002335 if (MacroNameTok.is(tok::eom)) {
Chris Lattnere6cdeb52007-09-24 05:14:57 +00002336 // Skip code until we get to #endif. This helps with recovery by not
2337 // emitting an error when the #endif is reached.
2338 SkipExcludedConditionalBlock(DirectiveTok.getLocation(),
2339 /*Foundnonskip*/false, /*FoundElse*/false);
Chris Lattner4b009652007-07-25 00:24:17 +00002340 return;
Chris Lattnere6cdeb52007-09-24 05:14:57 +00002341 }
Chris Lattner4b009652007-07-25 00:24:17 +00002342
2343 // Check to see if this is the last token on the #if[n]def line.
2344 CheckEndOfDirective(isIfndef ? "#ifndef" : "#ifdef");
2345
2346 // If the start of a top-level #ifdef, inform MIOpt.
2347 if (!ReadAnyTokensBeforeDirective &&
2348 CurLexer->getConditionalStackDepth() == 0) {
2349 assert(isIfndef && "#ifdef shouldn't reach here");
2350 CurLexer->MIOpt.EnterTopLevelIFNDEF(MacroNameTok.getIdentifierInfo());
2351 }
2352
2353 IdentifierInfo *MII = MacroNameTok.getIdentifierInfo();
Chris Lattner7a1b0882007-10-07 08:44:20 +00002354 MacroInfo *MI = getMacroInfo(MII);
Chris Lattner4b009652007-07-25 00:24:17 +00002355
2356 // If there is a macro, process it.
2357 if (MI) {
2358 // Mark it used.
2359 MI->setIsUsed(true);
2360
2361 // If this is the first use of a target-specific macro, warn about it.
2362 if (MI->isTargetSpecific()) {
2363 MI->setIsTargetSpecific(false); // Don't warn on second use.
Ted Kremenekd7f64cd2007-12-12 22:39:36 +00002364 getTargetInfo().DiagnoseNonPortability(
2365 getFullLoc(MacroNameTok.getLocation()),
2366 diag::port_target_macro_use);
Chris Lattner4b009652007-07-25 00:24:17 +00002367 }
2368 } else {
2369 // Use of a target-specific macro for some other target? If so, warn.
2370 if (MII->isOtherTargetMacro()) {
2371 MII->setIsOtherTargetMacro(false); // Don't warn on second use.
Ted Kremenekd7f64cd2007-12-12 22:39:36 +00002372 getTargetInfo().DiagnoseNonPortability(
2373 getFullLoc(MacroNameTok.getLocation()),
2374 diag::port_target_macro_use);
Chris Lattner4b009652007-07-25 00:24:17 +00002375 }
2376 }
2377
2378 // Should we include the stuff contained by this directive?
2379 if (!MI == isIfndef) {
2380 // Yes, remember that we are inside a conditional, then lex the next token.
2381 CurLexer->pushConditionalLevel(DirectiveTok.getLocation(), /*wasskip*/false,
2382 /*foundnonskip*/true, /*foundelse*/false);
2383 } else {
2384 // No, skip the contents of this block and return the first token after it.
2385 SkipExcludedConditionalBlock(DirectiveTok.getLocation(),
2386 /*Foundnonskip*/false,
2387 /*FoundElse*/false);
2388 }
2389}
2390
2391/// HandleIfDirective - Implements the #if directive.
2392///
2393void Preprocessor::HandleIfDirective(Token &IfToken,
2394 bool ReadAnyTokensBeforeDirective) {
2395 ++NumIf;
2396
2397 // Parse and evaluation the conditional expression.
2398 IdentifierInfo *IfNDefMacro = 0;
2399 bool ConditionalTrue = EvaluateDirectiveExpression(IfNDefMacro);
2400
2401 // Should we include the stuff contained by this directive?
2402 if (ConditionalTrue) {
2403 // If this condition is equivalent to #ifndef X, and if this is the first
2404 // directive seen, handle it for the multiple-include optimization.
2405 if (!ReadAnyTokensBeforeDirective &&
2406 CurLexer->getConditionalStackDepth() == 0 && IfNDefMacro)
2407 CurLexer->MIOpt.EnterTopLevelIFNDEF(IfNDefMacro);
2408
2409 // Yes, remember that we are inside a conditional, then lex the next token.
2410 CurLexer->pushConditionalLevel(IfToken.getLocation(), /*wasskip*/false,
2411 /*foundnonskip*/true, /*foundelse*/false);
2412 } else {
2413 // No, skip the contents of this block and return the first token after it.
2414 SkipExcludedConditionalBlock(IfToken.getLocation(), /*Foundnonskip*/false,
2415 /*FoundElse*/false);
2416 }
2417}
2418
2419/// HandleEndifDirective - Implements the #endif directive.
2420///
2421void Preprocessor::HandleEndifDirective(Token &EndifToken) {
2422 ++NumEndif;
2423
2424 // Check that this is the whole directive.
2425 CheckEndOfDirective("#endif");
2426
2427 PPConditionalInfo CondInfo;
2428 if (CurLexer->popConditionalLevel(CondInfo)) {
2429 // No conditionals on the stack: this is an #endif without an #if.
2430 return Diag(EndifToken, diag::err_pp_endif_without_if);
2431 }
2432
2433 // If this the end of a top-level #endif, inform MIOpt.
2434 if (CurLexer->getConditionalStackDepth() == 0)
2435 CurLexer->MIOpt.ExitTopLevelConditional();
2436
2437 assert(!CondInfo.WasSkipping && !CurLexer->LexingRawMode &&
2438 "This code should only be reachable in the non-skipping case!");
2439}
2440
2441
2442void Preprocessor::HandleElseDirective(Token &Result) {
2443 ++NumElse;
2444
2445 // #else directive in a non-skipping conditional... start skipping.
2446 CheckEndOfDirective("#else");
2447
2448 PPConditionalInfo CI;
2449 if (CurLexer->popConditionalLevel(CI))
2450 return Diag(Result, diag::pp_err_else_without_if);
2451
2452 // If this is a top-level #else, inform the MIOpt.
2453 if (CurLexer->getConditionalStackDepth() == 0)
2454 CurLexer->MIOpt.FoundTopLevelElse();
2455
2456 // If this is a #else with a #else before it, report the error.
2457 if (CI.FoundElse) Diag(Result, diag::pp_err_else_after_else);
2458
2459 // Finally, skip the rest of the contents of this block and return the first
2460 // token after it.
2461 return SkipExcludedConditionalBlock(CI.IfLoc, /*Foundnonskip*/true,
2462 /*FoundElse*/true);
2463}
2464
2465void Preprocessor::HandleElifDirective(Token &ElifToken) {
2466 ++NumElse;
2467
2468 // #elif directive in a non-skipping conditional... start skipping.
2469 // We don't care what the condition is, because we will always skip it (since
2470 // the block immediately before it was included).
2471 DiscardUntilEndOfDirective();
2472
2473 PPConditionalInfo CI;
2474 if (CurLexer->popConditionalLevel(CI))
2475 return Diag(ElifToken, diag::pp_err_elif_without_if);
2476
2477 // If this is a top-level #elif, inform the MIOpt.
2478 if (CurLexer->getConditionalStackDepth() == 0)
2479 CurLexer->MIOpt.FoundTopLevelElse();
2480
2481 // If this is a #elif with a #else before it, report the error.
2482 if (CI.FoundElse) Diag(ElifToken, diag::pp_err_elif_after_else);
2483
2484 // Finally, skip the rest of the contents of this block and return the first
2485 // token after it.
2486 return SkipExcludedConditionalBlock(CI.IfLoc, /*Foundnonskip*/true,
2487 /*FoundElse*/CI.FoundElse);
2488}
2489