blob: 0d3ac521d05638efb687a58c673fcbeab69bf975 [file] [log] [blame]
Chris Lattner4b009652007-07-25 00:24:17 +00001//===--- Preprocess.cpp - C Language Family Preprocessor Implementation ---===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the Preprocessor interface.
11//
12//===----------------------------------------------------------------------===//
13//
14// Options to support:
15// -H - Print the name of each header file used.
16// -d[MDNI] - Dump various things.
17// -fworking-directory - #line's with preprocessor's working dir.
18// -fpreprocessed
19// -dependency-file,-M,-MM,-MF,-MG,-MP,-MT,-MQ,-MD,-MMD
20// -W*
21// -w
22//
23// Messages to emit:
24// "Multiple include guards may be useful for:\n"
25//
26//===----------------------------------------------------------------------===//
27
28#include "clang/Lex/Preprocessor.h"
29#include "clang/Lex/HeaderSearch.h"
30#include "clang/Lex/MacroInfo.h"
31#include "clang/Lex/PPCallbacks.h"
32#include "clang/Lex/Pragma.h"
33#include "clang/Lex/ScratchBuffer.h"
34#include "clang/Basic/Diagnostic.h"
35#include "clang/Basic/FileManager.h"
36#include "clang/Basic/SourceManager.h"
37#include "clang/Basic/TargetInfo.h"
38#include "llvm/ADT/SmallVector.h"
39#include "llvm/Support/MemoryBuffer.h"
40#include <iostream>
Chris Lattner1b023182007-09-03 18:30:32 +000041#include <ctime>
Chris Lattner4b009652007-07-25 00:24:17 +000042using namespace clang;
43
44//===----------------------------------------------------------------------===//
45
46Preprocessor::Preprocessor(Diagnostic &diags, const LangOptions &opts,
47 TargetInfo &target, SourceManager &SM,
48 HeaderSearch &Headers)
49 : Diags(diags), Features(opts), Target(target), FileMgr(Headers.getFileMgr()),
50 SourceMgr(SM), HeaderInfo(Headers), Identifiers(opts),
51 CurLexer(0), CurDirLookup(0), CurMacroExpander(0), Callbacks(0) {
52 ScratchBuf = new ScratchBuffer(SourceMgr);
53
54 // Clear stats.
55 NumDirectives = NumDefined = NumUndefined = NumPragma = 0;
56 NumIf = NumElse = NumEndif = 0;
57 NumEnteredSourceFiles = 0;
58 NumMacroExpanded = NumFnMacroExpanded = NumBuiltinMacroExpanded = 0;
59 NumFastMacroExpanded = NumTokenPaste = NumFastTokenPaste = 0;
60 MaxIncludeStackDepth = 0;
61 NumSkipped = 0;
62
63 // Default to discarding comments.
64 KeepComments = false;
65 KeepMacroComments = false;
66
67 // Macro expansion is enabled.
68 DisableMacroExpansion = false;
69 InMacroArgs = false;
70 NumCachedMacroExpanders = 0;
71
72 // "Poison" __VA_ARGS__, which can only appear in the expansion of a macro.
73 // This gets unpoisoned where it is allowed.
74 (Ident__VA_ARGS__ = getIdentifierInfo("__VA_ARGS__"))->setIsPoisoned();
75
Chris Lattnerd1f21e12007-10-09 22:10:18 +000076 Predefines = 0;
77
Chris Lattner4b009652007-07-25 00:24:17 +000078 // Initialize the pragma handlers.
79 PragmaHandlers = new PragmaNamespace(0);
80 RegisterBuiltinPragmas();
81
82 // Initialize builtin macros like __LINE__ and friends.
83 RegisterBuiltinMacros();
84}
85
86Preprocessor::~Preprocessor() {
87 // Free any active lexers.
88 delete CurLexer;
89
90 while (!IncludeMacroStack.empty()) {
91 delete IncludeMacroStack.back().TheLexer;
92 delete IncludeMacroStack.back().TheMacroExpander;
93 IncludeMacroStack.pop_back();
94 }
Chris Lattner7a1b0882007-10-07 08:44:20 +000095
96 // Free any macro definitions.
97 for (llvm::DenseMap<IdentifierInfo*, MacroInfo*>::iterator I =
98 Macros.begin(), E = Macros.end(); I != E; ++I) {
99 // Free the macro definition.
100 delete I->second;
101 I->second = 0;
102 I->first->setHasMacroDefinition(false);
103 }
Chris Lattner4b009652007-07-25 00:24:17 +0000104
105 // Free any cached macro expanders.
106 for (unsigned i = 0, e = NumCachedMacroExpanders; i != e; ++i)
107 delete MacroExpanderCache[i];
108
109 // Release pragma information.
110 delete PragmaHandlers;
111
112 // Delete the scratch buffer info.
113 delete ScratchBuf;
114}
115
116PPCallbacks::~PPCallbacks() {
117}
118
119/// Diag - Forwarding function for diagnostics. This emits a diagnostic at
120/// the specified Token's location, translating the token's start
121/// position in the current buffer into a SourcePosition object for rendering.
122void Preprocessor::Diag(SourceLocation Loc, unsigned DiagID) {
123 Diags.Report(Loc, DiagID);
124}
125
126void Preprocessor::Diag(SourceLocation Loc, unsigned DiagID,
127 const std::string &Msg) {
128 Diags.Report(Loc, DiagID, &Msg, 1);
129}
130
131void Preprocessor::DumpToken(const Token &Tok, bool DumpFlags) const {
132 std::cerr << tok::getTokenName(Tok.getKind()) << " '"
133 << getSpelling(Tok) << "'";
134
135 if (!DumpFlags) return;
136 std::cerr << "\t";
137 if (Tok.isAtStartOfLine())
138 std::cerr << " [StartOfLine]";
139 if (Tok.hasLeadingSpace())
140 std::cerr << " [LeadingSpace]";
141 if (Tok.isExpandDisabled())
142 std::cerr << " [ExpandDisabled]";
143 if (Tok.needsCleaning()) {
144 const char *Start = SourceMgr.getCharacterData(Tok.getLocation());
145 std::cerr << " [UnClean='" << std::string(Start, Start+Tok.getLength())
146 << "']";
147 }
148}
149
150void Preprocessor::DumpMacro(const MacroInfo &MI) const {
151 std::cerr << "MACRO: ";
152 for (unsigned i = 0, e = MI.getNumTokens(); i != e; ++i) {
153 DumpToken(MI.getReplacementToken(i));
154 std::cerr << " ";
155 }
156 std::cerr << "\n";
157}
158
159void Preprocessor::PrintStats() {
160 std::cerr << "\n*** Preprocessor Stats:\n";
161 std::cerr << NumDirectives << " directives found:\n";
162 std::cerr << " " << NumDefined << " #define.\n";
163 std::cerr << " " << NumUndefined << " #undef.\n";
164 std::cerr << " #include/#include_next/#import:\n";
165 std::cerr << " " << NumEnteredSourceFiles << " source files entered.\n";
166 std::cerr << " " << MaxIncludeStackDepth << " max include stack depth\n";
167 std::cerr << " " << NumIf << " #if/#ifndef/#ifdef.\n";
168 std::cerr << " " << NumElse << " #else/#elif.\n";
169 std::cerr << " " << NumEndif << " #endif.\n";
170 std::cerr << " " << NumPragma << " #pragma.\n";
171 std::cerr << NumSkipped << " #if/#ifndef#ifdef regions skipped\n";
172
173 std::cerr << NumMacroExpanded << "/" << NumFnMacroExpanded << "/"
174 << NumBuiltinMacroExpanded << " obj/fn/builtin macros expanded, "
175 << NumFastMacroExpanded << " on the fast path.\n";
176 std::cerr << (NumFastTokenPaste+NumTokenPaste)
177 << " token paste (##) operations performed, "
178 << NumFastTokenPaste << " on the fast path.\n";
179}
180
181//===----------------------------------------------------------------------===//
182// Token Spelling
183//===----------------------------------------------------------------------===//
184
185
186/// getSpelling() - Return the 'spelling' of this token. The spelling of a
187/// token are the characters used to represent the token in the source file
188/// after trigraph expansion and escaped-newline folding. In particular, this
189/// wants to get the true, uncanonicalized, spelling of things like digraphs
190/// UCNs, etc.
191std::string Preprocessor::getSpelling(const Token &Tok) const {
192 assert((int)Tok.getLength() >= 0 && "Token character range is bogus!");
193
194 // If this token contains nothing interesting, return it directly.
195 const char *TokStart = SourceMgr.getCharacterData(Tok.getLocation());
196 if (!Tok.needsCleaning())
197 return std::string(TokStart, TokStart+Tok.getLength());
198
199 std::string Result;
200 Result.reserve(Tok.getLength());
201
202 // Otherwise, hard case, relex the characters into the string.
203 for (const char *Ptr = TokStart, *End = TokStart+Tok.getLength();
204 Ptr != End; ) {
205 unsigned CharSize;
206 Result.push_back(Lexer::getCharAndSizeNoWarn(Ptr, CharSize, Features));
207 Ptr += CharSize;
208 }
209 assert(Result.size() != unsigned(Tok.getLength()) &&
210 "NeedsCleaning flag set on something that didn't need cleaning!");
211 return Result;
212}
213
214/// getSpelling - This method is used to get the spelling of a token into a
215/// preallocated buffer, instead of as an std::string. The caller is required
216/// to allocate enough space for the token, which is guaranteed to be at least
217/// Tok.getLength() bytes long. The actual length of the token is returned.
218///
219/// Note that this method may do two possible things: it may either fill in
220/// the buffer specified with characters, or it may *change the input pointer*
221/// to point to a constant buffer with the data already in it (avoiding a
222/// copy). The caller is not allowed to modify the returned buffer pointer
223/// if an internal buffer is returned.
224unsigned Preprocessor::getSpelling(const Token &Tok,
225 const char *&Buffer) const {
226 assert((int)Tok.getLength() >= 0 && "Token character range is bogus!");
227
228 // If this token is an identifier, just return the string from the identifier
229 // table, which is very quick.
230 if (const IdentifierInfo *II = Tok.getIdentifierInfo()) {
231 Buffer = II->getName();
232
233 // Return the length of the token. If the token needed cleaning, don't
234 // include the size of the newlines or trigraphs in it.
235 if (!Tok.needsCleaning())
236 return Tok.getLength();
237 else
238 return strlen(Buffer);
239 }
240
241 // Otherwise, compute the start of the token in the input lexer buffer.
242 const char *TokStart = SourceMgr.getCharacterData(Tok.getLocation());
243
244 // If this token contains nothing interesting, return it directly.
245 if (!Tok.needsCleaning()) {
246 Buffer = TokStart;
247 return Tok.getLength();
248 }
249 // Otherwise, hard case, relex the characters into the string.
250 char *OutBuf = const_cast<char*>(Buffer);
251 for (const char *Ptr = TokStart, *End = TokStart+Tok.getLength();
252 Ptr != End; ) {
253 unsigned CharSize;
254 *OutBuf++ = Lexer::getCharAndSizeNoWarn(Ptr, CharSize, Features);
255 Ptr += CharSize;
256 }
257 assert(unsigned(OutBuf-Buffer) != Tok.getLength() &&
258 "NeedsCleaning flag set on something that didn't need cleaning!");
259
260 return OutBuf-Buffer;
261}
262
263
264/// CreateString - Plop the specified string into a scratch buffer and return a
265/// location for it. If specified, the source location provides a source
266/// location for the token.
267SourceLocation Preprocessor::
268CreateString(const char *Buf, unsigned Len, SourceLocation SLoc) {
269 if (SLoc.isValid())
270 return ScratchBuf->getToken(Buf, Len, SLoc);
271 return ScratchBuf->getToken(Buf, Len);
272}
273
274
275/// AdvanceToTokenCharacter - Given a location that specifies the start of a
276/// token, return a new location that specifies a character within the token.
277SourceLocation Preprocessor::AdvanceToTokenCharacter(SourceLocation TokStart,
278 unsigned CharNo) {
279 // If they request the first char of the token, we're trivially done. If this
280 // is a macro expansion, it doesn't make sense to point to a character within
281 // the instantiation point (the name). We could point to the source
282 // character, but without also pointing to instantiation info, this is
283 // confusing.
284 if (CharNo == 0 || TokStart.isMacroID()) return TokStart;
285
286 // Figure out how many physical characters away the specified logical
287 // character is. This needs to take into consideration newlines and
288 // trigraphs.
289 const char *TokPtr = SourceMgr.getCharacterData(TokStart);
290 unsigned PhysOffset = 0;
291
292 // The usual case is that tokens don't contain anything interesting. Skip
293 // over the uninteresting characters. If a token only consists of simple
294 // chars, this method is extremely fast.
295 while (CharNo && Lexer::isObviouslySimpleCharacter(*TokPtr))
296 ++TokPtr, --CharNo, ++PhysOffset;
297
298 // If we have a character that may be a trigraph or escaped newline, create a
299 // lexer to parse it correctly.
300 if (CharNo != 0) {
301 // Create a lexer starting at this token position.
302 Lexer TheLexer(TokStart, *this, TokPtr);
303 Token Tok;
304 // Skip over characters the remaining characters.
305 const char *TokStartPtr = TokPtr;
306 for (; CharNo; --CharNo)
307 TheLexer.getAndAdvanceChar(TokPtr, Tok);
308
309 PhysOffset += TokPtr-TokStartPtr;
310 }
311
312 return TokStart.getFileLocWithOffset(PhysOffset);
313}
314
315
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000316//===----------------------------------------------------------------------===//
317// Preprocessor Initialization Methods
318//===----------------------------------------------------------------------===//
319
320// Append a #define line to Buf for Macro. Macro should be of the form XXX,
321// in which case we emit "#define XXX 1" or "XXX=Y z W" in which case we emit
322// "#define XXX Y z W". To get a #define with no value, use "XXX=".
323static void DefineBuiltinMacro(std::vector<char> &Buf, const char *Macro,
324 const char *Command = "#define ") {
325 Buf.insert(Buf.end(), Command, Command+strlen(Command));
326 if (const char *Equal = strchr(Macro, '=')) {
327 // Turn the = into ' '.
328 Buf.insert(Buf.end(), Macro, Equal);
329 Buf.push_back(' ');
330 Buf.insert(Buf.end(), Equal+1, Equal+strlen(Equal));
331 } else {
332 // Push "macroname 1".
333 Buf.insert(Buf.end(), Macro, Macro+strlen(Macro));
334 Buf.push_back(' ');
335 Buf.push_back('1');
336 }
337 Buf.push_back('\n');
338}
339
340
341static void InitializePredefinedMacros(Preprocessor &PP,
342 std::vector<char> &Buf) {
343 // FIXME: Implement magic like cpp_init_builtins for things like __STDC__
344 // and __DATE__ etc.
345#if 0
346 /* __STDC__ has the value 1 under normal circumstances.
347 However, if (a) we are in a system header, (b) the option
348 stdc_0_in_system_headers is true (set by target config), and
349 (c) we are not in strictly conforming mode, then it has the
350 value 0. (b) and (c) are already checked in cpp_init_builtins. */
351 //case BT_STDC:
352 if (cpp_in_system_header (pfile))
353 number = 0;
354 else
355 number = 1;
356 break;
357#endif
358 // These should all be defined in the preprocessor according to the
359 // current language configuration.
360 DefineBuiltinMacro(Buf, "__STDC__=1");
361 //DefineBuiltinMacro(Buf, "__ASSEMBLER__=1");
362 if (PP.getLangOptions().C99 && !PP.getLangOptions().CPlusPlus)
363 DefineBuiltinMacro(Buf, "__STDC_VERSION__=199901L");
364 else if (0) // STDC94 ?
365 DefineBuiltinMacro(Buf, "__STDC_VERSION__=199409L");
366
367 DefineBuiltinMacro(Buf, "__STDC_HOSTED__=1");
368 if (PP.getLangOptions().ObjC1)
369 DefineBuiltinMacro(Buf, "__OBJC__=1");
370 if (PP.getLangOptions().ObjC2)
371 DefineBuiltinMacro(Buf, "__OBJC2__=1");
Steve Naroffae84af82007-10-31 18:42:27 +0000372
Chris Lattner77cec472007-10-10 17:48:53 +0000373 // Add __builtin_va_list typedef.
374 {
375 const char *VAList = PP.getTargetInfo().getVAListDeclaration();
376 Buf.insert(Buf.end(), VAList, VAList+strlen(VAList));
377 Buf.push_back('\n');
378 }
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000379
380 // Get the target #defines.
381 PP.getTargetInfo().getTargetDefines(Buf);
382
383 // Compiler set macros.
384 DefineBuiltinMacro(Buf, "__APPLE_CC__=5250");
385 DefineBuiltinMacro(Buf, "__ENVIRONMENT_MAC_OS_X_VERSION_MIN_REQUIRED__=1030");
386 DefineBuiltinMacro(Buf, "__GNUC_MINOR__=0");
387 DefineBuiltinMacro(Buf, "__GNUC_PATCHLEVEL__=1");
388 DefineBuiltinMacro(Buf, "__GNUC__=4");
389 DefineBuiltinMacro(Buf, "__GXX_ABI_VERSION=1002");
390 DefineBuiltinMacro(Buf, "__VERSION__=\"4.0.1 (Apple Computer, Inc. "
391 "build 5250)\"");
392
393 // Build configuration options.
394 DefineBuiltinMacro(Buf, "__DYNAMIC__=1");
395 DefineBuiltinMacro(Buf, "__FINITE_MATH_ONLY__=0");
396 DefineBuiltinMacro(Buf, "__NO_INLINE__=1");
397 DefineBuiltinMacro(Buf, "__PIC__=1");
398
399
400 if (PP.getLangOptions().CPlusPlus) {
401 DefineBuiltinMacro(Buf, "__DEPRECATED=1");
402 DefineBuiltinMacro(Buf, "__EXCEPTIONS=1");
403 DefineBuiltinMacro(Buf, "__GNUG__=4");
404 DefineBuiltinMacro(Buf, "__GXX_WEAK__=1");
405 DefineBuiltinMacro(Buf, "__cplusplus=1");
406 DefineBuiltinMacro(Buf, "__private_extern__=extern");
407 }
408
409 // FIXME: Should emit a #line directive here.
410}
411
412
413/// EnterMainSourceFile - Enter the specified FileID as the main source file,
414/// which implicitly adds the builting defines etc.
415void Preprocessor::EnterMainSourceFile(unsigned MainFileID) {
416 // Enter the main file source buffer.
417 EnterSourceFile(MainFileID, 0);
418
419
420 std::vector<char> PrologFile;
421 PrologFile.reserve(4080);
422
423 // Install things like __POWERPC__, __GNUC__, etc into the macro table.
424 InitializePredefinedMacros(*this, PrologFile);
425
426 // Add on the predefines from the driver.
427 PrologFile.insert(PrologFile.end(), Predefines,Predefines+strlen(Predefines));
428
429 // Memory buffer must end with a null byte!
430 PrologFile.push_back(0);
431
432 // Now that we have emitted the predefined macros, #includes, etc into
433 // PrologFile, preprocess it to populate the initial preprocessor state.
434 llvm::MemoryBuffer *SB =
435 llvm::MemoryBuffer::getMemBufferCopy(&PrologFile.front(),&PrologFile.back(),
436 "<predefines>");
437 assert(SB && "Cannot fail to create predefined source buffer");
438 unsigned FileID = SourceMgr.createFileIDForMemBuffer(SB);
439 assert(FileID && "Could not create FileID for predefines?");
440
441 // Start parsing the predefines.
442 EnterSourceFile(FileID, 0);
443}
Chris Lattner4b009652007-07-25 00:24:17 +0000444
445//===----------------------------------------------------------------------===//
446// Source File Location Methods.
447//===----------------------------------------------------------------------===//
448
449/// LookupFile - Given a "foo" or <foo> reference, look up the indicated file,
450/// return null on failure. isAngled indicates whether the file reference is
451/// for system #include's or not (i.e. using <> instead of "").
452const FileEntry *Preprocessor::LookupFile(const char *FilenameStart,
453 const char *FilenameEnd,
454 bool isAngled,
455 const DirectoryLookup *FromDir,
456 const DirectoryLookup *&CurDir) {
457 // If the header lookup mechanism may be relative to the current file, pass in
458 // info about where the current file is.
459 const FileEntry *CurFileEnt = 0;
460 if (!FromDir) {
461 SourceLocation FileLoc = getCurrentFileLexer()->getFileLoc();
462 CurFileEnt = SourceMgr.getFileEntryForLoc(FileLoc);
463 }
464
465 // Do a standard file entry lookup.
466 CurDir = CurDirLookup;
467 const FileEntry *FE =
468 HeaderInfo.LookupFile(FilenameStart, FilenameEnd,
469 isAngled, FromDir, CurDir, CurFileEnt);
470 if (FE) return FE;
471
472 // Otherwise, see if this is a subframework header. If so, this is relative
473 // to one of the headers on the #include stack. Walk the list of the current
474 // headers on the #include stack and pass them to HeaderInfo.
475 if (CurLexer && !CurLexer->Is_PragmaLexer) {
476 CurFileEnt = SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc());
477 if ((FE = HeaderInfo.LookupSubframeworkHeader(FilenameStart, FilenameEnd,
478 CurFileEnt)))
479 return FE;
480 }
481
482 for (unsigned i = 0, e = IncludeMacroStack.size(); i != e; ++i) {
483 IncludeStackInfo &ISEntry = IncludeMacroStack[e-i-1];
484 if (ISEntry.TheLexer && !ISEntry.TheLexer->Is_PragmaLexer) {
485 CurFileEnt = SourceMgr.getFileEntryForLoc(ISEntry.TheLexer->getFileLoc());
486 if ((FE = HeaderInfo.LookupSubframeworkHeader(FilenameStart, FilenameEnd,
487 CurFileEnt)))
488 return FE;
489 }
490 }
491
492 // Otherwise, we really couldn't find the file.
493 return 0;
494}
495
496/// isInPrimaryFile - Return true if we're in the top-level file, not in a
497/// #include.
498bool Preprocessor::isInPrimaryFile() const {
499 if (CurLexer && !CurLexer->Is_PragmaLexer)
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000500 return IncludeMacroStack.empty();
Chris Lattner4b009652007-07-25 00:24:17 +0000501
502 // If there are any stacked lexers, we're in a #include.
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000503 assert(IncludeMacroStack[0].TheLexer &&
504 !IncludeMacroStack[0].TheLexer->Is_PragmaLexer &&
505 "Top level include stack isn't our primary lexer?");
506 for (unsigned i = 1, e = IncludeMacroStack.size(); i != e; ++i)
Chris Lattner4b009652007-07-25 00:24:17 +0000507 if (IncludeMacroStack[i].TheLexer &&
508 !IncludeMacroStack[i].TheLexer->Is_PragmaLexer)
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000509 return false;
510 return true;
Chris Lattner4b009652007-07-25 00:24:17 +0000511}
512
513/// getCurrentLexer - Return the current file lexer being lexed from. Note
514/// that this ignores any potentially active macro expansions and _Pragma
515/// expansions going on at the time.
516Lexer *Preprocessor::getCurrentFileLexer() const {
517 if (CurLexer && !CurLexer->Is_PragmaLexer) return CurLexer;
518
519 // Look for a stacked lexer.
520 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
521 Lexer *L = IncludeMacroStack[i-1].TheLexer;
522 if (L && !L->Is_PragmaLexer) // Ignore macro & _Pragma expansions.
523 return L;
524 }
525 return 0;
526}
527
528
529/// EnterSourceFile - Add a source file to the top of the include stack and
530/// start lexing tokens from it instead of the current buffer. Return true
531/// on failure.
532void Preprocessor::EnterSourceFile(unsigned FileID,
Chris Lattnerd1f21e12007-10-09 22:10:18 +0000533 const DirectoryLookup *CurDir) {
Chris Lattner4b009652007-07-25 00:24:17 +0000534 assert(CurMacroExpander == 0 && "Cannot #include a file inside a macro!");
535 ++NumEnteredSourceFiles;
536
537 if (MaxIncludeStackDepth < IncludeMacroStack.size())
538 MaxIncludeStackDepth = IncludeMacroStack.size();
539
540 Lexer *TheLexer = new Lexer(SourceLocation::getFileLoc(FileID, 0), *this);
Chris Lattner4b009652007-07-25 00:24:17 +0000541 EnterSourceFileWithLexer(TheLexer, CurDir);
542}
543
544/// EnterSourceFile - Add a source file to the top of the include stack and
545/// start lexing tokens from it instead of the current buffer.
546void Preprocessor::EnterSourceFileWithLexer(Lexer *TheLexer,
547 const DirectoryLookup *CurDir) {
548
549 // Add the current lexer to the include stack.
550 if (CurLexer || CurMacroExpander)
551 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
552 CurMacroExpander));
553
554 CurLexer = TheLexer;
555 CurDirLookup = CurDir;
556 CurMacroExpander = 0;
557
558 // Notify the client, if desired, that we are in a new source file.
559 if (Callbacks && !CurLexer->Is_PragmaLexer) {
560 DirectoryLookup::DirType FileType = DirectoryLookup::NormalHeaderDir;
561
562 // Get the file entry for the current file.
563 if (const FileEntry *FE =
564 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
565 FileType = HeaderInfo.getFileDirFlavor(FE);
566
567 Callbacks->FileChanged(CurLexer->getFileLoc(),
568 PPCallbacks::EnterFile, FileType);
569 }
570}
571
572
573
574/// EnterMacro - Add a Macro to the top of the include stack and start lexing
575/// tokens from it instead of the current buffer.
576void Preprocessor::EnterMacro(Token &Tok, MacroArgs *Args) {
577 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
578 CurMacroExpander));
579 CurLexer = 0;
580 CurDirLookup = 0;
581
582 if (NumCachedMacroExpanders == 0) {
583 CurMacroExpander = new MacroExpander(Tok, Args, *this);
584 } else {
585 CurMacroExpander = MacroExpanderCache[--NumCachedMacroExpanders];
586 CurMacroExpander->Init(Tok, Args);
587 }
588}
589
590/// EnterTokenStream - Add a "macro" context to the top of the include stack,
591/// which will cause the lexer to start returning the specified tokens. Note
592/// that these tokens will be re-macro-expanded when/if expansion is enabled.
593/// This method assumes that the specified stream of tokens has a permanent
594/// owner somewhere, so they do not need to be copied.
595void Preprocessor::EnterTokenStream(const Token *Toks, unsigned NumToks) {
596 // Save our current state.
597 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
598 CurMacroExpander));
599 CurLexer = 0;
600 CurDirLookup = 0;
601
602 // Create a macro expander to expand from the specified token stream.
603 if (NumCachedMacroExpanders == 0) {
604 CurMacroExpander = new MacroExpander(Toks, NumToks, *this);
605 } else {
606 CurMacroExpander = MacroExpanderCache[--NumCachedMacroExpanders];
607 CurMacroExpander->Init(Toks, NumToks);
608 }
609}
610
611/// RemoveTopOfLexerStack - Pop the current lexer/macro exp off the top of the
612/// lexer stack. This should only be used in situations where the current
613/// state of the top-of-stack lexer is known.
614void Preprocessor::RemoveTopOfLexerStack() {
615 assert(!IncludeMacroStack.empty() && "Ran out of stack entries to load");
616
617 if (CurMacroExpander) {
618 // Delete or cache the now-dead macro expander.
619 if (NumCachedMacroExpanders == MacroExpanderCacheSize)
620 delete CurMacroExpander;
621 else
622 MacroExpanderCache[NumCachedMacroExpanders++] = CurMacroExpander;
623 } else {
624 delete CurLexer;
625 }
626 CurLexer = IncludeMacroStack.back().TheLexer;
627 CurDirLookup = IncludeMacroStack.back().TheDirLookup;
628 CurMacroExpander = IncludeMacroStack.back().TheMacroExpander;
629 IncludeMacroStack.pop_back();
630}
631
632//===----------------------------------------------------------------------===//
633// Macro Expansion Handling.
634//===----------------------------------------------------------------------===//
635
Chris Lattner7a1b0882007-10-07 08:44:20 +0000636/// setMacroInfo - Specify a macro for this identifier.
637///
638void Preprocessor::setMacroInfo(IdentifierInfo *II, MacroInfo *MI) {
639 if (MI == 0) {
640 if (II->hasMacroDefinition()) {
641 Macros.erase(II);
642 II->setHasMacroDefinition(false);
643 }
644 } else {
645 Macros[II] = MI;
646 II->setHasMacroDefinition(true);
647 }
648}
649
Chris Lattner4b009652007-07-25 00:24:17 +0000650/// RegisterBuiltinMacro - Register the specified identifier in the identifier
651/// table and mark it as a builtin macro to be expanded.
652IdentifierInfo *Preprocessor::RegisterBuiltinMacro(const char *Name) {
653 // Get the identifier.
654 IdentifierInfo *Id = getIdentifierInfo(Name);
655
656 // Mark it as being a macro that is builtin.
657 MacroInfo *MI = new MacroInfo(SourceLocation());
658 MI->setIsBuiltinMacro();
Chris Lattner7a1b0882007-10-07 08:44:20 +0000659 setMacroInfo(Id, MI);
Chris Lattner4b009652007-07-25 00:24:17 +0000660 return Id;
661}
662
663
664/// RegisterBuiltinMacros - Register builtin macros, such as __LINE__ with the
665/// identifier table.
666void Preprocessor::RegisterBuiltinMacros() {
667 Ident__LINE__ = RegisterBuiltinMacro("__LINE__");
668 Ident__FILE__ = RegisterBuiltinMacro("__FILE__");
669 Ident__DATE__ = RegisterBuiltinMacro("__DATE__");
670 Ident__TIME__ = RegisterBuiltinMacro("__TIME__");
671 Ident_Pragma = RegisterBuiltinMacro("_Pragma");
672
673 // GCC Extensions.
674 Ident__BASE_FILE__ = RegisterBuiltinMacro("__BASE_FILE__");
675 Ident__INCLUDE_LEVEL__ = RegisterBuiltinMacro("__INCLUDE_LEVEL__");
676 Ident__TIMESTAMP__ = RegisterBuiltinMacro("__TIMESTAMP__");
677}
678
679/// isTrivialSingleTokenExpansion - Return true if MI, which has a single token
680/// in its expansion, currently expands to that token literally.
681static bool isTrivialSingleTokenExpansion(const MacroInfo *MI,
Chris Lattner7a1b0882007-10-07 08:44:20 +0000682 const IdentifierInfo *MacroIdent,
683 Preprocessor &PP) {
Chris Lattner4b009652007-07-25 00:24:17 +0000684 IdentifierInfo *II = MI->getReplacementToken(0).getIdentifierInfo();
685
686 // If the token isn't an identifier, it's always literally expanded.
687 if (II == 0) return true;
688
689 // If the identifier is a macro, and if that macro is enabled, it may be
690 // expanded so it's not a trivial expansion.
Chris Lattner7a1b0882007-10-07 08:44:20 +0000691 if (II->hasMacroDefinition() && PP.getMacroInfo(II)->isEnabled() &&
Chris Lattner4b009652007-07-25 00:24:17 +0000692 // Fast expanding "#define X X" is ok, because X would be disabled.
693 II != MacroIdent)
694 return false;
695
696 // If this is an object-like macro invocation, it is safe to trivially expand
697 // it.
698 if (MI->isObjectLike()) return true;
699
700 // If this is a function-like macro invocation, it's safe to trivially expand
701 // as long as the identifier is not a macro argument.
702 for (MacroInfo::arg_iterator I = MI->arg_begin(), E = MI->arg_end();
703 I != E; ++I)
704 if (*I == II)
705 return false; // Identifier is a macro argument.
706
707 return true;
708}
709
710
711/// isNextPPTokenLParen - Determine whether the next preprocessor token to be
712/// lexed is a '('. If so, consume the token and return true, if not, this
713/// method should have no observable side-effect on the lexed tokens.
714bool Preprocessor::isNextPPTokenLParen() {
715 // Do some quick tests for rejection cases.
716 unsigned Val;
717 if (CurLexer)
718 Val = CurLexer->isNextPPTokenLParen();
719 else
720 Val = CurMacroExpander->isNextTokenLParen();
721
722 if (Val == 2) {
723 // We have run off the end. If it's a source file we don't
724 // examine enclosing ones (C99 5.1.1.2p4). Otherwise walk up the
725 // macro stack.
726 if (CurLexer)
727 return false;
728 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
729 IncludeStackInfo &Entry = IncludeMacroStack[i-1];
730 if (Entry.TheLexer)
731 Val = Entry.TheLexer->isNextPPTokenLParen();
732 else
733 Val = Entry.TheMacroExpander->isNextTokenLParen();
734
735 if (Val != 2)
736 break;
737
738 // Ran off the end of a source file?
739 if (Entry.TheLexer)
740 return false;
741 }
742 }
743
744 // Okay, if we know that the token is a '(', lex it and return. Otherwise we
745 // have found something that isn't a '(' or we found the end of the
746 // translation unit. In either case, return false.
747 if (Val != 1)
748 return false;
749
750 Token Tok;
751 LexUnexpandedToken(Tok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000752 assert(Tok.is(tok::l_paren) && "Error computing l-paren-ness?");
Chris Lattner4b009652007-07-25 00:24:17 +0000753 return true;
754}
755
756/// HandleMacroExpandedIdentifier - If an identifier token is read that is to be
757/// expanded as a macro, handle it and return the next token as 'Identifier'.
758bool Preprocessor::HandleMacroExpandedIdentifier(Token &Identifier,
759 MacroInfo *MI) {
760
761 // If this is a builtin macro, like __LINE__ or _Pragma, handle it specially.
762 if (MI->isBuiltinMacro()) {
763 ExpandBuiltinMacro(Identifier);
764 return false;
765 }
766
767 // If this is the first use of a target-specific macro, warn about it.
768 if (MI->isTargetSpecific()) {
769 MI->setIsTargetSpecific(false); // Don't warn on second use.
770 getTargetInfo().DiagnoseNonPortability(Identifier.getLocation(),
771 diag::port_target_macro_use);
772 }
773
774 /// Args - If this is a function-like macro expansion, this contains,
775 /// for each macro argument, the list of tokens that were provided to the
776 /// invocation.
777 MacroArgs *Args = 0;
778
779 // If this is a function-like macro, read the arguments.
780 if (MI->isFunctionLike()) {
781 // C99 6.10.3p10: If the preprocessing token immediately after the the macro
782 // name isn't a '(', this macro should not be expanded. Otherwise, consume
783 // it.
784 if (!isNextPPTokenLParen())
785 return true;
786
787 // Remember that we are now parsing the arguments to a macro invocation.
788 // Preprocessor directives used inside macro arguments are not portable, and
789 // this enables the warning.
790 InMacroArgs = true;
791 Args = ReadFunctionLikeMacroArgs(Identifier, MI);
792
793 // Finished parsing args.
794 InMacroArgs = false;
795
796 // If there was an error parsing the arguments, bail out.
797 if (Args == 0) return false;
798
799 ++NumFnMacroExpanded;
800 } else {
801 ++NumMacroExpanded;
802 }
803
804 // Notice that this macro has been used.
805 MI->setIsUsed(true);
806
807 // If we started lexing a macro, enter the macro expansion body.
808
809 // If this macro expands to no tokens, don't bother to push it onto the
810 // expansion stack, only to take it right back off.
811 if (MI->getNumTokens() == 0) {
812 // No need for arg info.
813 if (Args) Args->destroy();
814
815 // Ignore this macro use, just return the next token in the current
816 // buffer.
817 bool HadLeadingSpace = Identifier.hasLeadingSpace();
818 bool IsAtStartOfLine = Identifier.isAtStartOfLine();
819
820 Lex(Identifier);
821
822 // If the identifier isn't on some OTHER line, inherit the leading
823 // whitespace/first-on-a-line property of this token. This handles
824 // stuff like "! XX," -> "! ," and " XX," -> " ,", when XX is
825 // empty.
826 if (!Identifier.isAtStartOfLine()) {
827 if (IsAtStartOfLine) Identifier.setFlag(Token::StartOfLine);
828 if (HadLeadingSpace) Identifier.setFlag(Token::LeadingSpace);
829 }
830 ++NumFastMacroExpanded;
831 return false;
832
833 } else if (MI->getNumTokens() == 1 &&
Chris Lattner7a1b0882007-10-07 08:44:20 +0000834 isTrivialSingleTokenExpansion(MI, Identifier.getIdentifierInfo(),
835 *this)){
Chris Lattner4b009652007-07-25 00:24:17 +0000836 // Otherwise, if this macro expands into a single trivially-expanded
837 // token: expand it now. This handles common cases like
838 // "#define VAL 42".
839
840 // Propagate the isAtStartOfLine/hasLeadingSpace markers of the macro
841 // identifier to the expanded token.
842 bool isAtStartOfLine = Identifier.isAtStartOfLine();
843 bool hasLeadingSpace = Identifier.hasLeadingSpace();
844
845 // Remember where the token is instantiated.
846 SourceLocation InstantiateLoc = Identifier.getLocation();
847
848 // Replace the result token.
849 Identifier = MI->getReplacementToken(0);
850
851 // Restore the StartOfLine/LeadingSpace markers.
852 Identifier.setFlagValue(Token::StartOfLine , isAtStartOfLine);
853 Identifier.setFlagValue(Token::LeadingSpace, hasLeadingSpace);
854
855 // Update the tokens location to include both its logical and physical
856 // locations.
857 SourceLocation Loc =
858 SourceMgr.getInstantiationLoc(Identifier.getLocation(), InstantiateLoc);
859 Identifier.setLocation(Loc);
860
861 // If this is #define X X, we must mark the result as unexpandible.
862 if (IdentifierInfo *NewII = Identifier.getIdentifierInfo())
Chris Lattner7a1b0882007-10-07 08:44:20 +0000863 if (getMacroInfo(NewII) == MI)
Chris Lattner4b009652007-07-25 00:24:17 +0000864 Identifier.setFlag(Token::DisableExpand);
865
866 // Since this is not an identifier token, it can't be macro expanded, so
867 // we're done.
868 ++NumFastMacroExpanded;
869 return false;
870 }
871
872 // Start expanding the macro.
873 EnterMacro(Identifier, Args);
874
875 // Now that the macro is at the top of the include stack, ask the
876 // preprocessor to read the next token from it.
877 Lex(Identifier);
878 return false;
879}
880
881/// ReadFunctionLikeMacroArgs - After reading "MACRO(", this method is
882/// invoked to read all of the actual arguments specified for the macro
883/// invocation. This returns null on error.
884MacroArgs *Preprocessor::ReadFunctionLikeMacroArgs(Token &MacroName,
885 MacroInfo *MI) {
886 // The number of fixed arguments to parse.
887 unsigned NumFixedArgsLeft = MI->getNumArgs();
888 bool isVariadic = MI->isVariadic();
889
890 // Outer loop, while there are more arguments, keep reading them.
891 Token Tok;
892 Tok.setKind(tok::comma);
893 --NumFixedArgsLeft; // Start reading the first arg.
894
895 // ArgTokens - Build up a list of tokens that make up each argument. Each
896 // argument is separated by an EOF token. Use a SmallVector so we can avoid
897 // heap allocations in the common case.
898 llvm::SmallVector<Token, 64> ArgTokens;
899
900 unsigned NumActuals = 0;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000901 while (Tok.is(tok::comma)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000902 // C99 6.10.3p11: Keep track of the number of l_parens we have seen. Note
903 // that we already consumed the first one.
904 unsigned NumParens = 0;
905
906 while (1) {
907 // Read arguments as unexpanded tokens. This avoids issues, e.g., where
908 // an argument value in a macro could expand to ',' or '(' or ')'.
909 LexUnexpandedToken(Tok);
910
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000911 if (Tok.is(tok::eof)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000912 Diag(MacroName, diag::err_unterm_macro_invoc);
913 // Do not lose the EOF. Return it to the client.
914 MacroName = Tok;
915 return 0;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000916 } else if (Tok.is(tok::r_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000917 // If we found the ) token, the macro arg list is done.
918 if (NumParens-- == 0)
919 break;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000920 } else if (Tok.is(tok::l_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +0000921 ++NumParens;
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000922 } else if (Tok.is(tok::comma) && NumParens == 0) {
Chris Lattner4b009652007-07-25 00:24:17 +0000923 // Comma ends this argument if there are more fixed arguments expected.
924 if (NumFixedArgsLeft)
925 break;
926
927 // If this is not a variadic macro, too many args were specified.
928 if (!isVariadic) {
929 // Emit the diagnostic at the macro name in case there is a missing ).
930 // Emitting it at the , could be far away from the macro name.
931 Diag(MacroName, diag::err_too_many_args_in_macro_invoc);
932 return 0;
933 }
934 // Otherwise, continue to add the tokens to this variable argument.
Chris Lattnercb8e41c2007-10-09 18:02:16 +0000935 } else if (Tok.is(tok::comment) && !KeepMacroComments) {
Chris Lattner4b009652007-07-25 00:24:17 +0000936 // If this is a comment token in the argument list and we're just in
937 // -C mode (not -CC mode), discard the comment.
938 continue;
939 }
940
941 ArgTokens.push_back(Tok);
942 }
943
944 // Empty arguments are standard in C99 and supported as an extension in
945 // other modes.
946 if (ArgTokens.empty() && !Features.C99)
947 Diag(Tok, diag::ext_empty_fnmacro_arg);
948
949 // Add a marker EOF token to the end of the token list for this argument.
950 Token EOFTok;
951 EOFTok.startToken();
952 EOFTok.setKind(tok::eof);
953 EOFTok.setLocation(Tok.getLocation());
954 EOFTok.setLength(0);
955 ArgTokens.push_back(EOFTok);
956 ++NumActuals;
957 --NumFixedArgsLeft;
958 };
959
960 // Okay, we either found the r_paren. Check to see if we parsed too few
961 // arguments.
962 unsigned MinArgsExpected = MI->getNumArgs();
963
964 // See MacroArgs instance var for description of this.
965 bool isVarargsElided = false;
966
967 if (NumActuals < MinArgsExpected) {
968 // There are several cases where too few arguments is ok, handle them now.
969 if (NumActuals+1 == MinArgsExpected && MI->isVariadic()) {
970 // Varargs where the named vararg parameter is missing: ok as extension.
971 // #define A(x, ...)
972 // A("blah")
973 Diag(Tok, diag::ext_missing_varargs_arg);
974
975 // Remember this occurred if this is a C99 macro invocation with at least
976 // one actual argument.
977 isVarargsElided = MI->isC99Varargs() && MI->getNumArgs() > 1;
978 } else if (MI->getNumArgs() == 1) {
979 // #define A(x)
980 // A()
981 // is ok because it is an empty argument.
982
983 // Empty arguments are standard in C99 and supported as an extension in
984 // other modes.
985 if (ArgTokens.empty() && !Features.C99)
986 Diag(Tok, diag::ext_empty_fnmacro_arg);
987 } else {
988 // Otherwise, emit the error.
989 Diag(Tok, diag::err_too_few_args_in_macro_invoc);
990 return 0;
991 }
992
993 // Add a marker EOF token to the end of the token list for this argument.
994 SourceLocation EndLoc = Tok.getLocation();
995 Tok.startToken();
996 Tok.setKind(tok::eof);
997 Tok.setLocation(EndLoc);
998 Tok.setLength(0);
999 ArgTokens.push_back(Tok);
1000 }
1001
1002 return MacroArgs::create(MI, &ArgTokens[0], ArgTokens.size(),isVarargsElided);
1003}
1004
1005/// ComputeDATE_TIME - Compute the current time, enter it into the specified
1006/// scratch buffer, then return DATELoc/TIMELoc locations with the position of
1007/// the identifier tokens inserted.
1008static void ComputeDATE_TIME(SourceLocation &DATELoc, SourceLocation &TIMELoc,
1009 Preprocessor &PP) {
1010 time_t TT = time(0);
1011 struct tm *TM = localtime(&TT);
1012
1013 static const char * const Months[] = {
1014 "Jan","Feb","Mar","Apr","May","Jun","Jul","Aug","Sep","Oct","Nov","Dec"
1015 };
1016
1017 char TmpBuffer[100];
1018 sprintf(TmpBuffer, "\"%s %2d %4d\"", Months[TM->tm_mon], TM->tm_mday,
1019 TM->tm_year+1900);
1020 DATELoc = PP.CreateString(TmpBuffer, strlen(TmpBuffer));
1021
1022 sprintf(TmpBuffer, "\"%02d:%02d:%02d\"", TM->tm_hour, TM->tm_min, TM->tm_sec);
1023 TIMELoc = PP.CreateString(TmpBuffer, strlen(TmpBuffer));
1024}
1025
1026/// ExpandBuiltinMacro - If an identifier token is read that is to be expanded
1027/// as a builtin macro, handle it and return the next token as 'Tok'.
1028void Preprocessor::ExpandBuiltinMacro(Token &Tok) {
1029 // Figure out which token this is.
1030 IdentifierInfo *II = Tok.getIdentifierInfo();
1031 assert(II && "Can't be a macro without id info!");
1032
1033 // If this is an _Pragma directive, expand it, invoke the pragma handler, then
1034 // lex the token after it.
1035 if (II == Ident_Pragma)
1036 return Handle_Pragma(Tok);
1037
1038 ++NumBuiltinMacroExpanded;
1039
1040 char TmpBuffer[100];
1041
1042 // Set up the return result.
1043 Tok.setIdentifierInfo(0);
1044 Tok.clearFlag(Token::NeedsCleaning);
1045
1046 if (II == Ident__LINE__) {
1047 // __LINE__ expands to a simple numeric value.
1048 sprintf(TmpBuffer, "%u", SourceMgr.getLogicalLineNumber(Tok.getLocation()));
1049 unsigned Length = strlen(TmpBuffer);
1050 Tok.setKind(tok::numeric_constant);
1051 Tok.setLength(Length);
1052 Tok.setLocation(CreateString(TmpBuffer, Length, Tok.getLocation()));
1053 } else if (II == Ident__FILE__ || II == Ident__BASE_FILE__) {
1054 SourceLocation Loc = Tok.getLocation();
1055 if (II == Ident__BASE_FILE__) {
1056 Diag(Tok, diag::ext_pp_base_file);
1057 SourceLocation NextLoc = SourceMgr.getIncludeLoc(Loc);
1058 while (NextLoc.isValid()) {
1059 Loc = NextLoc;
1060 NextLoc = SourceMgr.getIncludeLoc(Loc);
1061 }
1062 }
1063
1064 // Escape this filename. Turn '\' -> '\\' '"' -> '\"'
1065 std::string FN = SourceMgr.getSourceName(SourceMgr.getLogicalLoc(Loc));
1066 FN = '"' + Lexer::Stringify(FN) + '"';
1067 Tok.setKind(tok::string_literal);
1068 Tok.setLength(FN.size());
1069 Tok.setLocation(CreateString(&FN[0], FN.size(), Tok.getLocation()));
1070 } else if (II == Ident__DATE__) {
1071 if (!DATELoc.isValid())
1072 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1073 Tok.setKind(tok::string_literal);
1074 Tok.setLength(strlen("\"Mmm dd yyyy\""));
1075 Tok.setLocation(SourceMgr.getInstantiationLoc(DATELoc, Tok.getLocation()));
1076 } else if (II == Ident__TIME__) {
1077 if (!TIMELoc.isValid())
1078 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1079 Tok.setKind(tok::string_literal);
1080 Tok.setLength(strlen("\"hh:mm:ss\""));
1081 Tok.setLocation(SourceMgr.getInstantiationLoc(TIMELoc, Tok.getLocation()));
1082 } else if (II == Ident__INCLUDE_LEVEL__) {
1083 Diag(Tok, diag::ext_pp_include_level);
1084
1085 // Compute the include depth of this token.
1086 unsigned Depth = 0;
1087 SourceLocation Loc = SourceMgr.getIncludeLoc(Tok.getLocation());
1088 for (; Loc.isValid(); ++Depth)
1089 Loc = SourceMgr.getIncludeLoc(Loc);
1090
1091 // __INCLUDE_LEVEL__ expands to a simple numeric value.
1092 sprintf(TmpBuffer, "%u", Depth);
1093 unsigned Length = strlen(TmpBuffer);
1094 Tok.setKind(tok::numeric_constant);
1095 Tok.setLength(Length);
1096 Tok.setLocation(CreateString(TmpBuffer, Length, Tok.getLocation()));
1097 } else if (II == Ident__TIMESTAMP__) {
1098 // MSVC, ICC, GCC, VisualAge C++ extension. The generated string should be
1099 // of the form "Ddd Mmm dd hh::mm::ss yyyy", which is returned by asctime.
1100 Diag(Tok, diag::ext_pp_timestamp);
1101
1102 // Get the file that we are lexing out of. If we're currently lexing from
1103 // a macro, dig into the include stack.
1104 const FileEntry *CurFile = 0;
1105 Lexer *TheLexer = getCurrentFileLexer();
1106
1107 if (TheLexer)
1108 CurFile = SourceMgr.getFileEntryForLoc(TheLexer->getFileLoc());
1109
1110 // If this file is older than the file it depends on, emit a diagnostic.
1111 const char *Result;
1112 if (CurFile) {
1113 time_t TT = CurFile->getModificationTime();
1114 struct tm *TM = localtime(&TT);
1115 Result = asctime(TM);
1116 } else {
1117 Result = "??? ??? ?? ??:??:?? ????\n";
1118 }
1119 TmpBuffer[0] = '"';
1120 strcpy(TmpBuffer+1, Result);
1121 unsigned Len = strlen(TmpBuffer);
1122 TmpBuffer[Len-1] = '"'; // Replace the newline with a quote.
1123 Tok.setKind(tok::string_literal);
1124 Tok.setLength(Len);
1125 Tok.setLocation(CreateString(TmpBuffer, Len, Tok.getLocation()));
1126 } else {
1127 assert(0 && "Unknown identifier!");
1128 }
1129}
1130
1131//===----------------------------------------------------------------------===//
1132// Lexer Event Handling.
1133//===----------------------------------------------------------------------===//
1134
1135/// LookUpIdentifierInfo - Given a tok::identifier token, look up the
1136/// identifier information for the token and install it into the token.
1137IdentifierInfo *Preprocessor::LookUpIdentifierInfo(Token &Identifier,
1138 const char *BufPtr) {
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001139 assert(Identifier.is(tok::identifier) && "Not an identifier!");
Chris Lattner4b009652007-07-25 00:24:17 +00001140 assert(Identifier.getIdentifierInfo() == 0 && "Identinfo already exists!");
1141
1142 // Look up this token, see if it is a macro, or if it is a language keyword.
1143 IdentifierInfo *II;
1144 if (BufPtr && !Identifier.needsCleaning()) {
1145 // No cleaning needed, just use the characters from the lexed buffer.
1146 II = getIdentifierInfo(BufPtr, BufPtr+Identifier.getLength());
1147 } else {
1148 // Cleaning needed, alloca a buffer, clean into it, then use the buffer.
1149 llvm::SmallVector<char, 64> IdentifierBuffer;
1150 IdentifierBuffer.resize(Identifier.getLength());
1151 const char *TmpBuf = &IdentifierBuffer[0];
1152 unsigned Size = getSpelling(Identifier, TmpBuf);
1153 II = getIdentifierInfo(TmpBuf, TmpBuf+Size);
1154 }
1155 Identifier.setIdentifierInfo(II);
1156 return II;
1157}
1158
1159
1160/// HandleIdentifier - This callback is invoked when the lexer reads an
1161/// identifier. This callback looks up the identifier in the map and/or
1162/// potentially macro expands it or turns it into a named token (like 'for').
1163void Preprocessor::HandleIdentifier(Token &Identifier) {
1164 assert(Identifier.getIdentifierInfo() &&
1165 "Can't handle identifiers without identifier info!");
1166
1167 IdentifierInfo &II = *Identifier.getIdentifierInfo();
1168
1169 // If this identifier was poisoned, and if it was not produced from a macro
1170 // expansion, emit an error.
1171 if (II.isPoisoned() && CurLexer) {
1172 if (&II != Ident__VA_ARGS__) // We warn about __VA_ARGS__ with poisoning.
1173 Diag(Identifier, diag::err_pp_used_poisoned_id);
1174 else
1175 Diag(Identifier, diag::ext_pp_bad_vaargs_use);
1176 }
1177
1178 // If this is a macro to be expanded, do it.
Chris Lattner7a1b0882007-10-07 08:44:20 +00001179 if (MacroInfo *MI = getMacroInfo(&II)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001180 if (!DisableMacroExpansion && !Identifier.isExpandDisabled()) {
1181 if (MI->isEnabled()) {
1182 if (!HandleMacroExpandedIdentifier(Identifier, MI))
1183 return;
1184 } else {
1185 // C99 6.10.3.4p2 says that a disabled macro may never again be
1186 // expanded, even if it's in a context where it could be expanded in the
1187 // future.
1188 Identifier.setFlag(Token::DisableExpand);
1189 }
1190 }
1191 } else if (II.isOtherTargetMacro() && !DisableMacroExpansion) {
1192 // If this identifier is a macro on some other target, emit a diagnostic.
1193 // This diagnosic is only emitted when macro expansion is enabled, because
1194 // the macro would not have been expanded for the other target either.
1195 II.setIsOtherTargetMacro(false); // Don't warn on second use.
1196 getTargetInfo().DiagnoseNonPortability(Identifier.getLocation(),
1197 diag::port_target_macro_use);
1198
1199 }
1200
1201 // C++ 2.11p2: If this is an alternative representation of a C++ operator,
1202 // then we act as if it is the actual operator and not the textual
1203 // representation of it.
1204 if (II.isCPlusPlusOperatorKeyword())
1205 Identifier.setIdentifierInfo(0);
1206
1207 // Change the kind of this identifier to the appropriate token kind, e.g.
1208 // turning "for" into a keyword.
1209 Identifier.setKind(II.getTokenID());
1210
1211 // If this is an extension token, diagnose its use.
1212 // FIXME: tried (unsuccesfully) to shut this up when compiling with gnu99
1213 // For now, I'm just commenting it out (while I work on attributes).
1214 if (II.isExtensionToken() && Features.C99)
1215 Diag(Identifier, diag::ext_token_used);
1216}
1217
1218/// HandleEndOfFile - This callback is invoked when the lexer hits the end of
1219/// the current file. This either returns the EOF token or pops a level off
1220/// the include stack and keeps going.
1221bool Preprocessor::HandleEndOfFile(Token &Result, bool isEndOfMacro) {
1222 assert(!CurMacroExpander &&
1223 "Ending a file when currently in a macro!");
1224
1225 // See if this file had a controlling macro.
1226 if (CurLexer) { // Not ending a macro, ignore it.
1227 if (const IdentifierInfo *ControllingMacro =
1228 CurLexer->MIOpt.GetControllingMacroAtEndOfFile()) {
1229 // Okay, this has a controlling macro, remember in PerFileInfo.
1230 if (const FileEntry *FE =
1231 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
1232 HeaderInfo.SetFileControllingMacro(FE, ControllingMacro);
1233 }
1234 }
1235
1236 // If this is a #include'd file, pop it off the include stack and continue
1237 // lexing the #includer file.
1238 if (!IncludeMacroStack.empty()) {
1239 // We're done with the #included file.
1240 RemoveTopOfLexerStack();
1241
1242 // Notify the client, if desired, that we are in a new source file.
1243 if (Callbacks && !isEndOfMacro && CurLexer) {
1244 DirectoryLookup::DirType FileType = DirectoryLookup::NormalHeaderDir;
1245
1246 // Get the file entry for the current file.
1247 if (const FileEntry *FE =
1248 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
1249 FileType = HeaderInfo.getFileDirFlavor(FE);
1250
1251 Callbacks->FileChanged(CurLexer->getSourceLocation(CurLexer->BufferPtr),
1252 PPCallbacks::ExitFile, FileType);
1253 }
1254
1255 // Client should lex another token.
1256 return false;
1257 }
1258
1259 Result.startToken();
1260 CurLexer->BufferPtr = CurLexer->BufferEnd;
1261 CurLexer->FormTokenWithChars(Result, CurLexer->BufferEnd);
1262 Result.setKind(tok::eof);
1263
1264 // We're done with the #included file.
1265 delete CurLexer;
1266 CurLexer = 0;
1267
1268 // This is the end of the top-level file. If the diag::pp_macro_not_used
Chris Lattner7a1b0882007-10-07 08:44:20 +00001269 // diagnostic is enabled, look for macros that have not been used.
Chris Lattner4b009652007-07-25 00:24:17 +00001270 if (Diags.getDiagnosticLevel(diag::pp_macro_not_used) != Diagnostic::Ignored){
Chris Lattner7a1b0882007-10-07 08:44:20 +00001271 for (llvm::DenseMap<IdentifierInfo*, MacroInfo*>::iterator I =
1272 Macros.begin(), E = Macros.end(); I != E; ++I) {
1273 if (!I->second->isUsed())
1274 Diag(I->second->getDefinitionLoc(), diag::pp_macro_not_used);
Chris Lattner4b009652007-07-25 00:24:17 +00001275 }
1276 }
Chris Lattner4b009652007-07-25 00:24:17 +00001277 return true;
1278}
1279
1280/// HandleEndOfMacro - This callback is invoked when the lexer hits the end of
1281/// the current macro expansion or token stream expansion.
1282bool Preprocessor::HandleEndOfMacro(Token &Result) {
1283 assert(CurMacroExpander && !CurLexer &&
1284 "Ending a macro when currently in a #include file!");
1285
1286 // Delete or cache the now-dead macro expander.
1287 if (NumCachedMacroExpanders == MacroExpanderCacheSize)
1288 delete CurMacroExpander;
1289 else
1290 MacroExpanderCache[NumCachedMacroExpanders++] = CurMacroExpander;
1291
1292 // Handle this like a #include file being popped off the stack.
1293 CurMacroExpander = 0;
1294 return HandleEndOfFile(Result, true);
1295}
1296
1297
1298//===----------------------------------------------------------------------===//
1299// Utility Methods for Preprocessor Directive Handling.
1300//===----------------------------------------------------------------------===//
1301
1302/// DiscardUntilEndOfDirective - Read and discard all tokens remaining on the
1303/// current line until the tok::eom token is found.
1304void Preprocessor::DiscardUntilEndOfDirective() {
1305 Token Tmp;
1306 do {
1307 LexUnexpandedToken(Tmp);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001308 } while (Tmp.isNot(tok::eom));
Chris Lattner4b009652007-07-25 00:24:17 +00001309}
1310
1311/// isCXXNamedOperator - Returns "true" if the token is a named operator in C++.
1312static bool isCXXNamedOperator(const std::string &Spelling) {
1313 return Spelling == "and" || Spelling == "bitand" || Spelling == "bitor" ||
1314 Spelling == "compl" || Spelling == "not" || Spelling == "not_eq" ||
1315 Spelling == "or" || Spelling == "xor";
1316}
1317
1318/// ReadMacroName - Lex and validate a macro name, which occurs after a
1319/// #define or #undef. This sets the token kind to eom and discards the rest
1320/// of the macro line if the macro name is invalid. isDefineUndef is 1 if
1321/// this is due to a a #define, 2 if #undef directive, 0 if it is something
1322/// else (e.g. #ifdef).
1323void Preprocessor::ReadMacroName(Token &MacroNameTok, char isDefineUndef) {
1324 // Read the token, don't allow macro expansion on it.
1325 LexUnexpandedToken(MacroNameTok);
1326
1327 // Missing macro name?
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001328 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00001329 return Diag(MacroNameTok, diag::err_pp_missing_macro_name);
1330
1331 IdentifierInfo *II = MacroNameTok.getIdentifierInfo();
1332 if (II == 0) {
1333 std::string Spelling = getSpelling(MacroNameTok);
1334 if (isCXXNamedOperator(Spelling))
1335 // C++ 2.5p2: Alternative tokens behave the same as its primary token
1336 // except for their spellings.
1337 Diag(MacroNameTok, diag::err_pp_operator_used_as_macro_name, Spelling);
1338 else
1339 Diag(MacroNameTok, diag::err_pp_macro_not_identifier);
1340 // Fall through on error.
1341 } else if (isDefineUndef && II->getPPKeywordID() == tok::pp_defined) {
1342 // Error if defining "defined": C99 6.10.8.4.
1343 Diag(MacroNameTok, diag::err_defined_macro_name);
Chris Lattner3b56a012007-10-07 08:04:56 +00001344 } else if (isDefineUndef && II->hasMacroDefinition() &&
Chris Lattner7a1b0882007-10-07 08:44:20 +00001345 getMacroInfo(II)->isBuiltinMacro()) {
Chris Lattner4b009652007-07-25 00:24:17 +00001346 // Error if defining "__LINE__" and other builtins: C99 6.10.8.4.
1347 if (isDefineUndef == 1)
1348 Diag(MacroNameTok, diag::pp_redef_builtin_macro);
1349 else
1350 Diag(MacroNameTok, diag::pp_undef_builtin_macro);
1351 } else {
1352 // Okay, we got a good identifier node. Return it.
1353 return;
1354 }
1355
1356 // Invalid macro name, read and discard the rest of the line. Then set the
1357 // token kind to tok::eom.
1358 MacroNameTok.setKind(tok::eom);
1359 return DiscardUntilEndOfDirective();
1360}
1361
1362/// CheckEndOfDirective - Ensure that the next token is a tok::eom token. If
1363/// not, emit a diagnostic and consume up until the eom.
1364void Preprocessor::CheckEndOfDirective(const char *DirType) {
1365 Token Tmp;
1366 Lex(Tmp);
1367 // There should be no tokens after the directive, but we allow them as an
1368 // extension.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001369 while (Tmp.is(tok::comment)) // Skip comments in -C mode.
Chris Lattner4b009652007-07-25 00:24:17 +00001370 Lex(Tmp);
1371
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001372 if (Tmp.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001373 Diag(Tmp, diag::ext_pp_extra_tokens_at_eol, DirType);
1374 DiscardUntilEndOfDirective();
1375 }
1376}
1377
1378
1379
1380/// SkipExcludedConditionalBlock - We just read a #if or related directive and
1381/// decided that the subsequent tokens are in the #if'd out portion of the
1382/// file. Lex the rest of the file, until we see an #endif. If
1383/// FoundNonSkipPortion is true, then we have already emitted code for part of
1384/// this #if directive, so #else/#elif blocks should never be entered. If ElseOk
1385/// is true, then #else directives are ok, if not, then we have already seen one
1386/// so a #else directive is a duplicate. When this returns, the caller can lex
1387/// the first valid token.
1388void Preprocessor::SkipExcludedConditionalBlock(SourceLocation IfTokenLoc,
1389 bool FoundNonSkipPortion,
1390 bool FoundElse) {
1391 ++NumSkipped;
1392 assert(CurMacroExpander == 0 && CurLexer &&
1393 "Lexing a macro, not a file?");
1394
1395 CurLexer->pushConditionalLevel(IfTokenLoc, /*isSkipping*/false,
1396 FoundNonSkipPortion, FoundElse);
1397
1398 // Enter raw mode to disable identifier lookup (and thus macro expansion),
1399 // disabling warnings, etc.
1400 CurLexer->LexingRawMode = true;
1401 Token Tok;
1402 while (1) {
1403 CurLexer->Lex(Tok);
1404
1405 // If this is the end of the buffer, we have an error.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001406 if (Tok.is(tok::eof)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001407 // Emit errors for each unterminated conditional on the stack, including
1408 // the current one.
1409 while (!CurLexer->ConditionalStack.empty()) {
1410 Diag(CurLexer->ConditionalStack.back().IfLoc,
1411 diag::err_pp_unterminated_conditional);
1412 CurLexer->ConditionalStack.pop_back();
1413 }
1414
1415 // Just return and let the caller lex after this #include.
1416 break;
1417 }
1418
1419 // If this token is not a preprocessor directive, just skip it.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001420 if (Tok.isNot(tok::hash) || !Tok.isAtStartOfLine())
Chris Lattner4b009652007-07-25 00:24:17 +00001421 continue;
1422
1423 // We just parsed a # character at the start of a line, so we're in
1424 // directive mode. Tell the lexer this so any newlines we see will be
1425 // converted into an EOM token (this terminates the macro).
1426 CurLexer->ParsingPreprocessorDirective = true;
1427 CurLexer->KeepCommentMode = false;
1428
1429
1430 // Read the next token, the directive flavor.
1431 LexUnexpandedToken(Tok);
1432
1433 // If this isn't an identifier directive (e.g. is "# 1\n" or "#\n", or
1434 // something bogus), skip it.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001435 if (Tok.isNot(tok::identifier)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001436 CurLexer->ParsingPreprocessorDirective = false;
1437 // Restore comment saving mode.
1438 CurLexer->KeepCommentMode = KeepComments;
1439 continue;
1440 }
1441
1442 // If the first letter isn't i or e, it isn't intesting to us. We know that
1443 // this is safe in the face of spelling differences, because there is no way
1444 // to spell an i/e in a strange way that is another letter. Skipping this
1445 // allows us to avoid looking up the identifier info for #define/#undef and
1446 // other common directives.
1447 const char *RawCharData = SourceMgr.getCharacterData(Tok.getLocation());
1448 char FirstChar = RawCharData[0];
1449 if (FirstChar >= 'a' && FirstChar <= 'z' &&
1450 FirstChar != 'i' && FirstChar != 'e') {
1451 CurLexer->ParsingPreprocessorDirective = false;
1452 // Restore comment saving mode.
1453 CurLexer->KeepCommentMode = KeepComments;
1454 continue;
1455 }
1456
1457 // Get the identifier name without trigraphs or embedded newlines. Note
1458 // that we can't use Tok.getIdentifierInfo() because its lookup is disabled
1459 // when skipping.
1460 // TODO: could do this with zero copies in the no-clean case by using
1461 // strncmp below.
1462 char Directive[20];
1463 unsigned IdLen;
1464 if (!Tok.needsCleaning() && Tok.getLength() < 20) {
1465 IdLen = Tok.getLength();
1466 memcpy(Directive, RawCharData, IdLen);
1467 Directive[IdLen] = 0;
1468 } else {
1469 std::string DirectiveStr = getSpelling(Tok);
1470 IdLen = DirectiveStr.size();
1471 if (IdLen >= 20) {
1472 CurLexer->ParsingPreprocessorDirective = false;
1473 // Restore comment saving mode.
1474 CurLexer->KeepCommentMode = KeepComments;
1475 continue;
1476 }
1477 memcpy(Directive, &DirectiveStr[0], IdLen);
1478 Directive[IdLen] = 0;
1479 }
1480
1481 if (FirstChar == 'i' && Directive[1] == 'f') {
1482 if ((IdLen == 2) || // "if"
1483 (IdLen == 5 && !strcmp(Directive+2, "def")) || // "ifdef"
1484 (IdLen == 6 && !strcmp(Directive+2, "ndef"))) { // "ifndef"
1485 // We know the entire #if/#ifdef/#ifndef block will be skipped, don't
1486 // bother parsing the condition.
1487 DiscardUntilEndOfDirective();
1488 CurLexer->pushConditionalLevel(Tok.getLocation(), /*wasskipping*/true,
1489 /*foundnonskip*/false,
1490 /*fnddelse*/false);
1491 }
1492 } else if (FirstChar == 'e') {
1493 if (IdLen == 5 && !strcmp(Directive+1, "ndif")) { // "endif"
1494 CheckEndOfDirective("#endif");
1495 PPConditionalInfo CondInfo;
1496 CondInfo.WasSkipping = true; // Silence bogus warning.
1497 bool InCond = CurLexer->popConditionalLevel(CondInfo);
1498 InCond = InCond; // Silence warning in no-asserts mode.
1499 assert(!InCond && "Can't be skipping if not in a conditional!");
1500
1501 // If we popped the outermost skipping block, we're done skipping!
1502 if (!CondInfo.WasSkipping)
1503 break;
1504 } else if (IdLen == 4 && !strcmp(Directive+1, "lse")) { // "else".
1505 // #else directive in a skipping conditional. If not in some other
1506 // skipping conditional, and if #else hasn't already been seen, enter it
1507 // as a non-skipping conditional.
1508 CheckEndOfDirective("#else");
1509 PPConditionalInfo &CondInfo = CurLexer->peekConditionalLevel();
1510
1511 // If this is a #else with a #else before it, report the error.
1512 if (CondInfo.FoundElse) Diag(Tok, diag::pp_err_else_after_else);
1513
1514 // Note that we've seen a #else in this conditional.
1515 CondInfo.FoundElse = true;
1516
1517 // If the conditional is at the top level, and the #if block wasn't
1518 // entered, enter the #else block now.
1519 if (!CondInfo.WasSkipping && !CondInfo.FoundNonSkip) {
1520 CondInfo.FoundNonSkip = true;
1521 break;
1522 }
1523 } else if (IdLen == 4 && !strcmp(Directive+1, "lif")) { // "elif".
1524 PPConditionalInfo &CondInfo = CurLexer->peekConditionalLevel();
1525
1526 bool ShouldEnter;
1527 // If this is in a skipping block or if we're already handled this #if
1528 // block, don't bother parsing the condition.
1529 if (CondInfo.WasSkipping || CondInfo.FoundNonSkip) {
1530 DiscardUntilEndOfDirective();
1531 ShouldEnter = false;
1532 } else {
1533 // Restore the value of LexingRawMode so that identifiers are
1534 // looked up, etc, inside the #elif expression.
1535 assert(CurLexer->LexingRawMode && "We have to be skipping here!");
1536 CurLexer->LexingRawMode = false;
1537 IdentifierInfo *IfNDefMacro = 0;
1538 ShouldEnter = EvaluateDirectiveExpression(IfNDefMacro);
1539 CurLexer->LexingRawMode = true;
1540 }
1541
1542 // If this is a #elif with a #else before it, report the error.
1543 if (CondInfo.FoundElse) Diag(Tok, diag::pp_err_elif_after_else);
1544
1545 // If this condition is true, enter it!
1546 if (ShouldEnter) {
1547 CondInfo.FoundNonSkip = true;
1548 break;
1549 }
1550 }
1551 }
1552
1553 CurLexer->ParsingPreprocessorDirective = false;
1554 // Restore comment saving mode.
1555 CurLexer->KeepCommentMode = KeepComments;
1556 }
1557
1558 // Finally, if we are out of the conditional (saw an #endif or ran off the end
1559 // of the file, just stop skipping and return to lexing whatever came after
1560 // the #if block.
1561 CurLexer->LexingRawMode = false;
1562}
1563
1564//===----------------------------------------------------------------------===//
1565// Preprocessor Directive Handling.
1566//===----------------------------------------------------------------------===//
1567
1568/// HandleDirective - This callback is invoked when the lexer sees a # token
1569/// at the start of a line. This consumes the directive, modifies the
1570/// lexer/preprocessor state, and advances the lexer(s) so that the next token
1571/// read is the correct one.
1572void Preprocessor::HandleDirective(Token &Result) {
1573 // FIXME: Traditional: # with whitespace before it not recognized by K&R?
1574
1575 // We just parsed a # character at the start of a line, so we're in directive
1576 // mode. Tell the lexer this so any newlines we see will be converted into an
1577 // EOM token (which terminates the directive).
1578 CurLexer->ParsingPreprocessorDirective = true;
1579
1580 ++NumDirectives;
1581
1582 // We are about to read a token. For the multiple-include optimization FA to
1583 // work, we have to remember if we had read any tokens *before* this
1584 // pp-directive.
1585 bool ReadAnyTokensBeforeDirective = CurLexer->MIOpt.getHasReadAnyTokensVal();
1586
1587 // Read the next token, the directive flavor. This isn't expanded due to
1588 // C99 6.10.3p8.
1589 LexUnexpandedToken(Result);
1590
1591 // C99 6.10.3p11: Is this preprocessor directive in macro invocation? e.g.:
1592 // #define A(x) #x
1593 // A(abc
1594 // #warning blah
1595 // def)
1596 // If so, the user is relying on non-portable behavior, emit a diagnostic.
1597 if (InMacroArgs)
1598 Diag(Result, diag::ext_embedded_directive);
1599
1600TryAgain:
1601 switch (Result.getKind()) {
1602 case tok::eom:
1603 return; // null directive.
1604 case tok::comment:
1605 // Handle stuff like "# /*foo*/ define X" in -E -C mode.
1606 LexUnexpandedToken(Result);
1607 goto TryAgain;
1608
1609 case tok::numeric_constant:
1610 // FIXME: implement # 7 line numbers!
1611 DiscardUntilEndOfDirective();
1612 return;
1613 default:
1614 IdentifierInfo *II = Result.getIdentifierInfo();
1615 if (II == 0) break; // Not an identifier.
1616
1617 // Ask what the preprocessor keyword ID is.
1618 switch (II->getPPKeywordID()) {
1619 default: break;
1620 // C99 6.10.1 - Conditional Inclusion.
1621 case tok::pp_if:
1622 return HandleIfDirective(Result, ReadAnyTokensBeforeDirective);
1623 case tok::pp_ifdef:
1624 return HandleIfdefDirective(Result, false, true/*not valid for miopt*/);
1625 case tok::pp_ifndef:
1626 return HandleIfdefDirective(Result, true, ReadAnyTokensBeforeDirective);
1627 case tok::pp_elif:
1628 return HandleElifDirective(Result);
1629 case tok::pp_else:
1630 return HandleElseDirective(Result);
1631 case tok::pp_endif:
1632 return HandleEndifDirective(Result);
1633
1634 // C99 6.10.2 - Source File Inclusion.
1635 case tok::pp_include:
1636 return HandleIncludeDirective(Result); // Handle #include.
1637
1638 // C99 6.10.3 - Macro Replacement.
1639 case tok::pp_define:
1640 return HandleDefineDirective(Result, false);
1641 case tok::pp_undef:
1642 return HandleUndefDirective(Result);
1643
1644 // C99 6.10.4 - Line Control.
1645 case tok::pp_line:
1646 // FIXME: implement #line
1647 DiscardUntilEndOfDirective();
1648 return;
1649
1650 // C99 6.10.5 - Error Directive.
1651 case tok::pp_error:
1652 return HandleUserDiagnosticDirective(Result, false);
1653
1654 // C99 6.10.6 - Pragma Directive.
1655 case tok::pp_pragma:
1656 return HandlePragmaDirective();
1657
1658 // GNU Extensions.
1659 case tok::pp_import:
1660 return HandleImportDirective(Result);
1661 case tok::pp_include_next:
1662 return HandleIncludeNextDirective(Result);
1663
1664 case tok::pp_warning:
1665 Diag(Result, diag::ext_pp_warning_directive);
1666 return HandleUserDiagnosticDirective(Result, true);
1667 case tok::pp_ident:
1668 return HandleIdentSCCSDirective(Result);
1669 case tok::pp_sccs:
1670 return HandleIdentSCCSDirective(Result);
1671 case tok::pp_assert:
1672 //isExtension = true; // FIXME: implement #assert
1673 break;
1674 case tok::pp_unassert:
1675 //isExtension = true; // FIXME: implement #unassert
1676 break;
1677
1678 // clang extensions.
1679 case tok::pp_define_target:
1680 return HandleDefineDirective(Result, true);
1681 case tok::pp_define_other_target:
1682 return HandleDefineOtherTargetDirective(Result);
1683 }
1684 break;
1685 }
1686
1687 // If we reached here, the preprocessing token is not valid!
1688 Diag(Result, diag::err_pp_invalid_directive);
1689
1690 // Read the rest of the PP line.
1691 DiscardUntilEndOfDirective();
1692
1693 // Okay, we're done parsing the directive.
1694}
1695
1696void Preprocessor::HandleUserDiagnosticDirective(Token &Tok,
1697 bool isWarning) {
1698 // Read the rest of the line raw. We do this because we don't want macros
1699 // to be expanded and we don't require that the tokens be valid preprocessing
1700 // tokens. For example, this is allowed: "#warning ` 'foo". GCC does
1701 // collapse multiple consequtive white space between tokens, but this isn't
1702 // specified by the standard.
1703 std::string Message = CurLexer->ReadToEndOfLine();
1704
1705 unsigned DiagID = isWarning ? diag::pp_hash_warning : diag::err_pp_hash_error;
1706 return Diag(Tok, DiagID, Message);
1707}
1708
1709/// HandleIdentSCCSDirective - Handle a #ident/#sccs directive.
1710///
1711void Preprocessor::HandleIdentSCCSDirective(Token &Tok) {
1712 // Yes, this directive is an extension.
1713 Diag(Tok, diag::ext_pp_ident_directive);
1714
1715 // Read the string argument.
1716 Token StrTok;
1717 Lex(StrTok);
1718
1719 // If the token kind isn't a string, it's a malformed directive.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001720 if (StrTok.isNot(tok::string_literal) &&
1721 StrTok.isNot(tok::wide_string_literal))
Chris Lattner4b009652007-07-25 00:24:17 +00001722 return Diag(StrTok, diag::err_pp_malformed_ident);
1723
1724 // Verify that there is nothing after the string, other than EOM.
1725 CheckEndOfDirective("#ident");
1726
1727 if (Callbacks)
1728 Callbacks->Ident(Tok.getLocation(), getSpelling(StrTok));
1729}
1730
1731//===----------------------------------------------------------------------===//
1732// Preprocessor Include Directive Handling.
1733//===----------------------------------------------------------------------===//
1734
1735/// GetIncludeFilenameSpelling - Turn the specified lexer token into a fully
1736/// checked and spelled filename, e.g. as an operand of #include. This returns
1737/// true if the input filename was in <>'s or false if it were in ""'s. The
1738/// caller is expected to provide a buffer that is large enough to hold the
1739/// spelling of the filename, but is also expected to handle the case when
1740/// this method decides to use a different buffer.
1741bool Preprocessor::GetIncludeFilenameSpelling(SourceLocation Loc,
1742 const char *&BufStart,
1743 const char *&BufEnd) {
1744 // Get the text form of the filename.
1745 assert(BufStart != BufEnd && "Can't have tokens with empty spellings!");
1746
1747 // Make sure the filename is <x> or "x".
1748 bool isAngled;
1749 if (BufStart[0] == '<') {
1750 if (BufEnd[-1] != '>') {
1751 Diag(Loc, diag::err_pp_expects_filename);
1752 BufStart = 0;
1753 return true;
1754 }
1755 isAngled = true;
1756 } else if (BufStart[0] == '"') {
1757 if (BufEnd[-1] != '"') {
1758 Diag(Loc, diag::err_pp_expects_filename);
1759 BufStart = 0;
1760 return true;
1761 }
1762 isAngled = false;
1763 } else {
1764 Diag(Loc, diag::err_pp_expects_filename);
1765 BufStart = 0;
1766 return true;
1767 }
1768
1769 // Diagnose #include "" as invalid.
1770 if (BufEnd-BufStart <= 2) {
1771 Diag(Loc, diag::err_pp_empty_filename);
1772 BufStart = 0;
1773 return "";
1774 }
1775
1776 // Skip the brackets.
1777 ++BufStart;
1778 --BufEnd;
1779 return isAngled;
1780}
1781
1782/// ConcatenateIncludeName - Handle cases where the #include name is expanded
1783/// from a macro as multiple tokens, which need to be glued together. This
1784/// occurs for code like:
1785/// #define FOO <a/b.h>
1786/// #include FOO
1787/// because in this case, "<a/b.h>" is returned as 7 tokens, not one.
1788///
1789/// This code concatenates and consumes tokens up to the '>' token. It returns
1790/// false if the > was found, otherwise it returns true if it finds and consumes
1791/// the EOM marker.
1792static bool ConcatenateIncludeName(llvm::SmallVector<char, 128> &FilenameBuffer,
1793 Preprocessor &PP) {
1794 Token CurTok;
1795
1796 PP.Lex(CurTok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001797 while (CurTok.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001798 // Append the spelling of this token to the buffer. If there was a space
1799 // before it, add it now.
1800 if (CurTok.hasLeadingSpace())
1801 FilenameBuffer.push_back(' ');
1802
1803 // Get the spelling of the token, directly into FilenameBuffer if possible.
1804 unsigned PreAppendSize = FilenameBuffer.size();
1805 FilenameBuffer.resize(PreAppendSize+CurTok.getLength());
1806
1807 const char *BufPtr = &FilenameBuffer[PreAppendSize];
1808 unsigned ActualLen = PP.getSpelling(CurTok, BufPtr);
1809
1810 // If the token was spelled somewhere else, copy it into FilenameBuffer.
1811 if (BufPtr != &FilenameBuffer[PreAppendSize])
1812 memcpy(&FilenameBuffer[PreAppendSize], BufPtr, ActualLen);
1813
1814 // Resize FilenameBuffer to the correct size.
1815 if (CurTok.getLength() != ActualLen)
1816 FilenameBuffer.resize(PreAppendSize+ActualLen);
1817
1818 // If we found the '>' marker, return success.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001819 if (CurTok.is(tok::greater))
Chris Lattner4b009652007-07-25 00:24:17 +00001820 return false;
1821
1822 PP.Lex(CurTok);
1823 }
1824
1825 // If we hit the eom marker, emit an error and return true so that the caller
1826 // knows the EOM has been read.
1827 PP.Diag(CurTok.getLocation(), diag::err_pp_expects_filename);
1828 return true;
1829}
1830
1831/// HandleIncludeDirective - The "#include" tokens have just been read, read the
1832/// file to be included from the lexer, then include it! This is a common
1833/// routine with functionality shared between #include, #include_next and
1834/// #import.
1835void Preprocessor::HandleIncludeDirective(Token &IncludeTok,
1836 const DirectoryLookup *LookupFrom,
1837 bool isImport) {
1838
1839 Token FilenameTok;
1840 CurLexer->LexIncludeFilename(FilenameTok);
1841
1842 // Reserve a buffer to get the spelling.
1843 llvm::SmallVector<char, 128> FilenameBuffer;
1844 const char *FilenameStart, *FilenameEnd;
1845
1846 switch (FilenameTok.getKind()) {
1847 case tok::eom:
1848 // If the token kind is EOM, the error has already been diagnosed.
1849 return;
1850
1851 case tok::angle_string_literal:
1852 case tok::string_literal: {
1853 FilenameBuffer.resize(FilenameTok.getLength());
1854 FilenameStart = &FilenameBuffer[0];
1855 unsigned Len = getSpelling(FilenameTok, FilenameStart);
1856 FilenameEnd = FilenameStart+Len;
1857 break;
1858 }
1859
1860 case tok::less:
1861 // This could be a <foo/bar.h> file coming from a macro expansion. In this
1862 // case, glue the tokens together into FilenameBuffer and interpret those.
1863 FilenameBuffer.push_back('<');
1864 if (ConcatenateIncludeName(FilenameBuffer, *this))
1865 return; // Found <eom> but no ">"? Diagnostic already emitted.
1866 FilenameStart = &FilenameBuffer[0];
1867 FilenameEnd = &FilenameBuffer[FilenameBuffer.size()];
1868 break;
1869 default:
1870 Diag(FilenameTok.getLocation(), diag::err_pp_expects_filename);
1871 DiscardUntilEndOfDirective();
1872 return;
1873 }
1874
1875 bool isAngled = GetIncludeFilenameSpelling(FilenameTok.getLocation(),
1876 FilenameStart, FilenameEnd);
1877 // If GetIncludeFilenameSpelling set the start ptr to null, there was an
1878 // error.
1879 if (FilenameStart == 0) {
1880 DiscardUntilEndOfDirective();
1881 return;
1882 }
1883
1884 // Verify that there is nothing after the filename, other than EOM. Use the
1885 // preprocessor to lex this in case lexing the filename entered a macro.
1886 CheckEndOfDirective("#include");
1887
1888 // Check that we don't have infinite #include recursion.
1889 if (IncludeMacroStack.size() == MaxAllowedIncludeStackDepth-1)
1890 return Diag(FilenameTok, diag::err_pp_include_too_deep);
1891
1892 // Search include directories.
1893 const DirectoryLookup *CurDir;
1894 const FileEntry *File = LookupFile(FilenameStart, FilenameEnd,
1895 isAngled, LookupFrom, CurDir);
1896 if (File == 0)
1897 return Diag(FilenameTok, diag::err_pp_file_not_found,
1898 std::string(FilenameStart, FilenameEnd));
1899
1900 // Ask HeaderInfo if we should enter this #include file.
1901 if (!HeaderInfo.ShouldEnterIncludeFile(File, isImport)) {
1902 // If it returns true, #including this file will have no effect.
1903 return;
1904 }
1905
1906 // Look up the file, create a File ID for it.
1907 unsigned FileID = SourceMgr.createFileID(File, FilenameTok.getLocation());
1908 if (FileID == 0)
1909 return Diag(FilenameTok, diag::err_pp_file_not_found,
1910 std::string(FilenameStart, FilenameEnd));
1911
1912 // Finally, if all is good, enter the new file!
1913 EnterSourceFile(FileID, CurDir);
1914}
1915
1916/// HandleIncludeNextDirective - Implements #include_next.
1917///
1918void Preprocessor::HandleIncludeNextDirective(Token &IncludeNextTok) {
1919 Diag(IncludeNextTok, diag::ext_pp_include_next_directive);
1920
1921 // #include_next is like #include, except that we start searching after
1922 // the current found directory. If we can't do this, issue a
1923 // diagnostic.
1924 const DirectoryLookup *Lookup = CurDirLookup;
1925 if (isInPrimaryFile()) {
1926 Lookup = 0;
1927 Diag(IncludeNextTok, diag::pp_include_next_in_primary);
1928 } else if (Lookup == 0) {
1929 Diag(IncludeNextTok, diag::pp_include_next_absolute_path);
1930 } else {
1931 // Start looking up in the next directory.
1932 ++Lookup;
1933 }
1934
1935 return HandleIncludeDirective(IncludeNextTok, Lookup);
1936}
1937
1938/// HandleImportDirective - Implements #import.
1939///
1940void Preprocessor::HandleImportDirective(Token &ImportTok) {
1941 Diag(ImportTok, diag::ext_pp_import_directive);
1942
1943 return HandleIncludeDirective(ImportTok, 0, true);
1944}
1945
1946//===----------------------------------------------------------------------===//
1947// Preprocessor Macro Directive Handling.
1948//===----------------------------------------------------------------------===//
1949
1950/// ReadMacroDefinitionArgList - The ( starting an argument list of a macro
1951/// definition has just been read. Lex the rest of the arguments and the
1952/// closing ), updating MI with what we learn. Return true if an error occurs
1953/// parsing the arg list.
1954bool Preprocessor::ReadMacroDefinitionArgList(MacroInfo *MI) {
1955 llvm::SmallVector<IdentifierInfo*, 32> Arguments;
1956
1957 Token Tok;
1958 while (1) {
1959 LexUnexpandedToken(Tok);
1960 switch (Tok.getKind()) {
1961 case tok::r_paren:
1962 // Found the end of the argument list.
1963 if (Arguments.empty()) { // #define FOO()
1964 MI->setArgumentList(Arguments.begin(), Arguments.end());
1965 return false;
1966 }
1967 // Otherwise we have #define FOO(A,)
1968 Diag(Tok, diag::err_pp_expected_ident_in_arg_list);
1969 return true;
1970 case tok::ellipsis: // #define X(... -> C99 varargs
1971 // Warn if use of C99 feature in non-C99 mode.
1972 if (!Features.C99) Diag(Tok, diag::ext_variadic_macro);
1973
1974 // Lex the token after the identifier.
1975 LexUnexpandedToken(Tok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00001976 if (Tok.isNot(tok::r_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +00001977 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
1978 return true;
1979 }
1980 // Add the __VA_ARGS__ identifier as an argument.
1981 Arguments.push_back(Ident__VA_ARGS__);
1982 MI->setIsC99Varargs();
1983 MI->setArgumentList(Arguments.begin(), Arguments.end());
1984 return false;
1985 case tok::eom: // #define X(
1986 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
1987 return true;
1988 default:
1989 // Handle keywords and identifiers here to accept things like
1990 // #define Foo(for) for.
1991 IdentifierInfo *II = Tok.getIdentifierInfo();
1992 if (II == 0) {
1993 // #define X(1
1994 Diag(Tok, diag::err_pp_invalid_tok_in_arg_list);
1995 return true;
1996 }
1997
1998 // If this is already used as an argument, it is used multiple times (e.g.
1999 // #define X(A,A.
2000 if (std::find(Arguments.begin(), Arguments.end(), II) !=
2001 Arguments.end()) { // C99 6.10.3p6
2002 Diag(Tok, diag::err_pp_duplicate_name_in_arg_list, II->getName());
2003 return true;
2004 }
2005
2006 // Add the argument to the macro info.
2007 Arguments.push_back(II);
2008
2009 // Lex the token after the identifier.
2010 LexUnexpandedToken(Tok);
2011
2012 switch (Tok.getKind()) {
2013 default: // #define X(A B
2014 Diag(Tok, diag::err_pp_expected_comma_in_arg_list);
2015 return true;
2016 case tok::r_paren: // #define X(A)
2017 MI->setArgumentList(Arguments.begin(), Arguments.end());
2018 return false;
2019 case tok::comma: // #define X(A,
2020 break;
2021 case tok::ellipsis: // #define X(A... -> GCC extension
2022 // Diagnose extension.
2023 Diag(Tok, diag::ext_named_variadic_macro);
2024
2025 // Lex the token after the identifier.
2026 LexUnexpandedToken(Tok);
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002027 if (Tok.isNot(tok::r_paren)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002028 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2029 return true;
2030 }
2031
2032 MI->setIsGNUVarargs();
2033 MI->setArgumentList(Arguments.begin(), Arguments.end());
2034 return false;
2035 }
2036 }
2037 }
2038}
2039
2040/// HandleDefineDirective - Implements #define. This consumes the entire macro
2041/// line then lets the caller lex the next real token. If 'isTargetSpecific' is
2042/// true, then this is a "#define_target", otherwise this is a "#define".
2043///
2044void Preprocessor::HandleDefineDirective(Token &DefineTok,
2045 bool isTargetSpecific) {
2046 ++NumDefined;
2047
2048 Token MacroNameTok;
2049 ReadMacroName(MacroNameTok, 1);
2050
2051 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002052 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00002053 return;
2054
2055 // If we are supposed to keep comments in #defines, reenable comment saving
2056 // mode.
2057 CurLexer->KeepCommentMode = KeepMacroComments;
2058
2059 // Create the new macro.
2060 MacroInfo *MI = new MacroInfo(MacroNameTok.getLocation());
2061 if (isTargetSpecific) MI->setIsTargetSpecific();
2062
2063 // If the identifier is an 'other target' macro, clear this bit.
2064 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro(false);
2065
2066
2067 Token Tok;
2068 LexUnexpandedToken(Tok);
2069
2070 // If this is a function-like macro definition, parse the argument list,
2071 // marking each of the identifiers as being used as macro arguments. Also,
2072 // check other constraints on the first token of the macro body.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002073 if (Tok.is(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002074 // If there is no body to this macro, we have no special handling here.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002075 } else if (Tok.is(tok::l_paren) && !Tok.hasLeadingSpace()) {
Chris Lattner4b009652007-07-25 00:24:17 +00002076 // This is a function-like macro definition. Read the argument list.
2077 MI->setIsFunctionLike();
2078 if (ReadMacroDefinitionArgList(MI)) {
2079 // Forget about MI.
2080 delete MI;
2081 // Throw away the rest of the line.
2082 if (CurLexer->ParsingPreprocessorDirective)
2083 DiscardUntilEndOfDirective();
2084 return;
2085 }
2086
2087 // Read the first token after the arg list for down below.
2088 LexUnexpandedToken(Tok);
2089 } else if (!Tok.hasLeadingSpace()) {
2090 // C99 requires whitespace between the macro definition and the body. Emit
2091 // a diagnostic for something like "#define X+".
2092 if (Features.C99) {
2093 Diag(Tok, diag::ext_c99_whitespace_required_after_macro_name);
2094 } else {
2095 // FIXME: C90/C++ do not get this diagnostic, but it does get a similar
2096 // one in some cases!
2097 }
2098 } else {
2099 // This is a normal token with leading space. Clear the leading space
2100 // marker on the first token to get proper expansion.
2101 Tok.clearFlag(Token::LeadingSpace);
2102 }
2103
2104 // If this is a definition of a variadic C99 function-like macro, not using
2105 // the GNU named varargs extension, enabled __VA_ARGS__.
2106
2107 // "Poison" __VA_ARGS__, which can only appear in the expansion of a macro.
2108 // This gets unpoisoned where it is allowed.
2109 assert(Ident__VA_ARGS__->isPoisoned() && "__VA_ARGS__ should be poisoned!");
2110 if (MI->isC99Varargs())
2111 Ident__VA_ARGS__->setIsPoisoned(false);
2112
2113 // Read the rest of the macro body.
2114 if (MI->isObjectLike()) {
2115 // Object-like macros are very simple, just read their body.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002116 while (Tok.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002117 MI->AddTokenToBody(Tok);
2118 // Get the next token of the macro.
2119 LexUnexpandedToken(Tok);
2120 }
2121
2122 } else {
2123 // Otherwise, read the body of a function-like macro. This has to validate
2124 // the # (stringize) operator.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002125 while (Tok.isNot(tok::eom)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002126 MI->AddTokenToBody(Tok);
2127
2128 // Check C99 6.10.3.2p1: ensure that # operators are followed by macro
2129 // parameters in function-like macro expansions.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002130 if (Tok.isNot(tok::hash)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002131 // Get the next token of the macro.
2132 LexUnexpandedToken(Tok);
2133 continue;
2134 }
2135
2136 // Get the next token of the macro.
2137 LexUnexpandedToken(Tok);
2138
2139 // Not a macro arg identifier?
2140 if (!Tok.getIdentifierInfo() ||
2141 MI->getArgumentNum(Tok.getIdentifierInfo()) == -1) {
2142 Diag(Tok, diag::err_pp_stringize_not_parameter);
2143 delete MI;
2144
2145 // Disable __VA_ARGS__ again.
2146 Ident__VA_ARGS__->setIsPoisoned(true);
2147 return;
2148 }
2149
2150 // Things look ok, add the param name token to the macro.
2151 MI->AddTokenToBody(Tok);
2152
2153 // Get the next token of the macro.
2154 LexUnexpandedToken(Tok);
2155 }
2156 }
2157
2158
2159 // Disable __VA_ARGS__ again.
2160 Ident__VA_ARGS__->setIsPoisoned(true);
2161
2162 // Check that there is no paste (##) operator at the begining or end of the
2163 // replacement list.
2164 unsigned NumTokens = MI->getNumTokens();
2165 if (NumTokens != 0) {
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002166 if (MI->getReplacementToken(0).is(tok::hashhash)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002167 Diag(MI->getReplacementToken(0), diag::err_paste_at_start);
2168 delete MI;
2169 return;
2170 }
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002171 if (MI->getReplacementToken(NumTokens-1).is(tok::hashhash)) {
Chris Lattner4b009652007-07-25 00:24:17 +00002172 Diag(MI->getReplacementToken(NumTokens-1), diag::err_paste_at_end);
2173 delete MI;
2174 return;
2175 }
2176 }
2177
2178 // If this is the primary source file, remember that this macro hasn't been
2179 // used yet.
2180 if (isInPrimaryFile())
2181 MI->setIsUsed(false);
2182
2183 // Finally, if this identifier already had a macro defined for it, verify that
2184 // the macro bodies are identical and free the old definition.
Chris Lattner7a1b0882007-10-07 08:44:20 +00002185 if (MacroInfo *OtherMI = getMacroInfo(MacroNameTok.getIdentifierInfo())) {
Chris Lattner4b009652007-07-25 00:24:17 +00002186 if (!OtherMI->isUsed())
2187 Diag(OtherMI->getDefinitionLoc(), diag::pp_macro_not_used);
2188
2189 // Macros must be identical. This means all tokes and whitespace separation
2190 // must be the same. C99 6.10.3.2.
2191 if (!MI->isIdenticalTo(*OtherMI, *this)) {
2192 Diag(MI->getDefinitionLoc(), diag::ext_pp_macro_redef,
2193 MacroNameTok.getIdentifierInfo()->getName());
2194 Diag(OtherMI->getDefinitionLoc(), diag::ext_pp_macro_redef2);
2195 }
2196 delete OtherMI;
2197 }
2198
Chris Lattner7a1b0882007-10-07 08:44:20 +00002199 setMacroInfo(MacroNameTok.getIdentifierInfo(), MI);
Chris Lattner4b009652007-07-25 00:24:17 +00002200}
2201
2202/// HandleDefineOtherTargetDirective - Implements #define_other_target.
2203void Preprocessor::HandleDefineOtherTargetDirective(Token &Tok) {
2204 Token MacroNameTok;
2205 ReadMacroName(MacroNameTok, 1);
2206
2207 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002208 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00002209 return;
2210
2211 // Check to see if this is the last token on the #undef line.
2212 CheckEndOfDirective("#define_other_target");
2213
2214 // If there is already a macro defined by this name, turn it into a
2215 // target-specific define.
Chris Lattner7a1b0882007-10-07 08:44:20 +00002216 if (MacroInfo *MI = getMacroInfo(MacroNameTok.getIdentifierInfo())) {
Chris Lattner4b009652007-07-25 00:24:17 +00002217 MI->setIsTargetSpecific(true);
2218 return;
2219 }
2220
2221 // Mark the identifier as being a macro on some other target.
2222 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro();
2223}
2224
2225
2226/// HandleUndefDirective - Implements #undef.
2227///
2228void Preprocessor::HandleUndefDirective(Token &UndefTok) {
2229 ++NumUndefined;
2230
2231 Token MacroNameTok;
2232 ReadMacroName(MacroNameTok, 2);
2233
2234 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002235 if (MacroNameTok.is(tok::eom))
Chris Lattner4b009652007-07-25 00:24:17 +00002236 return;
2237
2238 // Check to see if this is the last token on the #undef line.
2239 CheckEndOfDirective("#undef");
2240
2241 // Okay, we finally have a valid identifier to undef.
Chris Lattner7a1b0882007-10-07 08:44:20 +00002242 MacroInfo *MI = getMacroInfo(MacroNameTok.getIdentifierInfo());
Chris Lattner4b009652007-07-25 00:24:17 +00002243
2244 // #undef untaints an identifier if it were marked by define_other_target.
2245 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro(false);
2246
2247 // If the macro is not defined, this is a noop undef, just return.
2248 if (MI == 0) return;
2249
2250 if (!MI->isUsed())
2251 Diag(MI->getDefinitionLoc(), diag::pp_macro_not_used);
2252
2253 // Free macro definition.
2254 delete MI;
Chris Lattner7a1b0882007-10-07 08:44:20 +00002255 setMacroInfo(MacroNameTok.getIdentifierInfo(), 0);
Chris Lattner4b009652007-07-25 00:24:17 +00002256}
2257
2258
2259//===----------------------------------------------------------------------===//
2260// Preprocessor Conditional Directive Handling.
2261//===----------------------------------------------------------------------===//
2262
2263/// HandleIfdefDirective - Implements the #ifdef/#ifndef directive. isIfndef is
2264/// true when this is a #ifndef directive. ReadAnyTokensBeforeDirective is true
2265/// if any tokens have been returned or pp-directives activated before this
2266/// #ifndef has been lexed.
2267///
2268void Preprocessor::HandleIfdefDirective(Token &Result, bool isIfndef,
2269 bool ReadAnyTokensBeforeDirective) {
2270 ++NumIf;
2271 Token DirectiveTok = Result;
2272
2273 Token MacroNameTok;
2274 ReadMacroName(MacroNameTok);
2275
2276 // Error reading macro name? If so, diagnostic already issued.
Chris Lattnercb8e41c2007-10-09 18:02:16 +00002277 if (MacroNameTok.is(tok::eom)) {
Chris Lattnere6cdeb52007-09-24 05:14:57 +00002278 // Skip code until we get to #endif. This helps with recovery by not
2279 // emitting an error when the #endif is reached.
2280 SkipExcludedConditionalBlock(DirectiveTok.getLocation(),
2281 /*Foundnonskip*/false, /*FoundElse*/false);
Chris Lattner4b009652007-07-25 00:24:17 +00002282 return;
Chris Lattnere6cdeb52007-09-24 05:14:57 +00002283 }
Chris Lattner4b009652007-07-25 00:24:17 +00002284
2285 // Check to see if this is the last token on the #if[n]def line.
2286 CheckEndOfDirective(isIfndef ? "#ifndef" : "#ifdef");
2287
2288 // If the start of a top-level #ifdef, inform MIOpt.
2289 if (!ReadAnyTokensBeforeDirective &&
2290 CurLexer->getConditionalStackDepth() == 0) {
2291 assert(isIfndef && "#ifdef shouldn't reach here");
2292 CurLexer->MIOpt.EnterTopLevelIFNDEF(MacroNameTok.getIdentifierInfo());
2293 }
2294
2295 IdentifierInfo *MII = MacroNameTok.getIdentifierInfo();
Chris Lattner7a1b0882007-10-07 08:44:20 +00002296 MacroInfo *MI = getMacroInfo(MII);
Chris Lattner4b009652007-07-25 00:24:17 +00002297
2298 // If there is a macro, process it.
2299 if (MI) {
2300 // Mark it used.
2301 MI->setIsUsed(true);
2302
2303 // If this is the first use of a target-specific macro, warn about it.
2304 if (MI->isTargetSpecific()) {
2305 MI->setIsTargetSpecific(false); // Don't warn on second use.
2306 getTargetInfo().DiagnoseNonPortability(MacroNameTok.getLocation(),
2307 diag::port_target_macro_use);
2308 }
2309 } else {
2310 // Use of a target-specific macro for some other target? If so, warn.
2311 if (MII->isOtherTargetMacro()) {
2312 MII->setIsOtherTargetMacro(false); // Don't warn on second use.
2313 getTargetInfo().DiagnoseNonPortability(MacroNameTok.getLocation(),
2314 diag::port_target_macro_use);
2315 }
2316 }
2317
2318 // Should we include the stuff contained by this directive?
2319 if (!MI == isIfndef) {
2320 // Yes, remember that we are inside a conditional, then lex the next token.
2321 CurLexer->pushConditionalLevel(DirectiveTok.getLocation(), /*wasskip*/false,
2322 /*foundnonskip*/true, /*foundelse*/false);
2323 } else {
2324 // No, skip the contents of this block and return the first token after it.
2325 SkipExcludedConditionalBlock(DirectiveTok.getLocation(),
2326 /*Foundnonskip*/false,
2327 /*FoundElse*/false);
2328 }
2329}
2330
2331/// HandleIfDirective - Implements the #if directive.
2332///
2333void Preprocessor::HandleIfDirective(Token &IfToken,
2334 bool ReadAnyTokensBeforeDirective) {
2335 ++NumIf;
2336
2337 // Parse and evaluation the conditional expression.
2338 IdentifierInfo *IfNDefMacro = 0;
2339 bool ConditionalTrue = EvaluateDirectiveExpression(IfNDefMacro);
2340
2341 // Should we include the stuff contained by this directive?
2342 if (ConditionalTrue) {
2343 // If this condition is equivalent to #ifndef X, and if this is the first
2344 // directive seen, handle it for the multiple-include optimization.
2345 if (!ReadAnyTokensBeforeDirective &&
2346 CurLexer->getConditionalStackDepth() == 0 && IfNDefMacro)
2347 CurLexer->MIOpt.EnterTopLevelIFNDEF(IfNDefMacro);
2348
2349 // Yes, remember that we are inside a conditional, then lex the next token.
2350 CurLexer->pushConditionalLevel(IfToken.getLocation(), /*wasskip*/false,
2351 /*foundnonskip*/true, /*foundelse*/false);
2352 } else {
2353 // No, skip the contents of this block and return the first token after it.
2354 SkipExcludedConditionalBlock(IfToken.getLocation(), /*Foundnonskip*/false,
2355 /*FoundElse*/false);
2356 }
2357}
2358
2359/// HandleEndifDirective - Implements the #endif directive.
2360///
2361void Preprocessor::HandleEndifDirective(Token &EndifToken) {
2362 ++NumEndif;
2363
2364 // Check that this is the whole directive.
2365 CheckEndOfDirective("#endif");
2366
2367 PPConditionalInfo CondInfo;
2368 if (CurLexer->popConditionalLevel(CondInfo)) {
2369 // No conditionals on the stack: this is an #endif without an #if.
2370 return Diag(EndifToken, diag::err_pp_endif_without_if);
2371 }
2372
2373 // If this the end of a top-level #endif, inform MIOpt.
2374 if (CurLexer->getConditionalStackDepth() == 0)
2375 CurLexer->MIOpt.ExitTopLevelConditional();
2376
2377 assert(!CondInfo.WasSkipping && !CurLexer->LexingRawMode &&
2378 "This code should only be reachable in the non-skipping case!");
2379}
2380
2381
2382void Preprocessor::HandleElseDirective(Token &Result) {
2383 ++NumElse;
2384
2385 // #else directive in a non-skipping conditional... start skipping.
2386 CheckEndOfDirective("#else");
2387
2388 PPConditionalInfo CI;
2389 if (CurLexer->popConditionalLevel(CI))
2390 return Diag(Result, diag::pp_err_else_without_if);
2391
2392 // If this is a top-level #else, inform the MIOpt.
2393 if (CurLexer->getConditionalStackDepth() == 0)
2394 CurLexer->MIOpt.FoundTopLevelElse();
2395
2396 // If this is a #else with a #else before it, report the error.
2397 if (CI.FoundElse) Diag(Result, diag::pp_err_else_after_else);
2398
2399 // Finally, skip the rest of the contents of this block and return the first
2400 // token after it.
2401 return SkipExcludedConditionalBlock(CI.IfLoc, /*Foundnonskip*/true,
2402 /*FoundElse*/true);
2403}
2404
2405void Preprocessor::HandleElifDirective(Token &ElifToken) {
2406 ++NumElse;
2407
2408 // #elif directive in a non-skipping conditional... start skipping.
2409 // We don't care what the condition is, because we will always skip it (since
2410 // the block immediately before it was included).
2411 DiscardUntilEndOfDirective();
2412
2413 PPConditionalInfo CI;
2414 if (CurLexer->popConditionalLevel(CI))
2415 return Diag(ElifToken, diag::pp_err_elif_without_if);
2416
2417 // If this is a top-level #elif, inform the MIOpt.
2418 if (CurLexer->getConditionalStackDepth() == 0)
2419 CurLexer->MIOpt.FoundTopLevelElse();
2420
2421 // If this is a #elif with a #else before it, report the error.
2422 if (CI.FoundElse) Diag(ElifToken, diag::pp_err_elif_after_else);
2423
2424 // Finally, skip the rest of the contents of this block and return the first
2425 // token after it.
2426 return SkipExcludedConditionalBlock(CI.IfLoc, /*Foundnonskip*/true,
2427 /*FoundElse*/CI.FoundElse);
2428}
2429