blob: a73757f1b59e09c75a387e98a276f1f1517cdec7 [file] [log] [blame]
//===--- Preprocess.cpp - C Language Family Preprocessor Implementation ---===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
//  This file implements the Preprocessor interface.
//
//===----------------------------------------------------------------------===//
//
// Options to support:
//   -H       - Print the name of each header file used.
//   -d[MDNI] - Dump various things.
//   -fworking-directory - #line's with preprocessor's working dir.
//   -fpreprocessed
//   -dependency-file,-M,-MM,-MF,-MG,-MP,-MT,-MQ,-MD,-MMD
//   -W*
//   -w
//
// Messages to emit:
//   "Multiple include guards may be useful for:\n"
//
//===----------------------------------------------------------------------===//
27
28#include "clang/Lex/Preprocessor.h"
29#include "clang/Lex/HeaderSearch.h"
30#include "clang/Lex/MacroInfo.h"
31#include "clang/Lex/PPCallbacks.h"
32#include "clang/Lex/Pragma.h"
33#include "clang/Lex/ScratchBuffer.h"
34#include "clang/Basic/Diagnostic.h"
35#include "clang/Basic/FileManager.h"
36#include "clang/Basic/SourceManager.h"
37#include "clang/Basic/TargetInfo.h"
38#include "llvm/ADT/SmallVector.h"
Chris Lattner97ba77c2007-07-16 06:48:38 +000039#include "llvm/Support/MemoryBuffer.h"
Ted Kremenekbdd30c22008-01-14 16:44:48 +000040#include "llvm/Support/Streams.h"
Chris Lattner77034d32007-09-03 18:30:32 +000041#include <ctime>
Reid Spencer5f016e22007-07-11 17:01:13 +000042using namespace clang;
43
44//===----------------------------------------------------------------------===//
45
46Preprocessor::Preprocessor(Diagnostic &diags, const LangOptions &opts,
47 TargetInfo &target, SourceManager &SM,
48 HeaderSearch &Headers)
49 : Diags(diags), Features(opts), Target(target), FileMgr(Headers.getFileMgr()),
50 SourceMgr(SM), HeaderInfo(Headers), Identifiers(opts),
51 CurLexer(0), CurDirLookup(0), CurMacroExpander(0), Callbacks(0) {
52 ScratchBuf = new ScratchBuffer(SourceMgr);
Chris Lattner9594acf2007-07-15 00:25:26 +000053
Reid Spencer5f016e22007-07-11 17:01:13 +000054 // Clear stats.
55 NumDirectives = NumDefined = NumUndefined = NumPragma = 0;
56 NumIf = NumElse = NumEndif = 0;
57 NumEnteredSourceFiles = 0;
58 NumMacroExpanded = NumFnMacroExpanded = NumBuiltinMacroExpanded = 0;
59 NumFastMacroExpanded = NumTokenPaste = NumFastTokenPaste = 0;
60 MaxIncludeStackDepth = 0;
61 NumSkipped = 0;
62
63 // Default to discarding comments.
64 KeepComments = false;
65 KeepMacroComments = false;
66
67 // Macro expansion is enabled.
68 DisableMacroExpansion = false;
69 InMacroArgs = false;
Chris Lattner9594acf2007-07-15 00:25:26 +000070 NumCachedMacroExpanders = 0;
Reid Spencer5f016e22007-07-11 17:01:13 +000071
72 // "Poison" __VA_ARGS__, which can only appear in the expansion of a macro.
73 // This gets unpoisoned where it is allowed.
74 (Ident__VA_ARGS__ = getIdentifierInfo("__VA_ARGS__"))->setIsPoisoned();
75
Chris Lattner53b0dab2007-10-09 22:10:18 +000076 Predefines = 0;
77
Reid Spencer5f016e22007-07-11 17:01:13 +000078 // Initialize the pragma handlers.
79 PragmaHandlers = new PragmaNamespace(0);
80 RegisterBuiltinPragmas();
81
82 // Initialize builtin macros like __LINE__ and friends.
83 RegisterBuiltinMacros();
84}
85
86Preprocessor::~Preprocessor() {
87 // Free any active lexers.
88 delete CurLexer;
89
90 while (!IncludeMacroStack.empty()) {
91 delete IncludeMacroStack.back().TheLexer;
92 delete IncludeMacroStack.back().TheMacroExpander;
93 IncludeMacroStack.pop_back();
94 }
Chris Lattnercc1a8752007-10-07 08:44:20 +000095
96 // Free any macro definitions.
97 for (llvm::DenseMap<IdentifierInfo*, MacroInfo*>::iterator I =
98 Macros.begin(), E = Macros.end(); I != E; ++I) {
99 // Free the macro definition.
100 delete I->second;
101 I->second = 0;
102 I->first->setHasMacroDefinition(false);
103 }
Reid Spencer5f016e22007-07-11 17:01:13 +0000104
Chris Lattner9594acf2007-07-15 00:25:26 +0000105 // Free any cached macro expanders.
106 for (unsigned i = 0, e = NumCachedMacroExpanders; i != e; ++i)
107 delete MacroExpanderCache[i];
108
Reid Spencer5f016e22007-07-11 17:01:13 +0000109 // Release pragma information.
110 delete PragmaHandlers;
111
112 // Delete the scratch buffer info.
113 delete ScratchBuf;
114}
115
116PPCallbacks::~PPCallbacks() {
117}
118
119/// Diag - Forwarding function for diagnostics. This emits a diagnostic at
Chris Lattnerd2177732007-07-20 16:59:19 +0000120/// the specified Token's location, translating the token's start
Reid Spencer5f016e22007-07-11 17:01:13 +0000121/// position in the current buffer into a SourcePosition object for rendering.
122void Preprocessor::Diag(SourceLocation Loc, unsigned DiagID) {
Ted Kremenek9c728dc2007-12-12 22:39:36 +0000123 Diags.Report(getFullLoc(Loc), DiagID);
Reid Spencer5f016e22007-07-11 17:01:13 +0000124}
125
126void Preprocessor::Diag(SourceLocation Loc, unsigned DiagID,
127 const std::string &Msg) {
Ted Kremenek9c728dc2007-12-12 22:39:36 +0000128 Diags.Report(getFullLoc(Loc), DiagID, &Msg, 1);
Reid Spencer5f016e22007-07-11 17:01:13 +0000129}
130
Chris Lattnerd2177732007-07-20 16:59:19 +0000131void Preprocessor::DumpToken(const Token &Tok, bool DumpFlags) const {
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000132 llvm::cerr << tok::getTokenName(Tok.getKind()) << " '"
133 << getSpelling(Tok) << "'";
Reid Spencer5f016e22007-07-11 17:01:13 +0000134
135 if (!DumpFlags) return;
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000136
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000137 llvm::cerr << "\t";
Reid Spencer5f016e22007-07-11 17:01:13 +0000138 if (Tok.isAtStartOfLine())
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000139 llvm::cerr << " [StartOfLine]";
Reid Spencer5f016e22007-07-11 17:01:13 +0000140 if (Tok.hasLeadingSpace())
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000141 llvm::cerr << " [LeadingSpace]";
Reid Spencer5f016e22007-07-11 17:01:13 +0000142 if (Tok.isExpandDisabled())
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000143 llvm::cerr << " [ExpandDisabled]";
Reid Spencer5f016e22007-07-11 17:01:13 +0000144 if (Tok.needsCleaning()) {
145 const char *Start = SourceMgr.getCharacterData(Tok.getLocation());
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000146 llvm::cerr << " [UnClean='" << std::string(Start, Start+Tok.getLength())
147 << "']";
Reid Spencer5f016e22007-07-11 17:01:13 +0000148 }
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000149
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000150 llvm::cerr << "\tLoc=<";
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000151 DumpLocation(Tok.getLocation());
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000152 llvm::cerr << ">";
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000153}
154
155void Preprocessor::DumpLocation(SourceLocation Loc) const {
156 SourceLocation LogLoc = SourceMgr.getLogicalLoc(Loc);
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000157 llvm::cerr << SourceMgr.getSourceName(LogLoc) << ':'
158 << SourceMgr.getLineNumber(LogLoc) << ':'
159 << SourceMgr.getLineNumber(LogLoc);
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000160
161 SourceLocation PhysLoc = SourceMgr.getPhysicalLoc(Loc);
162 if (PhysLoc != LogLoc) {
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000163 llvm::cerr << " <PhysLoc=";
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000164 DumpLocation(PhysLoc);
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000165 llvm::cerr << ">";
Chris Lattnerc3d8d572007-12-09 20:31:55 +0000166 }
Reid Spencer5f016e22007-07-11 17:01:13 +0000167}
168
169void Preprocessor::DumpMacro(const MacroInfo &MI) const {
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000170 llvm::cerr << "MACRO: ";
Reid Spencer5f016e22007-07-11 17:01:13 +0000171 for (unsigned i = 0, e = MI.getNumTokens(); i != e; ++i) {
172 DumpToken(MI.getReplacementToken(i));
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000173 llvm::cerr << " ";
Reid Spencer5f016e22007-07-11 17:01:13 +0000174 }
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000175 llvm::cerr << "\n";
Reid Spencer5f016e22007-07-11 17:01:13 +0000176}
177
178void Preprocessor::PrintStats() {
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000179 llvm::cerr << "\n*** Preprocessor Stats:\n";
180 llvm::cerr << NumDirectives << " directives found:\n";
181 llvm::cerr << " " << NumDefined << " #define.\n";
182 llvm::cerr << " " << NumUndefined << " #undef.\n";
183 llvm::cerr << " #include/#include_next/#import:\n";
184 llvm::cerr << " " << NumEnteredSourceFiles << " source files entered.\n";
185 llvm::cerr << " " << MaxIncludeStackDepth << " max include stack depth\n";
186 llvm::cerr << " " << NumIf << " #if/#ifndef/#ifdef.\n";
187 llvm::cerr << " " << NumElse << " #else/#elif.\n";
188 llvm::cerr << " " << NumEndif << " #endif.\n";
189 llvm::cerr << " " << NumPragma << " #pragma.\n";
190 llvm::cerr << NumSkipped << " #if/#ifndef#ifdef regions skipped\n";
Reid Spencer5f016e22007-07-11 17:01:13 +0000191
Ted Kremenekbdd30c22008-01-14 16:44:48 +0000192 llvm::cerr << NumMacroExpanded << "/" << NumFnMacroExpanded << "/"
193 << NumBuiltinMacroExpanded << " obj/fn/builtin macros expanded, "
194 << NumFastMacroExpanded << " on the fast path.\n";
195 llvm::cerr << (NumFastTokenPaste+NumTokenPaste)
196 << " token paste (##) operations performed, "
197 << NumFastTokenPaste << " on the fast path.\n";
Reid Spencer5f016e22007-07-11 17:01:13 +0000198}
199
200//===----------------------------------------------------------------------===//
201// Token Spelling
202//===----------------------------------------------------------------------===//
203
204
205/// getSpelling() - Return the 'spelling' of this token. The spelling of a
206/// token are the characters used to represent the token in the source file
207/// after trigraph expansion and escaped-newline folding. In particular, this
208/// wants to get the true, uncanonicalized, spelling of things like digraphs
209/// UCNs, etc.
Chris Lattnerd2177732007-07-20 16:59:19 +0000210std::string Preprocessor::getSpelling(const Token &Tok) const {
Reid Spencer5f016e22007-07-11 17:01:13 +0000211 assert((int)Tok.getLength() >= 0 && "Token character range is bogus!");
212
213 // If this token contains nothing interesting, return it directly.
214 const char *TokStart = SourceMgr.getCharacterData(Tok.getLocation());
215 if (!Tok.needsCleaning())
216 return std::string(TokStart, TokStart+Tok.getLength());
217
218 std::string Result;
219 Result.reserve(Tok.getLength());
220
221 // Otherwise, hard case, relex the characters into the string.
222 for (const char *Ptr = TokStart, *End = TokStart+Tok.getLength();
223 Ptr != End; ) {
224 unsigned CharSize;
225 Result.push_back(Lexer::getCharAndSizeNoWarn(Ptr, CharSize, Features));
226 Ptr += CharSize;
227 }
228 assert(Result.size() != unsigned(Tok.getLength()) &&
229 "NeedsCleaning flag set on something that didn't need cleaning!");
230 return Result;
231}
232
233/// getSpelling - This method is used to get the spelling of a token into a
234/// preallocated buffer, instead of as an std::string. The caller is required
235/// to allocate enough space for the token, which is guaranteed to be at least
236/// Tok.getLength() bytes long. The actual length of the token is returned.
237///
238/// Note that this method may do two possible things: it may either fill in
239/// the buffer specified with characters, or it may *change the input pointer*
240/// to point to a constant buffer with the data already in it (avoiding a
241/// copy). The caller is not allowed to modify the returned buffer pointer
242/// if an internal buffer is returned.
Chris Lattnerd2177732007-07-20 16:59:19 +0000243unsigned Preprocessor::getSpelling(const Token &Tok,
Reid Spencer5f016e22007-07-11 17:01:13 +0000244 const char *&Buffer) const {
245 assert((int)Tok.getLength() >= 0 && "Token character range is bogus!");
246
247 // If this token is an identifier, just return the string from the identifier
248 // table, which is very quick.
249 if (const IdentifierInfo *II = Tok.getIdentifierInfo()) {
250 Buffer = II->getName();
Chris Lattner0f670322007-07-22 22:50:09 +0000251
252 // Return the length of the token. If the token needed cleaning, don't
253 // include the size of the newlines or trigraphs in it.
254 if (!Tok.needsCleaning())
255 return Tok.getLength();
256 else
257 return strlen(Buffer);
Reid Spencer5f016e22007-07-11 17:01:13 +0000258 }
259
260 // Otherwise, compute the start of the token in the input lexer buffer.
261 const char *TokStart = SourceMgr.getCharacterData(Tok.getLocation());
262
263 // If this token contains nothing interesting, return it directly.
264 if (!Tok.needsCleaning()) {
265 Buffer = TokStart;
266 return Tok.getLength();
267 }
268 // Otherwise, hard case, relex the characters into the string.
269 char *OutBuf = const_cast<char*>(Buffer);
270 for (const char *Ptr = TokStart, *End = TokStart+Tok.getLength();
271 Ptr != End; ) {
272 unsigned CharSize;
273 *OutBuf++ = Lexer::getCharAndSizeNoWarn(Ptr, CharSize, Features);
274 Ptr += CharSize;
275 }
276 assert(unsigned(OutBuf-Buffer) != Tok.getLength() &&
277 "NeedsCleaning flag set on something that didn't need cleaning!");
278
279 return OutBuf-Buffer;
280}
281
282
283/// CreateString - Plop the specified string into a scratch buffer and return a
284/// location for it. If specified, the source location provides a source
285/// location for the token.
286SourceLocation Preprocessor::
287CreateString(const char *Buf, unsigned Len, SourceLocation SLoc) {
288 if (SLoc.isValid())
289 return ScratchBuf->getToken(Buf, Len, SLoc);
290 return ScratchBuf->getToken(Buf, Len);
291}
292
293
Chris Lattner97ba77c2007-07-16 06:48:38 +0000294/// AdvanceToTokenCharacter - Given a location that specifies the start of a
295/// token, return a new location that specifies a character within the token.
296SourceLocation Preprocessor::AdvanceToTokenCharacter(SourceLocation TokStart,
297 unsigned CharNo) {
Chris Lattner9dc1f532007-07-20 16:37:10 +0000298 // If they request the first char of the token, we're trivially done. If this
299 // is a macro expansion, it doesn't make sense to point to a character within
300 // the instantiation point (the name). We could point to the source
301 // character, but without also pointing to instantiation info, this is
302 // confusing.
303 if (CharNo == 0 || TokStart.isMacroID()) return TokStart;
Chris Lattner97ba77c2007-07-16 06:48:38 +0000304
305 // Figure out how many physical characters away the specified logical
306 // character is. This needs to take into consideration newlines and
307 // trigraphs.
Chris Lattner9dc1f532007-07-20 16:37:10 +0000308 const char *TokPtr = SourceMgr.getCharacterData(TokStart);
309 unsigned PhysOffset = 0;
Chris Lattner97ba77c2007-07-16 06:48:38 +0000310
311 // The usual case is that tokens don't contain anything interesting. Skip
312 // over the uninteresting characters. If a token only consists of simple
313 // chars, this method is extremely fast.
314 while (CharNo && Lexer::isObviouslySimpleCharacter(*TokPtr))
Chris Lattner9dc1f532007-07-20 16:37:10 +0000315 ++TokPtr, --CharNo, ++PhysOffset;
Chris Lattner97ba77c2007-07-16 06:48:38 +0000316
317 // If we have a character that may be a trigraph or escaped newline, create a
318 // lexer to parse it correctly.
Chris Lattner97ba77c2007-07-16 06:48:38 +0000319 if (CharNo != 0) {
320 // Create a lexer starting at this token position.
Chris Lattner25bdb512007-07-20 16:52:03 +0000321 Lexer TheLexer(TokStart, *this, TokPtr);
Chris Lattnerd2177732007-07-20 16:59:19 +0000322 Token Tok;
Chris Lattner97ba77c2007-07-16 06:48:38 +0000323 // Skip over characters the remaining characters.
Chris Lattner9dc1f532007-07-20 16:37:10 +0000324 const char *TokStartPtr = TokPtr;
Chris Lattner97ba77c2007-07-16 06:48:38 +0000325 for (; CharNo; --CharNo)
326 TheLexer.getAndAdvanceChar(TokPtr, Tok);
Chris Lattner9dc1f532007-07-20 16:37:10 +0000327
328 PhysOffset += TokPtr-TokStartPtr;
Chris Lattner97ba77c2007-07-16 06:48:38 +0000329 }
Chris Lattner9dc1f532007-07-20 16:37:10 +0000330
331 return TokStart.getFileLocWithOffset(PhysOffset);
Chris Lattner97ba77c2007-07-16 06:48:38 +0000332}
333
334
Chris Lattner53b0dab2007-10-09 22:10:18 +0000335//===----------------------------------------------------------------------===//
336// Preprocessor Initialization Methods
337//===----------------------------------------------------------------------===//
338
// Append one directive line for Macro to Buf, introduced by Command (which
// defaults to "#define ").  Macro is either of the form "XXX", which emits
// "#define XXX 1", or "XXX=Y z W", which emits "#define XXX Y z W": only the
// first '=' is turned into a space.  To get a #define with no value, use
// "XXX=".
static void DefineBuiltinMacro(std::vector<char> &Buf, const char *Macro,
                               const char *Command = "#define ") {
  const char *const MacroEnd = Macro + strlen(Macro);
  const char *const Equal = strchr(Macro, '=');

  Buf.insert(Buf.end(), Command, Command + strlen(Command));

  if (Equal == 0) {
    // No value given: emit "macroname 1".
    Buf.insert(Buf.end(), Macro, MacroEnd);
    Buf.push_back(' ');
    Buf.push_back('1');
  } else {
    // Emit the name, a space in place of the '=', then the value.
    Buf.insert(Buf.end(), Macro, Equal);
    Buf.push_back(' ');
    Buf.insert(Buf.end(), Equal + 1, MacroEnd);
  }

  Buf.push_back('\n');
}
358
359
360static void InitializePredefinedMacros(Preprocessor &PP,
361 std::vector<char> &Buf) {
362 // FIXME: Implement magic like cpp_init_builtins for things like __STDC__
363 // and __DATE__ etc.
364#if 0
365 /* __STDC__ has the value 1 under normal circumstances.
366 However, if (a) we are in a system header, (b) the option
367 stdc_0_in_system_headers is true (set by target config), and
368 (c) we are not in strictly conforming mode, then it has the
369 value 0. (b) and (c) are already checked in cpp_init_builtins. */
370 //case BT_STDC:
371 if (cpp_in_system_header (pfile))
372 number = 0;
373 else
374 number = 1;
375 break;
376#endif
377 // These should all be defined in the preprocessor according to the
378 // current language configuration.
379 DefineBuiltinMacro(Buf, "__STDC__=1");
380 //DefineBuiltinMacro(Buf, "__ASSEMBLER__=1");
381 if (PP.getLangOptions().C99 && !PP.getLangOptions().CPlusPlus)
382 DefineBuiltinMacro(Buf, "__STDC_VERSION__=199901L");
383 else if (0) // STDC94 ?
384 DefineBuiltinMacro(Buf, "__STDC_VERSION__=199409L");
385
386 DefineBuiltinMacro(Buf, "__STDC_HOSTED__=1");
387 if (PP.getLangOptions().ObjC1)
388 DefineBuiltinMacro(Buf, "__OBJC__=1");
389 if (PP.getLangOptions().ObjC2)
390 DefineBuiltinMacro(Buf, "__OBJC2__=1");
Steve Naroff8ee529b2007-10-31 18:42:27 +0000391
Chris Lattnerd19144b2007-10-10 17:48:53 +0000392 // Add __builtin_va_list typedef.
393 {
394 const char *VAList = PP.getTargetInfo().getVAListDeclaration();
395 Buf.insert(Buf.end(), VAList, VAList+strlen(VAList));
396 Buf.push_back('\n');
397 }
Chris Lattner53b0dab2007-10-09 22:10:18 +0000398
399 // Get the target #defines.
400 PP.getTargetInfo().getTargetDefines(Buf);
401
402 // Compiler set macros.
403 DefineBuiltinMacro(Buf, "__APPLE_CC__=5250");
Steve Naroff39d0a272007-11-10 18:06:36 +0000404 DefineBuiltinMacro(Buf, "__ENVIRONMENT_MAC_OS_X_VERSION_MIN_REQUIRED__=1050");
Chris Lattner53b0dab2007-10-09 22:10:18 +0000405 DefineBuiltinMacro(Buf, "__GNUC_MINOR__=0");
406 DefineBuiltinMacro(Buf, "__GNUC_PATCHLEVEL__=1");
407 DefineBuiltinMacro(Buf, "__GNUC__=4");
408 DefineBuiltinMacro(Buf, "__GXX_ABI_VERSION=1002");
409 DefineBuiltinMacro(Buf, "__VERSION__=\"4.0.1 (Apple Computer, Inc. "
410 "build 5250)\"");
411
412 // Build configuration options.
413 DefineBuiltinMacro(Buf, "__DYNAMIC__=1");
414 DefineBuiltinMacro(Buf, "__FINITE_MATH_ONLY__=0");
415 DefineBuiltinMacro(Buf, "__NO_INLINE__=1");
416 DefineBuiltinMacro(Buf, "__PIC__=1");
417
418
419 if (PP.getLangOptions().CPlusPlus) {
420 DefineBuiltinMacro(Buf, "__DEPRECATED=1");
421 DefineBuiltinMacro(Buf, "__EXCEPTIONS=1");
422 DefineBuiltinMacro(Buf, "__GNUG__=4");
423 DefineBuiltinMacro(Buf, "__GXX_WEAK__=1");
424 DefineBuiltinMacro(Buf, "__cplusplus=1");
425 DefineBuiltinMacro(Buf, "__private_extern__=extern");
426 }
427
428 // FIXME: Should emit a #line directive here.
429}
430
431
432/// EnterMainSourceFile - Enter the specified FileID as the main source file,
Nate Begeman6b616022008-01-07 04:01:26 +0000433/// which implicitly adds the builtin defines etc.
Ted Kremenek95041a22007-12-19 22:51:13 +0000434void Preprocessor::EnterMainSourceFile() {
435
436 unsigned MainFileID = SourceMgr.getMainFileID();
437
Chris Lattner53b0dab2007-10-09 22:10:18 +0000438 // Enter the main file source buffer.
439 EnterSourceFile(MainFileID, 0);
440
Chris Lattnerb2832982007-11-15 19:07:47 +0000441 // Tell the header info that the main file was entered. If the file is later
442 // #imported, it won't be re-entered.
443 if (const FileEntry *FE =
444 SourceMgr.getFileEntryForLoc(SourceLocation::getFileLoc(MainFileID, 0)))
445 HeaderInfo.IncrementIncludeCount(FE);
446
Chris Lattner53b0dab2007-10-09 22:10:18 +0000447 std::vector<char> PrologFile;
448 PrologFile.reserve(4080);
449
450 // Install things like __POWERPC__, __GNUC__, etc into the macro table.
451 InitializePredefinedMacros(*this, PrologFile);
452
453 // Add on the predefines from the driver.
454 PrologFile.insert(PrologFile.end(), Predefines,Predefines+strlen(Predefines));
455
456 // Memory buffer must end with a null byte!
457 PrologFile.push_back(0);
458
459 // Now that we have emitted the predefined macros, #includes, etc into
460 // PrologFile, preprocess it to populate the initial preprocessor state.
461 llvm::MemoryBuffer *SB =
462 llvm::MemoryBuffer::getMemBufferCopy(&PrologFile.front(),&PrologFile.back(),
463 "<predefines>");
464 assert(SB && "Cannot fail to create predefined source buffer");
465 unsigned FileID = SourceMgr.createFileIDForMemBuffer(SB);
466 assert(FileID && "Could not create FileID for predefines?");
467
468 // Start parsing the predefines.
469 EnterSourceFile(FileID, 0);
470}
Chris Lattner97ba77c2007-07-16 06:48:38 +0000471
Reid Spencer5f016e22007-07-11 17:01:13 +0000472//===----------------------------------------------------------------------===//
473// Source File Location Methods.
474//===----------------------------------------------------------------------===//
475
476/// LookupFile - Given a "foo" or <foo> reference, look up the indicated file,
477/// return null on failure. isAngled indicates whether the file reference is
478/// for system #include's or not (i.e. using <> instead of "").
479const FileEntry *Preprocessor::LookupFile(const char *FilenameStart,
480 const char *FilenameEnd,
481 bool isAngled,
482 const DirectoryLookup *FromDir,
483 const DirectoryLookup *&CurDir) {
484 // If the header lookup mechanism may be relative to the current file, pass in
485 // info about where the current file is.
486 const FileEntry *CurFileEnt = 0;
487 if (!FromDir) {
Chris Lattner9dc1f532007-07-20 16:37:10 +0000488 SourceLocation FileLoc = getCurrentFileLexer()->getFileLoc();
489 CurFileEnt = SourceMgr.getFileEntryForLoc(FileLoc);
Reid Spencer5f016e22007-07-11 17:01:13 +0000490 }
491
492 // Do a standard file entry lookup.
493 CurDir = CurDirLookup;
494 const FileEntry *FE =
495 HeaderInfo.LookupFile(FilenameStart, FilenameEnd,
496 isAngled, FromDir, CurDir, CurFileEnt);
497 if (FE) return FE;
498
499 // Otherwise, see if this is a subframework header. If so, this is relative
500 // to one of the headers on the #include stack. Walk the list of the current
501 // headers on the #include stack and pass them to HeaderInfo.
502 if (CurLexer && !CurLexer->Is_PragmaLexer) {
Chris Lattner9415a0c2008-02-01 05:34:02 +0000503 if ((CurFileEnt = SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc())))
504 if ((FE = HeaderInfo.LookupSubframeworkHeader(FilenameStart, FilenameEnd,
505 CurFileEnt)))
506 return FE;
Reid Spencer5f016e22007-07-11 17:01:13 +0000507 }
508
509 for (unsigned i = 0, e = IncludeMacroStack.size(); i != e; ++i) {
510 IncludeStackInfo &ISEntry = IncludeMacroStack[e-i-1];
511 if (ISEntry.TheLexer && !ISEntry.TheLexer->Is_PragmaLexer) {
Chris Lattner9415a0c2008-02-01 05:34:02 +0000512 if ((CurFileEnt =
513 SourceMgr.getFileEntryForLoc(ISEntry.TheLexer->getFileLoc())))
514 if ((FE = HeaderInfo.LookupSubframeworkHeader(FilenameStart,
515 FilenameEnd, CurFileEnt)))
516 return FE;
Reid Spencer5f016e22007-07-11 17:01:13 +0000517 }
518 }
519
520 // Otherwise, we really couldn't find the file.
521 return 0;
522}
523
524/// isInPrimaryFile - Return true if we're in the top-level file, not in a
525/// #include.
526bool Preprocessor::isInPrimaryFile() const {
527 if (CurLexer && !CurLexer->Is_PragmaLexer)
Chris Lattner53b0dab2007-10-09 22:10:18 +0000528 return IncludeMacroStack.empty();
Reid Spencer5f016e22007-07-11 17:01:13 +0000529
530 // If there are any stacked lexers, we're in a #include.
Chris Lattner53b0dab2007-10-09 22:10:18 +0000531 assert(IncludeMacroStack[0].TheLexer &&
532 !IncludeMacroStack[0].TheLexer->Is_PragmaLexer &&
533 "Top level include stack isn't our primary lexer?");
534 for (unsigned i = 1, e = IncludeMacroStack.size(); i != e; ++i)
Reid Spencer5f016e22007-07-11 17:01:13 +0000535 if (IncludeMacroStack[i].TheLexer &&
536 !IncludeMacroStack[i].TheLexer->Is_PragmaLexer)
Chris Lattner53b0dab2007-10-09 22:10:18 +0000537 return false;
538 return true;
Reid Spencer5f016e22007-07-11 17:01:13 +0000539}
540
541/// getCurrentLexer - Return the current file lexer being lexed from. Note
542/// that this ignores any potentially active macro expansions and _Pragma
543/// expansions going on at the time.
544Lexer *Preprocessor::getCurrentFileLexer() const {
545 if (CurLexer && !CurLexer->Is_PragmaLexer) return CurLexer;
546
547 // Look for a stacked lexer.
548 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
549 Lexer *L = IncludeMacroStack[i-1].TheLexer;
550 if (L && !L->Is_PragmaLexer) // Ignore macro & _Pragma expansions.
551 return L;
552 }
553 return 0;
554}
555
556
557/// EnterSourceFile - Add a source file to the top of the include stack and
558/// start lexing tokens from it instead of the current buffer. Return true
559/// on failure.
560void Preprocessor::EnterSourceFile(unsigned FileID,
Chris Lattner53b0dab2007-10-09 22:10:18 +0000561 const DirectoryLookup *CurDir) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000562 assert(CurMacroExpander == 0 && "Cannot #include a file inside a macro!");
563 ++NumEnteredSourceFiles;
564
565 if (MaxIncludeStackDepth < IncludeMacroStack.size())
566 MaxIncludeStackDepth = IncludeMacroStack.size();
567
Chris Lattner25bdb512007-07-20 16:52:03 +0000568 Lexer *TheLexer = new Lexer(SourceLocation::getFileLoc(FileID, 0), *this);
Reid Spencer5f016e22007-07-11 17:01:13 +0000569 EnterSourceFileWithLexer(TheLexer, CurDir);
570}
571
572/// EnterSourceFile - Add a source file to the top of the include stack and
573/// start lexing tokens from it instead of the current buffer.
574void Preprocessor::EnterSourceFileWithLexer(Lexer *TheLexer,
575 const DirectoryLookup *CurDir) {
576
577 // Add the current lexer to the include stack.
578 if (CurLexer || CurMacroExpander)
579 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
580 CurMacroExpander));
581
582 CurLexer = TheLexer;
583 CurDirLookup = CurDir;
584 CurMacroExpander = 0;
585
586 // Notify the client, if desired, that we are in a new source file.
587 if (Callbacks && !CurLexer->Is_PragmaLexer) {
588 DirectoryLookup::DirType FileType = DirectoryLookup::NormalHeaderDir;
589
590 // Get the file entry for the current file.
591 if (const FileEntry *FE =
Chris Lattner9dc1f532007-07-20 16:37:10 +0000592 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
Reid Spencer5f016e22007-07-11 17:01:13 +0000593 FileType = HeaderInfo.getFileDirFlavor(FE);
594
Chris Lattner9dc1f532007-07-20 16:37:10 +0000595 Callbacks->FileChanged(CurLexer->getFileLoc(),
Reid Spencer5f016e22007-07-11 17:01:13 +0000596 PPCallbacks::EnterFile, FileType);
597 }
598}
599
600
601
602/// EnterMacro - Add a Macro to the top of the include stack and start lexing
603/// tokens from it instead of the current buffer.
Chris Lattnerd2177732007-07-20 16:59:19 +0000604void Preprocessor::EnterMacro(Token &Tok, MacroArgs *Args) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000605 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
606 CurMacroExpander));
607 CurLexer = 0;
608 CurDirLookup = 0;
609
Chris Lattner9594acf2007-07-15 00:25:26 +0000610 if (NumCachedMacroExpanders == 0) {
611 CurMacroExpander = new MacroExpander(Tok, Args, *this);
612 } else {
613 CurMacroExpander = MacroExpanderCache[--NumCachedMacroExpanders];
614 CurMacroExpander->Init(Tok, Args);
615 }
Reid Spencer5f016e22007-07-11 17:01:13 +0000616}
617
618/// EnterTokenStream - Add a "macro" context to the top of the include stack,
619/// which will cause the lexer to start returning the specified tokens. Note
620/// that these tokens will be re-macro-expanded when/if expansion is enabled.
621/// This method assumes that the specified stream of tokens has a permanent
622/// owner somewhere, so they do not need to be copied.
Chris Lattnerd2177732007-07-20 16:59:19 +0000623void Preprocessor::EnterTokenStream(const Token *Toks, unsigned NumToks) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000624 // Save our current state.
625 IncludeMacroStack.push_back(IncludeStackInfo(CurLexer, CurDirLookup,
626 CurMacroExpander));
627 CurLexer = 0;
628 CurDirLookup = 0;
629
630 // Create a macro expander to expand from the specified token stream.
Chris Lattner9594acf2007-07-15 00:25:26 +0000631 if (NumCachedMacroExpanders == 0) {
632 CurMacroExpander = new MacroExpander(Toks, NumToks, *this);
633 } else {
634 CurMacroExpander = MacroExpanderCache[--NumCachedMacroExpanders];
635 CurMacroExpander->Init(Toks, NumToks);
636 }
Reid Spencer5f016e22007-07-11 17:01:13 +0000637}
638
639/// RemoveTopOfLexerStack - Pop the current lexer/macro exp off the top of the
640/// lexer stack. This should only be used in situations where the current
641/// state of the top-of-stack lexer is known.
642void Preprocessor::RemoveTopOfLexerStack() {
643 assert(!IncludeMacroStack.empty() && "Ran out of stack entries to load");
Chris Lattner9594acf2007-07-15 00:25:26 +0000644
645 if (CurMacroExpander) {
646 // Delete or cache the now-dead macro expander.
647 if (NumCachedMacroExpanders == MacroExpanderCacheSize)
648 delete CurMacroExpander;
649 else
650 MacroExpanderCache[NumCachedMacroExpanders++] = CurMacroExpander;
651 } else {
652 delete CurLexer;
653 }
Reid Spencer5f016e22007-07-11 17:01:13 +0000654 CurLexer = IncludeMacroStack.back().TheLexer;
655 CurDirLookup = IncludeMacroStack.back().TheDirLookup;
656 CurMacroExpander = IncludeMacroStack.back().TheMacroExpander;
657 IncludeMacroStack.pop_back();
658}
659
660//===----------------------------------------------------------------------===//
661// Macro Expansion Handling.
662//===----------------------------------------------------------------------===//
663
Chris Lattnercc1a8752007-10-07 08:44:20 +0000664/// setMacroInfo - Specify a macro for this identifier.
665///
666void Preprocessor::setMacroInfo(IdentifierInfo *II, MacroInfo *MI) {
667 if (MI == 0) {
668 if (II->hasMacroDefinition()) {
669 Macros.erase(II);
670 II->setHasMacroDefinition(false);
671 }
672 } else {
673 Macros[II] = MI;
674 II->setHasMacroDefinition(true);
675 }
676}
677
Reid Spencer5f016e22007-07-11 17:01:13 +0000678/// RegisterBuiltinMacro - Register the specified identifier in the identifier
679/// table and mark it as a builtin macro to be expanded.
680IdentifierInfo *Preprocessor::RegisterBuiltinMacro(const char *Name) {
681 // Get the identifier.
682 IdentifierInfo *Id = getIdentifierInfo(Name);
683
684 // Mark it as being a macro that is builtin.
685 MacroInfo *MI = new MacroInfo(SourceLocation());
686 MI->setIsBuiltinMacro();
Chris Lattnercc1a8752007-10-07 08:44:20 +0000687 setMacroInfo(Id, MI);
Reid Spencer5f016e22007-07-11 17:01:13 +0000688 return Id;
689}
690
691
692/// RegisterBuiltinMacros - Register builtin macros, such as __LINE__ with the
693/// identifier table.
694void Preprocessor::RegisterBuiltinMacros() {
695 Ident__LINE__ = RegisterBuiltinMacro("__LINE__");
696 Ident__FILE__ = RegisterBuiltinMacro("__FILE__");
697 Ident__DATE__ = RegisterBuiltinMacro("__DATE__");
698 Ident__TIME__ = RegisterBuiltinMacro("__TIME__");
699 Ident_Pragma = RegisterBuiltinMacro("_Pragma");
700
701 // GCC Extensions.
702 Ident__BASE_FILE__ = RegisterBuiltinMacro("__BASE_FILE__");
703 Ident__INCLUDE_LEVEL__ = RegisterBuiltinMacro("__INCLUDE_LEVEL__");
704 Ident__TIMESTAMP__ = RegisterBuiltinMacro("__TIMESTAMP__");
705}
706
707/// isTrivialSingleTokenExpansion - Return true if MI, which has a single token
708/// in its expansion, currently expands to that token literally.
709static bool isTrivialSingleTokenExpansion(const MacroInfo *MI,
Chris Lattnercc1a8752007-10-07 08:44:20 +0000710 const IdentifierInfo *MacroIdent,
711 Preprocessor &PP) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000712 IdentifierInfo *II = MI->getReplacementToken(0).getIdentifierInfo();
713
714 // If the token isn't an identifier, it's always literally expanded.
715 if (II == 0) return true;
716
717 // If the identifier is a macro, and if that macro is enabled, it may be
718 // expanded so it's not a trivial expansion.
Chris Lattnercc1a8752007-10-07 08:44:20 +0000719 if (II->hasMacroDefinition() && PP.getMacroInfo(II)->isEnabled() &&
Reid Spencer5f016e22007-07-11 17:01:13 +0000720 // Fast expanding "#define X X" is ok, because X would be disabled.
721 II != MacroIdent)
722 return false;
723
724 // If this is an object-like macro invocation, it is safe to trivially expand
725 // it.
726 if (MI->isObjectLike()) return true;
727
728 // If this is a function-like macro invocation, it's safe to trivially expand
729 // as long as the identifier is not a macro argument.
730 for (MacroInfo::arg_iterator I = MI->arg_begin(), E = MI->arg_end();
731 I != E; ++I)
732 if (*I == II)
733 return false; // Identifier is a macro argument.
734
735 return true;
736}
737
738
739/// isNextPPTokenLParen - Determine whether the next preprocessor token to be
740/// lexed is a '('. If so, consume the token and return true, if not, this
741/// method should have no observable side-effect on the lexed tokens.
742bool Preprocessor::isNextPPTokenLParen() {
743 // Do some quick tests for rejection cases.
744 unsigned Val;
745 if (CurLexer)
746 Val = CurLexer->isNextPPTokenLParen();
747 else
748 Val = CurMacroExpander->isNextTokenLParen();
749
750 if (Val == 2) {
Chris Lattner0ea793e2007-07-19 00:07:36 +0000751 // We have run off the end. If it's a source file we don't
752 // examine enclosing ones (C99 5.1.1.2p4). Otherwise walk up the
753 // macro stack.
754 if (CurLexer)
755 return false;
756 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000757 IncludeStackInfo &Entry = IncludeMacroStack[i-1];
758 if (Entry.TheLexer)
759 Val = Entry.TheLexer->isNextPPTokenLParen();
760 else
761 Val = Entry.TheMacroExpander->isNextTokenLParen();
Chris Lattner0ea793e2007-07-19 00:07:36 +0000762
763 if (Val != 2)
764 break;
765
766 // Ran off the end of a source file?
767 if (Entry.TheLexer)
768 return false;
Reid Spencer5f016e22007-07-11 17:01:13 +0000769 }
770 }
771
772 // Okay, if we know that the token is a '(', lex it and return. Otherwise we
773 // have found something that isn't a '(' or we found the end of the
774 // translation unit. In either case, return false.
775 if (Val != 1)
776 return false;
777
Chris Lattnerd2177732007-07-20 16:59:19 +0000778 Token Tok;
Reid Spencer5f016e22007-07-11 17:01:13 +0000779 LexUnexpandedToken(Tok);
Chris Lattner22f6bbc2007-10-09 18:02:16 +0000780 assert(Tok.is(tok::l_paren) && "Error computing l-paren-ness?");
Reid Spencer5f016e22007-07-11 17:01:13 +0000781 return true;
782}
783
784/// HandleMacroExpandedIdentifier - If an identifier token is read that is to be
785/// expanded as a macro, handle it and return the next token as 'Identifier'.
Chris Lattnerd2177732007-07-20 16:59:19 +0000786bool Preprocessor::HandleMacroExpandedIdentifier(Token &Identifier,
Reid Spencer5f016e22007-07-11 17:01:13 +0000787 MacroInfo *MI) {
Chris Lattner4d730462008-01-07 19:50:27 +0000788 // If this is a macro exapnsion in the "#if !defined(x)" line for the file,
789 // then the macro could expand to different things in other contexts, we need
790 // to disable the optimization in this case.
791 if (CurLexer) CurLexer->MIOpt.ExpandedMacro();
Reid Spencer5f016e22007-07-11 17:01:13 +0000792
793 // If this is a builtin macro, like __LINE__ or _Pragma, handle it specially.
794 if (MI->isBuiltinMacro()) {
795 ExpandBuiltinMacro(Identifier);
796 return false;
797 }
798
799 // If this is the first use of a target-specific macro, warn about it.
800 if (MI->isTargetSpecific()) {
801 MI->setIsTargetSpecific(false); // Don't warn on second use.
Ted Kremenek9c728dc2007-12-12 22:39:36 +0000802 getTargetInfo().DiagnoseNonPortability(getFullLoc(Identifier.getLocation()),
Reid Spencer5f016e22007-07-11 17:01:13 +0000803 diag::port_target_macro_use);
804 }
805
806 /// Args - If this is a function-like macro expansion, this contains,
807 /// for each macro argument, the list of tokens that were provided to the
808 /// invocation.
809 MacroArgs *Args = 0;
810
811 // If this is a function-like macro, read the arguments.
812 if (MI->isFunctionLike()) {
813 // C99 6.10.3p10: If the preprocessing token immediately after the the macro
Chris Lattner2b64fdc2007-07-19 16:11:58 +0000814 // name isn't a '(', this macro should not be expanded. Otherwise, consume
815 // it.
Reid Spencer5f016e22007-07-11 17:01:13 +0000816 if (!isNextPPTokenLParen())
817 return true;
818
819 // Remember that we are now parsing the arguments to a macro invocation.
820 // Preprocessor directives used inside macro arguments are not portable, and
821 // this enables the warning.
822 InMacroArgs = true;
823 Args = ReadFunctionLikeMacroArgs(Identifier, MI);
824
825 // Finished parsing args.
826 InMacroArgs = false;
827
828 // If there was an error parsing the arguments, bail out.
829 if (Args == 0) return false;
830
831 ++NumFnMacroExpanded;
832 } else {
833 ++NumMacroExpanded;
834 }
835
836 // Notice that this macro has been used.
837 MI->setIsUsed(true);
838
839 // If we started lexing a macro, enter the macro expansion body.
840
841 // If this macro expands to no tokens, don't bother to push it onto the
842 // expansion stack, only to take it right back off.
843 if (MI->getNumTokens() == 0) {
844 // No need for arg info.
845 if (Args) Args->destroy();
846
847 // Ignore this macro use, just return the next token in the current
848 // buffer.
849 bool HadLeadingSpace = Identifier.hasLeadingSpace();
850 bool IsAtStartOfLine = Identifier.isAtStartOfLine();
851
852 Lex(Identifier);
853
854 // If the identifier isn't on some OTHER line, inherit the leading
855 // whitespace/first-on-a-line property of this token. This handles
856 // stuff like "! XX," -> "! ," and " XX," -> " ,", when XX is
857 // empty.
858 if (!Identifier.isAtStartOfLine()) {
Chris Lattnerd2177732007-07-20 16:59:19 +0000859 if (IsAtStartOfLine) Identifier.setFlag(Token::StartOfLine);
860 if (HadLeadingSpace) Identifier.setFlag(Token::LeadingSpace);
Reid Spencer5f016e22007-07-11 17:01:13 +0000861 }
862 ++NumFastMacroExpanded;
863 return false;
864
865 } else if (MI->getNumTokens() == 1 &&
Chris Lattnercc1a8752007-10-07 08:44:20 +0000866 isTrivialSingleTokenExpansion(MI, Identifier.getIdentifierInfo(),
867 *this)){
Reid Spencer5f016e22007-07-11 17:01:13 +0000868 // Otherwise, if this macro expands into a single trivially-expanded
869 // token: expand it now. This handles common cases like
870 // "#define VAL 42".
871
872 // Propagate the isAtStartOfLine/hasLeadingSpace markers of the macro
873 // identifier to the expanded token.
874 bool isAtStartOfLine = Identifier.isAtStartOfLine();
875 bool hasLeadingSpace = Identifier.hasLeadingSpace();
876
877 // Remember where the token is instantiated.
878 SourceLocation InstantiateLoc = Identifier.getLocation();
879
880 // Replace the result token.
881 Identifier = MI->getReplacementToken(0);
882
883 // Restore the StartOfLine/LeadingSpace markers.
Chris Lattnerd2177732007-07-20 16:59:19 +0000884 Identifier.setFlagValue(Token::StartOfLine , isAtStartOfLine);
885 Identifier.setFlagValue(Token::LeadingSpace, hasLeadingSpace);
Reid Spencer5f016e22007-07-11 17:01:13 +0000886
887 // Update the tokens location to include both its logical and physical
888 // locations.
889 SourceLocation Loc =
890 SourceMgr.getInstantiationLoc(Identifier.getLocation(), InstantiateLoc);
891 Identifier.setLocation(Loc);
892
893 // If this is #define X X, we must mark the result as unexpandible.
894 if (IdentifierInfo *NewII = Identifier.getIdentifierInfo())
Chris Lattnercc1a8752007-10-07 08:44:20 +0000895 if (getMacroInfo(NewII) == MI)
Chris Lattnerd2177732007-07-20 16:59:19 +0000896 Identifier.setFlag(Token::DisableExpand);
Reid Spencer5f016e22007-07-11 17:01:13 +0000897
898 // Since this is not an identifier token, it can't be macro expanded, so
899 // we're done.
900 ++NumFastMacroExpanded;
901 return false;
902 }
903
904 // Start expanding the macro.
905 EnterMacro(Identifier, Args);
906
907 // Now that the macro is at the top of the include stack, ask the
908 // preprocessor to read the next token from it.
909 Lex(Identifier);
910 return false;
911}
912
913/// ReadFunctionLikeMacroArgs - After reading "MACRO(", this method is
914/// invoked to read all of the actual arguments specified for the macro
915/// invocation. This returns null on error.
Chris Lattnerd2177732007-07-20 16:59:19 +0000916MacroArgs *Preprocessor::ReadFunctionLikeMacroArgs(Token &MacroName,
Reid Spencer5f016e22007-07-11 17:01:13 +0000917 MacroInfo *MI) {
918 // The number of fixed arguments to parse.
919 unsigned NumFixedArgsLeft = MI->getNumArgs();
920 bool isVariadic = MI->isVariadic();
921
922 // Outer loop, while there are more arguments, keep reading them.
Chris Lattnerd2177732007-07-20 16:59:19 +0000923 Token Tok;
Reid Spencer5f016e22007-07-11 17:01:13 +0000924 Tok.setKind(tok::comma);
925 --NumFixedArgsLeft; // Start reading the first arg.
926
927 // ArgTokens - Build up a list of tokens that make up each argument. Each
928 // argument is separated by an EOF token. Use a SmallVector so we can avoid
929 // heap allocations in the common case.
Chris Lattnerd2177732007-07-20 16:59:19 +0000930 llvm::SmallVector<Token, 64> ArgTokens;
Reid Spencer5f016e22007-07-11 17:01:13 +0000931
932 unsigned NumActuals = 0;
Chris Lattner22f6bbc2007-10-09 18:02:16 +0000933 while (Tok.is(tok::comma)) {
Chris Lattner2b64fdc2007-07-19 16:11:58 +0000934 // C99 6.10.3p11: Keep track of the number of l_parens we have seen. Note
935 // that we already consumed the first one.
Reid Spencer5f016e22007-07-11 17:01:13 +0000936 unsigned NumParens = 0;
937
938 while (1) {
939 // Read arguments as unexpanded tokens. This avoids issues, e.g., where
940 // an argument value in a macro could expand to ',' or '(' or ')'.
941 LexUnexpandedToken(Tok);
942
Chris Lattnerc21d9e42008-01-22 19:34:51 +0000943 if (Tok.is(tok::eof) || Tok.is(tok::eom)) { // "#if f(<eof>" & "#if f(\n"
Reid Spencer5f016e22007-07-11 17:01:13 +0000944 Diag(MacroName, diag::err_unterm_macro_invoc);
Chris Lattnerc21d9e42008-01-22 19:34:51 +0000945 // Do not lose the EOF/EOM. Return it to the client.
Reid Spencer5f016e22007-07-11 17:01:13 +0000946 MacroName = Tok;
947 return 0;
Chris Lattner22f6bbc2007-10-09 18:02:16 +0000948 } else if (Tok.is(tok::r_paren)) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000949 // If we found the ) token, the macro arg list is done.
950 if (NumParens-- == 0)
951 break;
Chris Lattner22f6bbc2007-10-09 18:02:16 +0000952 } else if (Tok.is(tok::l_paren)) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000953 ++NumParens;
Chris Lattner22f6bbc2007-10-09 18:02:16 +0000954 } else if (Tok.is(tok::comma) && NumParens == 0) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000955 // Comma ends this argument if there are more fixed arguments expected.
956 if (NumFixedArgsLeft)
957 break;
958
959 // If this is not a variadic macro, too many args were specified.
960 if (!isVariadic) {
961 // Emit the diagnostic at the macro name in case there is a missing ).
962 // Emitting it at the , could be far away from the macro name.
963 Diag(MacroName, diag::err_too_many_args_in_macro_invoc);
964 return 0;
965 }
966 // Otherwise, continue to add the tokens to this variable argument.
Chris Lattner22f6bbc2007-10-09 18:02:16 +0000967 } else if (Tok.is(tok::comment) && !KeepMacroComments) {
Reid Spencer5f016e22007-07-11 17:01:13 +0000968 // If this is a comment token in the argument list and we're just in
969 // -C mode (not -CC mode), discard the comment.
970 continue;
Chris Lattner0c3eb292007-11-23 06:50:21 +0000971 } else if (Tok.is(tok::identifier)) {
972 // Reading macro arguments can cause macros that we are currently
973 // expanding from to be popped off the expansion stack. Doing so causes
974 // them to be reenabled for expansion. Here we record whether any
975 // identifiers we lex as macro arguments correspond to disabled macros.
976 // If so, we mark the token as noexpand. This is a subtle aspect of
977 // C99 6.10.3.4p2.
978 if (MacroInfo *MI = getMacroInfo(Tok.getIdentifierInfo()))
979 if (!MI->isEnabled())
980 Tok.setFlag(Token::DisableExpand);
Reid Spencer5f016e22007-07-11 17:01:13 +0000981 }
982
983 ArgTokens.push_back(Tok);
984 }
985
986 // Empty arguments are standard in C99 and supported as an extension in
987 // other modes.
988 if (ArgTokens.empty() && !Features.C99)
989 Diag(Tok, diag::ext_empty_fnmacro_arg);
990
991 // Add a marker EOF token to the end of the token list for this argument.
Chris Lattnerd2177732007-07-20 16:59:19 +0000992 Token EOFTok;
Reid Spencer5f016e22007-07-11 17:01:13 +0000993 EOFTok.startToken();
994 EOFTok.setKind(tok::eof);
995 EOFTok.setLocation(Tok.getLocation());
996 EOFTok.setLength(0);
997 ArgTokens.push_back(EOFTok);
998 ++NumActuals;
999 --NumFixedArgsLeft;
1000 };
1001
1002 // Okay, we either found the r_paren. Check to see if we parsed too few
1003 // arguments.
1004 unsigned MinArgsExpected = MI->getNumArgs();
1005
1006 // See MacroArgs instance var for description of this.
1007 bool isVarargsElided = false;
1008
1009 if (NumActuals < MinArgsExpected) {
1010 // There are several cases where too few arguments is ok, handle them now.
1011 if (NumActuals+1 == MinArgsExpected && MI->isVariadic()) {
1012 // Varargs where the named vararg parameter is missing: ok as extension.
1013 // #define A(x, ...)
1014 // A("blah")
1015 Diag(Tok, diag::ext_missing_varargs_arg);
1016
1017 // Remember this occurred if this is a C99 macro invocation with at least
1018 // one actual argument.
1019 isVarargsElided = MI->isC99Varargs() && MI->getNumArgs() > 1;
1020 } else if (MI->getNumArgs() == 1) {
1021 // #define A(x)
1022 // A()
1023 // is ok because it is an empty argument.
1024
1025 // Empty arguments are standard in C99 and supported as an extension in
1026 // other modes.
1027 if (ArgTokens.empty() && !Features.C99)
1028 Diag(Tok, diag::ext_empty_fnmacro_arg);
1029 } else {
1030 // Otherwise, emit the error.
1031 Diag(Tok, diag::err_too_few_args_in_macro_invoc);
1032 return 0;
1033 }
1034
1035 // Add a marker EOF token to the end of the token list for this argument.
1036 SourceLocation EndLoc = Tok.getLocation();
1037 Tok.startToken();
1038 Tok.setKind(tok::eof);
1039 Tok.setLocation(EndLoc);
1040 Tok.setLength(0);
1041 ArgTokens.push_back(Tok);
1042 }
1043
1044 return MacroArgs::create(MI, &ArgTokens[0], ArgTokens.size(),isVarargsElided);
1045}
1046
1047/// ComputeDATE_TIME - Compute the current time, enter it into the specified
1048/// scratch buffer, then return DATELoc/TIMELoc locations with the position of
1049/// the identifier tokens inserted.
1050static void ComputeDATE_TIME(SourceLocation &DATELoc, SourceLocation &TIMELoc,
1051 Preprocessor &PP) {
1052 time_t TT = time(0);
1053 struct tm *TM = localtime(&TT);
1054
1055 static const char * const Months[] = {
1056 "Jan","Feb","Mar","Apr","May","Jun","Jul","Aug","Sep","Oct","Nov","Dec"
1057 };
1058
1059 char TmpBuffer[100];
1060 sprintf(TmpBuffer, "\"%s %2d %4d\"", Months[TM->tm_mon], TM->tm_mday,
1061 TM->tm_year+1900);
1062 DATELoc = PP.CreateString(TmpBuffer, strlen(TmpBuffer));
1063
1064 sprintf(TmpBuffer, "\"%02d:%02d:%02d\"", TM->tm_hour, TM->tm_min, TM->tm_sec);
1065 TIMELoc = PP.CreateString(TmpBuffer, strlen(TmpBuffer));
1066}
1067
1068/// ExpandBuiltinMacro - If an identifier token is read that is to be expanded
1069/// as a builtin macro, handle it and return the next token as 'Tok'.
Chris Lattnerd2177732007-07-20 16:59:19 +00001070void Preprocessor::ExpandBuiltinMacro(Token &Tok) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001071 // Figure out which token this is.
1072 IdentifierInfo *II = Tok.getIdentifierInfo();
1073 assert(II && "Can't be a macro without id info!");
1074
1075 // If this is an _Pragma directive, expand it, invoke the pragma handler, then
1076 // lex the token after it.
1077 if (II == Ident_Pragma)
1078 return Handle_Pragma(Tok);
1079
1080 ++NumBuiltinMacroExpanded;
1081
1082 char TmpBuffer[100];
1083
1084 // Set up the return result.
1085 Tok.setIdentifierInfo(0);
Chris Lattnerd2177732007-07-20 16:59:19 +00001086 Tok.clearFlag(Token::NeedsCleaning);
Reid Spencer5f016e22007-07-11 17:01:13 +00001087
1088 if (II == Ident__LINE__) {
1089 // __LINE__ expands to a simple numeric value.
Chris Lattner9dc1f532007-07-20 16:37:10 +00001090 sprintf(TmpBuffer, "%u", SourceMgr.getLogicalLineNumber(Tok.getLocation()));
Reid Spencer5f016e22007-07-11 17:01:13 +00001091 unsigned Length = strlen(TmpBuffer);
1092 Tok.setKind(tok::numeric_constant);
1093 Tok.setLength(Length);
1094 Tok.setLocation(CreateString(TmpBuffer, Length, Tok.getLocation()));
1095 } else if (II == Ident__FILE__ || II == Ident__BASE_FILE__) {
1096 SourceLocation Loc = Tok.getLocation();
1097 if (II == Ident__BASE_FILE__) {
1098 Diag(Tok, diag::ext_pp_base_file);
Chris Lattner9dc1f532007-07-20 16:37:10 +00001099 SourceLocation NextLoc = SourceMgr.getIncludeLoc(Loc);
1100 while (NextLoc.isValid()) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001101 Loc = NextLoc;
Chris Lattner9dc1f532007-07-20 16:37:10 +00001102 NextLoc = SourceMgr.getIncludeLoc(Loc);
Reid Spencer5f016e22007-07-11 17:01:13 +00001103 }
1104 }
1105
1106 // Escape this filename. Turn '\' -> '\\' '"' -> '\"'
Chris Lattner9dc1f532007-07-20 16:37:10 +00001107 std::string FN = SourceMgr.getSourceName(SourceMgr.getLogicalLoc(Loc));
Reid Spencer5f016e22007-07-11 17:01:13 +00001108 FN = '"' + Lexer::Stringify(FN) + '"';
1109 Tok.setKind(tok::string_literal);
1110 Tok.setLength(FN.size());
1111 Tok.setLocation(CreateString(&FN[0], FN.size(), Tok.getLocation()));
1112 } else if (II == Ident__DATE__) {
1113 if (!DATELoc.isValid())
1114 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1115 Tok.setKind(tok::string_literal);
1116 Tok.setLength(strlen("\"Mmm dd yyyy\""));
1117 Tok.setLocation(SourceMgr.getInstantiationLoc(DATELoc, Tok.getLocation()));
1118 } else if (II == Ident__TIME__) {
1119 if (!TIMELoc.isValid())
1120 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1121 Tok.setKind(tok::string_literal);
1122 Tok.setLength(strlen("\"hh:mm:ss\""));
1123 Tok.setLocation(SourceMgr.getInstantiationLoc(TIMELoc, Tok.getLocation()));
1124 } else if (II == Ident__INCLUDE_LEVEL__) {
1125 Diag(Tok, diag::ext_pp_include_level);
1126
1127 // Compute the include depth of this token.
1128 unsigned Depth = 0;
Chris Lattner9dc1f532007-07-20 16:37:10 +00001129 SourceLocation Loc = SourceMgr.getIncludeLoc(Tok.getLocation());
1130 for (; Loc.isValid(); ++Depth)
1131 Loc = SourceMgr.getIncludeLoc(Loc);
Reid Spencer5f016e22007-07-11 17:01:13 +00001132
1133 // __INCLUDE_LEVEL__ expands to a simple numeric value.
1134 sprintf(TmpBuffer, "%u", Depth);
1135 unsigned Length = strlen(TmpBuffer);
1136 Tok.setKind(tok::numeric_constant);
1137 Tok.setLength(Length);
1138 Tok.setLocation(CreateString(TmpBuffer, Length, Tok.getLocation()));
1139 } else if (II == Ident__TIMESTAMP__) {
1140 // MSVC, ICC, GCC, VisualAge C++ extension. The generated string should be
1141 // of the form "Ddd Mmm dd hh::mm::ss yyyy", which is returned by asctime.
1142 Diag(Tok, diag::ext_pp_timestamp);
1143
1144 // Get the file that we are lexing out of. If we're currently lexing from
1145 // a macro, dig into the include stack.
1146 const FileEntry *CurFile = 0;
1147 Lexer *TheLexer = getCurrentFileLexer();
1148
1149 if (TheLexer)
Chris Lattner9dc1f532007-07-20 16:37:10 +00001150 CurFile = SourceMgr.getFileEntryForLoc(TheLexer->getFileLoc());
Reid Spencer5f016e22007-07-11 17:01:13 +00001151
1152 // If this file is older than the file it depends on, emit a diagnostic.
1153 const char *Result;
1154 if (CurFile) {
1155 time_t TT = CurFile->getModificationTime();
1156 struct tm *TM = localtime(&TT);
1157 Result = asctime(TM);
1158 } else {
1159 Result = "??? ??? ?? ??:??:?? ????\n";
1160 }
1161 TmpBuffer[0] = '"';
1162 strcpy(TmpBuffer+1, Result);
1163 unsigned Len = strlen(TmpBuffer);
1164 TmpBuffer[Len-1] = '"'; // Replace the newline with a quote.
1165 Tok.setKind(tok::string_literal);
1166 Tok.setLength(Len);
1167 Tok.setLocation(CreateString(TmpBuffer, Len, Tok.getLocation()));
1168 } else {
1169 assert(0 && "Unknown identifier!");
Chris Lattnerc3d8d572007-12-09 20:31:55 +00001170 }
Reid Spencer5f016e22007-07-11 17:01:13 +00001171}
1172
1173//===----------------------------------------------------------------------===//
1174// Lexer Event Handling.
1175//===----------------------------------------------------------------------===//
1176
1177/// LookUpIdentifierInfo - Given a tok::identifier token, look up the
1178/// identifier information for the token and install it into the token.
Chris Lattnerd2177732007-07-20 16:59:19 +00001179IdentifierInfo *Preprocessor::LookUpIdentifierInfo(Token &Identifier,
Reid Spencer5f016e22007-07-11 17:01:13 +00001180 const char *BufPtr) {
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001181 assert(Identifier.is(tok::identifier) && "Not an identifier!");
Reid Spencer5f016e22007-07-11 17:01:13 +00001182 assert(Identifier.getIdentifierInfo() == 0 && "Identinfo already exists!");
1183
1184 // Look up this token, see if it is a macro, or if it is a language keyword.
1185 IdentifierInfo *II;
1186 if (BufPtr && !Identifier.needsCleaning()) {
1187 // No cleaning needed, just use the characters from the lexed buffer.
1188 II = getIdentifierInfo(BufPtr, BufPtr+Identifier.getLength());
1189 } else {
1190 // Cleaning needed, alloca a buffer, clean into it, then use the buffer.
Chris Lattnerc35717a2007-07-13 17:10:38 +00001191 llvm::SmallVector<char, 64> IdentifierBuffer;
1192 IdentifierBuffer.resize(Identifier.getLength());
1193 const char *TmpBuf = &IdentifierBuffer[0];
Reid Spencer5f016e22007-07-11 17:01:13 +00001194 unsigned Size = getSpelling(Identifier, TmpBuf);
1195 II = getIdentifierInfo(TmpBuf, TmpBuf+Size);
1196 }
1197 Identifier.setIdentifierInfo(II);
1198 return II;
1199}
1200
1201
1202/// HandleIdentifier - This callback is invoked when the lexer reads an
1203/// identifier. This callback looks up the identifier in the map and/or
1204/// potentially macro expands it or turns it into a named token (like 'for').
Chris Lattnerd2177732007-07-20 16:59:19 +00001205void Preprocessor::HandleIdentifier(Token &Identifier) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001206 assert(Identifier.getIdentifierInfo() &&
1207 "Can't handle identifiers without identifier info!");
1208
1209 IdentifierInfo &II = *Identifier.getIdentifierInfo();
1210
1211 // If this identifier was poisoned, and if it was not produced from a macro
1212 // expansion, emit an error.
1213 if (II.isPoisoned() && CurLexer) {
1214 if (&II != Ident__VA_ARGS__) // We warn about __VA_ARGS__ with poisoning.
1215 Diag(Identifier, diag::err_pp_used_poisoned_id);
1216 else
1217 Diag(Identifier, diag::ext_pp_bad_vaargs_use);
1218 }
1219
1220 // If this is a macro to be expanded, do it.
Chris Lattnercc1a8752007-10-07 08:44:20 +00001221 if (MacroInfo *MI = getMacroInfo(&II)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001222 if (!DisableMacroExpansion && !Identifier.isExpandDisabled()) {
1223 if (MI->isEnabled()) {
1224 if (!HandleMacroExpandedIdentifier(Identifier, MI))
1225 return;
1226 } else {
1227 // C99 6.10.3.4p2 says that a disabled macro may never again be
1228 // expanded, even if it's in a context where it could be expanded in the
1229 // future.
Chris Lattnerd2177732007-07-20 16:59:19 +00001230 Identifier.setFlag(Token::DisableExpand);
Reid Spencer5f016e22007-07-11 17:01:13 +00001231 }
1232 }
1233 } else if (II.isOtherTargetMacro() && !DisableMacroExpansion) {
1234 // If this identifier is a macro on some other target, emit a diagnostic.
1235 // This diagnosic is only emitted when macro expansion is enabled, because
1236 // the macro would not have been expanded for the other target either.
1237 II.setIsOtherTargetMacro(false); // Don't warn on second use.
Ted Kremenek9c728dc2007-12-12 22:39:36 +00001238 getTargetInfo().DiagnoseNonPortability(getFullLoc(Identifier.getLocation()),
Reid Spencer5f016e22007-07-11 17:01:13 +00001239 diag::port_target_macro_use);
1240
1241 }
1242
1243 // C++ 2.11p2: If this is an alternative representation of a C++ operator,
1244 // then we act as if it is the actual operator and not the textual
1245 // representation of it.
1246 if (II.isCPlusPlusOperatorKeyword())
1247 Identifier.setIdentifierInfo(0);
1248
1249 // Change the kind of this identifier to the appropriate token kind, e.g.
1250 // turning "for" into a keyword.
1251 Identifier.setKind(II.getTokenID());
1252
1253 // If this is an extension token, diagnose its use.
1254 // FIXME: tried (unsuccesfully) to shut this up when compiling with gnu99
1255 // For now, I'm just commenting it out (while I work on attributes).
1256 if (II.isExtensionToken() && Features.C99)
1257 Diag(Identifier, diag::ext_token_used);
1258}
1259
1260/// HandleEndOfFile - This callback is invoked when the lexer hits the end of
1261/// the current file. This either returns the EOF token or pops a level off
1262/// the include stack and keeps going.
Chris Lattnerd2177732007-07-20 16:59:19 +00001263bool Preprocessor::HandleEndOfFile(Token &Result, bool isEndOfMacro) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001264 assert(!CurMacroExpander &&
1265 "Ending a file when currently in a macro!");
1266
1267 // See if this file had a controlling macro.
1268 if (CurLexer) { // Not ending a macro, ignore it.
1269 if (const IdentifierInfo *ControllingMacro =
1270 CurLexer->MIOpt.GetControllingMacroAtEndOfFile()) {
1271 // Okay, this has a controlling macro, remember in PerFileInfo.
1272 if (const FileEntry *FE =
Chris Lattner9dc1f532007-07-20 16:37:10 +00001273 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
Reid Spencer5f016e22007-07-11 17:01:13 +00001274 HeaderInfo.SetFileControllingMacro(FE, ControllingMacro);
1275 }
1276 }
1277
1278 // If this is a #include'd file, pop it off the include stack and continue
1279 // lexing the #includer file.
1280 if (!IncludeMacroStack.empty()) {
1281 // We're done with the #included file.
1282 RemoveTopOfLexerStack();
1283
1284 // Notify the client, if desired, that we are in a new source file.
1285 if (Callbacks && !isEndOfMacro && CurLexer) {
1286 DirectoryLookup::DirType FileType = DirectoryLookup::NormalHeaderDir;
1287
1288 // Get the file entry for the current file.
1289 if (const FileEntry *FE =
Chris Lattner9dc1f532007-07-20 16:37:10 +00001290 SourceMgr.getFileEntryForLoc(CurLexer->getFileLoc()))
Reid Spencer5f016e22007-07-11 17:01:13 +00001291 FileType = HeaderInfo.getFileDirFlavor(FE);
1292
1293 Callbacks->FileChanged(CurLexer->getSourceLocation(CurLexer->BufferPtr),
1294 PPCallbacks::ExitFile, FileType);
1295 }
1296
1297 // Client should lex another token.
1298 return false;
1299 }
Chris Lattner09cf90f2008-01-25 00:00:30 +00001300
1301 // If the file ends with a newline, form the EOF token on the newline itself,
1302 // rather than "on the line following it", which doesn't exist. This makes
1303 // diagnostics relating to the end of file include the last file that the user
1304 // actually typed, which is goodness.
1305 const char *EndPos = CurLexer->BufferEnd;
1306 if (EndPos != CurLexer->BufferStart &&
1307 (EndPos[-1] == '\n' || EndPos[-1] == '\r')) {
1308 --EndPos;
1309
1310 // Handle \n\r and \r\n:
1311 if (EndPos != CurLexer->BufferStart &&
1312 (EndPos[-1] == '\n' || EndPos[-1] == '\r') &&
1313 EndPos[-1] != EndPos[0])
1314 --EndPos;
1315 }
Reid Spencer5f016e22007-07-11 17:01:13 +00001316
1317 Result.startToken();
Chris Lattner09cf90f2008-01-25 00:00:30 +00001318 CurLexer->BufferPtr = EndPos;
1319 CurLexer->FormTokenWithChars(Result, EndPos);
Reid Spencer5f016e22007-07-11 17:01:13 +00001320 Result.setKind(tok::eof);
1321
1322 // We're done with the #included file.
1323 delete CurLexer;
1324 CurLexer = 0;
1325
1326 // This is the end of the top-level file. If the diag::pp_macro_not_used
Chris Lattnercc1a8752007-10-07 08:44:20 +00001327 // diagnostic is enabled, look for macros that have not been used.
Reid Spencer5f016e22007-07-11 17:01:13 +00001328 if (Diags.getDiagnosticLevel(diag::pp_macro_not_used) != Diagnostic::Ignored){
Chris Lattnercc1a8752007-10-07 08:44:20 +00001329 for (llvm::DenseMap<IdentifierInfo*, MacroInfo*>::iterator I =
1330 Macros.begin(), E = Macros.end(); I != E; ++I) {
1331 if (!I->second->isUsed())
1332 Diag(I->second->getDefinitionLoc(), diag::pp_macro_not_used);
Reid Spencer5f016e22007-07-11 17:01:13 +00001333 }
1334 }
Reid Spencer5f016e22007-07-11 17:01:13 +00001335 return true;
1336}
1337
1338/// HandleEndOfMacro - This callback is invoked when the lexer hits the end of
1339/// the current macro expansion or token stream expansion.
Chris Lattnerd2177732007-07-20 16:59:19 +00001340bool Preprocessor::HandleEndOfMacro(Token &Result) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001341 assert(CurMacroExpander && !CurLexer &&
1342 "Ending a macro when currently in a #include file!");
1343
Chris Lattner9594acf2007-07-15 00:25:26 +00001344 // Delete or cache the now-dead macro expander.
1345 if (NumCachedMacroExpanders == MacroExpanderCacheSize)
1346 delete CurMacroExpander;
1347 else
1348 MacroExpanderCache[NumCachedMacroExpanders++] = CurMacroExpander;
Reid Spencer5f016e22007-07-11 17:01:13 +00001349
1350 // Handle this like a #include file being popped off the stack.
1351 CurMacroExpander = 0;
1352 return HandleEndOfFile(Result, true);
1353}
1354
1355
1356//===----------------------------------------------------------------------===//
1357// Utility Methods for Preprocessor Directive Handling.
1358//===----------------------------------------------------------------------===//
1359
1360/// DiscardUntilEndOfDirective - Read and discard all tokens remaining on the
1361/// current line until the tok::eom token is found.
1362void Preprocessor::DiscardUntilEndOfDirective() {
Chris Lattnerd2177732007-07-20 16:59:19 +00001363 Token Tmp;
Reid Spencer5f016e22007-07-11 17:01:13 +00001364 do {
1365 LexUnexpandedToken(Tmp);
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001366 } while (Tmp.isNot(tok::eom));
Reid Spencer5f016e22007-07-11 17:01:13 +00001367}
1368
/// isCXXNamedOperator - Returns "true" if Spelling is one of the C++
/// alternative operator representations that are spelled like identifiers:
/// and, and_eq, bitand, bitor, compl, not, not_eq, or, or_eq, xor, xor_eq.
/// The comparison is exact and case-sensitive.
static bool isCXXNamedOperator(const std::string &Spelling) {
  // Complete list of the identifier-like alternative tokens, including the
  // compound-assignment forms (and_eq, or_eq, xor_eq).
  static const char * const NamedOperators[] = {
    "and", "and_eq", "bitand", "bitor", "compl", "not",
    "not_eq", "or", "or_eq", "xor", "xor_eq"
  };
  const unsigned NumNamedOperators =
    sizeof(NamedOperators) / sizeof(NamedOperators[0]);

  for (unsigned i = 0; i != NumNamedOperators; ++i)
    if (Spelling == NamedOperators[i])
      return true;
  return false;
}
1375
1376/// ReadMacroName - Lex and validate a macro name, which occurs after a
1377/// #define or #undef. This sets the token kind to eom and discards the rest
1378/// of the macro line if the macro name is invalid. isDefineUndef is 1 if
1379/// this is due to a a #define, 2 if #undef directive, 0 if it is something
1380/// else (e.g. #ifdef).
Chris Lattnerd2177732007-07-20 16:59:19 +00001381void Preprocessor::ReadMacroName(Token &MacroNameTok, char isDefineUndef) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001382 // Read the token, don't allow macro expansion on it.
1383 LexUnexpandedToken(MacroNameTok);
1384
1385 // Missing macro name?
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001386 if (MacroNameTok.is(tok::eom))
Reid Spencer5f016e22007-07-11 17:01:13 +00001387 return Diag(MacroNameTok, diag::err_pp_missing_macro_name);
1388
1389 IdentifierInfo *II = MacroNameTok.getIdentifierInfo();
1390 if (II == 0) {
1391 std::string Spelling = getSpelling(MacroNameTok);
1392 if (isCXXNamedOperator(Spelling))
1393 // C++ 2.5p2: Alternative tokens behave the same as its primary token
1394 // except for their spellings.
1395 Diag(MacroNameTok, diag::err_pp_operator_used_as_macro_name, Spelling);
1396 else
1397 Diag(MacroNameTok, diag::err_pp_macro_not_identifier);
1398 // Fall through on error.
1399 } else if (isDefineUndef && II->getPPKeywordID() == tok::pp_defined) {
1400 // Error if defining "defined": C99 6.10.8.4.
1401 Diag(MacroNameTok, diag::err_defined_macro_name);
Chris Lattner0edde552007-10-07 08:04:56 +00001402 } else if (isDefineUndef && II->hasMacroDefinition() &&
Chris Lattnercc1a8752007-10-07 08:44:20 +00001403 getMacroInfo(II)->isBuiltinMacro()) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001404 // Error if defining "__LINE__" and other builtins: C99 6.10.8.4.
1405 if (isDefineUndef == 1)
1406 Diag(MacroNameTok, diag::pp_redef_builtin_macro);
1407 else
1408 Diag(MacroNameTok, diag::pp_undef_builtin_macro);
1409 } else {
1410 // Okay, we got a good identifier node. Return it.
1411 return;
1412 }
1413
1414 // Invalid macro name, read and discard the rest of the line. Then set the
1415 // token kind to tok::eom.
1416 MacroNameTok.setKind(tok::eom);
1417 return DiscardUntilEndOfDirective();
1418}
1419
1420/// CheckEndOfDirective - Ensure that the next token is a tok::eom token. If
1421/// not, emit a diagnostic and consume up until the eom.
1422void Preprocessor::CheckEndOfDirective(const char *DirType) {
Chris Lattnerd2177732007-07-20 16:59:19 +00001423 Token Tmp;
Reid Spencer5f016e22007-07-11 17:01:13 +00001424 Lex(Tmp);
1425 // There should be no tokens after the directive, but we allow them as an
1426 // extension.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001427 while (Tmp.is(tok::comment)) // Skip comments in -C mode.
Reid Spencer5f016e22007-07-11 17:01:13 +00001428 Lex(Tmp);
1429
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001430 if (Tmp.isNot(tok::eom)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001431 Diag(Tmp, diag::ext_pp_extra_tokens_at_eol, DirType);
1432 DiscardUntilEndOfDirective();
1433 }
1434}
1435
1436
1437
1438/// SkipExcludedConditionalBlock - We just read a #if or related directive and
1439/// decided that the subsequent tokens are in the #if'd out portion of the
1440/// file. Lex the rest of the file, until we see an #endif. If
1441/// FoundNonSkipPortion is true, then we have already emitted code for part of
1442/// this #if directive, so #else/#elif blocks should never be entered. If ElseOk
1443/// is true, then #else directives are ok, if not, then we have already seen one
1444/// so a #else directive is a duplicate. When this returns, the caller can lex
1445/// the first valid token.
1446void Preprocessor::SkipExcludedConditionalBlock(SourceLocation IfTokenLoc,
1447 bool FoundNonSkipPortion,
1448 bool FoundElse) {
1449 ++NumSkipped;
1450 assert(CurMacroExpander == 0 && CurLexer &&
1451 "Lexing a macro, not a file?");
1452
1453 CurLexer->pushConditionalLevel(IfTokenLoc, /*isSkipping*/false,
1454 FoundNonSkipPortion, FoundElse);
1455
1456 // Enter raw mode to disable identifier lookup (and thus macro expansion),
1457 // disabling warnings, etc.
1458 CurLexer->LexingRawMode = true;
Chris Lattnerd2177732007-07-20 16:59:19 +00001459 Token Tok;
Reid Spencer5f016e22007-07-11 17:01:13 +00001460 while (1) {
1461 CurLexer->Lex(Tok);
1462
1463 // If this is the end of the buffer, we have an error.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001464 if (Tok.is(tok::eof)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001465 // Emit errors for each unterminated conditional on the stack, including
1466 // the current one.
1467 while (!CurLexer->ConditionalStack.empty()) {
1468 Diag(CurLexer->ConditionalStack.back().IfLoc,
1469 diag::err_pp_unterminated_conditional);
1470 CurLexer->ConditionalStack.pop_back();
1471 }
1472
1473 // Just return and let the caller lex after this #include.
1474 break;
1475 }
1476
1477 // If this token is not a preprocessor directive, just skip it.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001478 if (Tok.isNot(tok::hash) || !Tok.isAtStartOfLine())
Reid Spencer5f016e22007-07-11 17:01:13 +00001479 continue;
1480
1481 // We just parsed a # character at the start of a line, so we're in
1482 // directive mode. Tell the lexer this so any newlines we see will be
1483 // converted into an EOM token (this terminates the macro).
1484 CurLexer->ParsingPreprocessorDirective = true;
1485 CurLexer->KeepCommentMode = false;
1486
1487
1488 // Read the next token, the directive flavor.
1489 LexUnexpandedToken(Tok);
1490
1491 // If this isn't an identifier directive (e.g. is "# 1\n" or "#\n", or
1492 // something bogus), skip it.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001493 if (Tok.isNot(tok::identifier)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001494 CurLexer->ParsingPreprocessorDirective = false;
1495 // Restore comment saving mode.
1496 CurLexer->KeepCommentMode = KeepComments;
1497 continue;
1498 }
1499
1500 // If the first letter isn't i or e, it isn't intesting to us. We know that
1501 // this is safe in the face of spelling differences, because there is no way
1502 // to spell an i/e in a strange way that is another letter. Skipping this
1503 // allows us to avoid looking up the identifier info for #define/#undef and
1504 // other common directives.
1505 const char *RawCharData = SourceMgr.getCharacterData(Tok.getLocation());
1506 char FirstChar = RawCharData[0];
1507 if (FirstChar >= 'a' && FirstChar <= 'z' &&
1508 FirstChar != 'i' && FirstChar != 'e') {
1509 CurLexer->ParsingPreprocessorDirective = false;
1510 // Restore comment saving mode.
1511 CurLexer->KeepCommentMode = KeepComments;
1512 continue;
1513 }
1514
1515 // Get the identifier name without trigraphs or embedded newlines. Note
1516 // that we can't use Tok.getIdentifierInfo() because its lookup is disabled
1517 // when skipping.
1518 // TODO: could do this with zero copies in the no-clean case by using
1519 // strncmp below.
1520 char Directive[20];
1521 unsigned IdLen;
1522 if (!Tok.needsCleaning() && Tok.getLength() < 20) {
1523 IdLen = Tok.getLength();
1524 memcpy(Directive, RawCharData, IdLen);
1525 Directive[IdLen] = 0;
1526 } else {
1527 std::string DirectiveStr = getSpelling(Tok);
1528 IdLen = DirectiveStr.size();
1529 if (IdLen >= 20) {
1530 CurLexer->ParsingPreprocessorDirective = false;
1531 // Restore comment saving mode.
1532 CurLexer->KeepCommentMode = KeepComments;
1533 continue;
1534 }
1535 memcpy(Directive, &DirectiveStr[0], IdLen);
1536 Directive[IdLen] = 0;
1537 }
1538
1539 if (FirstChar == 'i' && Directive[1] == 'f') {
1540 if ((IdLen == 2) || // "if"
1541 (IdLen == 5 && !strcmp(Directive+2, "def")) || // "ifdef"
1542 (IdLen == 6 && !strcmp(Directive+2, "ndef"))) { // "ifndef"
1543 // We know the entire #if/#ifdef/#ifndef block will be skipped, don't
1544 // bother parsing the condition.
1545 DiscardUntilEndOfDirective();
1546 CurLexer->pushConditionalLevel(Tok.getLocation(), /*wasskipping*/true,
1547 /*foundnonskip*/false,
1548 /*fnddelse*/false);
1549 }
1550 } else if (FirstChar == 'e') {
1551 if (IdLen == 5 && !strcmp(Directive+1, "ndif")) { // "endif"
1552 CheckEndOfDirective("#endif");
1553 PPConditionalInfo CondInfo;
1554 CondInfo.WasSkipping = true; // Silence bogus warning.
1555 bool InCond = CurLexer->popConditionalLevel(CondInfo);
1556 InCond = InCond; // Silence warning in no-asserts mode.
1557 assert(!InCond && "Can't be skipping if not in a conditional!");
1558
1559 // If we popped the outermost skipping block, we're done skipping!
1560 if (!CondInfo.WasSkipping)
1561 break;
1562 } else if (IdLen == 4 && !strcmp(Directive+1, "lse")) { // "else".
1563 // #else directive in a skipping conditional. If not in some other
1564 // skipping conditional, and if #else hasn't already been seen, enter it
1565 // as a non-skipping conditional.
1566 CheckEndOfDirective("#else");
1567 PPConditionalInfo &CondInfo = CurLexer->peekConditionalLevel();
1568
1569 // If this is a #else with a #else before it, report the error.
1570 if (CondInfo.FoundElse) Diag(Tok, diag::pp_err_else_after_else);
1571
1572 // Note that we've seen a #else in this conditional.
1573 CondInfo.FoundElse = true;
1574
1575 // If the conditional is at the top level, and the #if block wasn't
1576 // entered, enter the #else block now.
1577 if (!CondInfo.WasSkipping && !CondInfo.FoundNonSkip) {
1578 CondInfo.FoundNonSkip = true;
1579 break;
1580 }
1581 } else if (IdLen == 4 && !strcmp(Directive+1, "lif")) { // "elif".
1582 PPConditionalInfo &CondInfo = CurLexer->peekConditionalLevel();
1583
1584 bool ShouldEnter;
1585 // If this is in a skipping block or if we're already handled this #if
1586 // block, don't bother parsing the condition.
1587 if (CondInfo.WasSkipping || CondInfo.FoundNonSkip) {
1588 DiscardUntilEndOfDirective();
1589 ShouldEnter = false;
1590 } else {
1591 // Restore the value of LexingRawMode so that identifiers are
1592 // looked up, etc, inside the #elif expression.
1593 assert(CurLexer->LexingRawMode && "We have to be skipping here!");
1594 CurLexer->LexingRawMode = false;
1595 IdentifierInfo *IfNDefMacro = 0;
1596 ShouldEnter = EvaluateDirectiveExpression(IfNDefMacro);
1597 CurLexer->LexingRawMode = true;
1598 }
1599
1600 // If this is a #elif with a #else before it, report the error.
1601 if (CondInfo.FoundElse) Diag(Tok, diag::pp_err_elif_after_else);
1602
1603 // If this condition is true, enter it!
1604 if (ShouldEnter) {
1605 CondInfo.FoundNonSkip = true;
1606 break;
1607 }
1608 }
1609 }
1610
1611 CurLexer->ParsingPreprocessorDirective = false;
1612 // Restore comment saving mode.
1613 CurLexer->KeepCommentMode = KeepComments;
1614 }
1615
1616 // Finally, if we are out of the conditional (saw an #endif or ran off the end
1617 // of the file, just stop skipping and return to lexing whatever came after
1618 // the #if block.
1619 CurLexer->LexingRawMode = false;
1620}
1621
1622//===----------------------------------------------------------------------===//
1623// Preprocessor Directive Handling.
1624//===----------------------------------------------------------------------===//
1625
1626/// HandleDirective - This callback is invoked when the lexer sees a # token
1627/// at the start of a line. This consumes the directive, modifies the
1628/// lexer/preprocessor state, and advances the lexer(s) so that the next token
1629/// read is the correct one.
Chris Lattnerd2177732007-07-20 16:59:19 +00001630void Preprocessor::HandleDirective(Token &Result) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001631 // FIXME: Traditional: # with whitespace before it not recognized by K&R?
1632
1633 // We just parsed a # character at the start of a line, so we're in directive
1634 // mode. Tell the lexer this so any newlines we see will be converted into an
1635 // EOM token (which terminates the directive).
1636 CurLexer->ParsingPreprocessorDirective = true;
1637
1638 ++NumDirectives;
1639
1640 // We are about to read a token. For the multiple-include optimization FA to
1641 // work, we have to remember if we had read any tokens *before* this
1642 // pp-directive.
1643 bool ReadAnyTokensBeforeDirective = CurLexer->MIOpt.getHasReadAnyTokensVal();
1644
1645 // Read the next token, the directive flavor. This isn't expanded due to
1646 // C99 6.10.3p8.
1647 LexUnexpandedToken(Result);
1648
1649 // C99 6.10.3p11: Is this preprocessor directive in macro invocation? e.g.:
1650 // #define A(x) #x
1651 // A(abc
1652 // #warning blah
1653 // def)
1654 // If so, the user is relying on non-portable behavior, emit a diagnostic.
1655 if (InMacroArgs)
1656 Diag(Result, diag::ext_embedded_directive);
1657
1658TryAgain:
1659 switch (Result.getKind()) {
1660 case tok::eom:
1661 return; // null directive.
1662 case tok::comment:
1663 // Handle stuff like "# /*foo*/ define X" in -E -C mode.
1664 LexUnexpandedToken(Result);
1665 goto TryAgain;
1666
1667 case tok::numeric_constant:
1668 // FIXME: implement # 7 line numbers!
1669 DiscardUntilEndOfDirective();
1670 return;
1671 default:
1672 IdentifierInfo *II = Result.getIdentifierInfo();
1673 if (II == 0) break; // Not an identifier.
1674
1675 // Ask what the preprocessor keyword ID is.
1676 switch (II->getPPKeywordID()) {
1677 default: break;
1678 // C99 6.10.1 - Conditional Inclusion.
1679 case tok::pp_if:
1680 return HandleIfDirective(Result, ReadAnyTokensBeforeDirective);
1681 case tok::pp_ifdef:
1682 return HandleIfdefDirective(Result, false, true/*not valid for miopt*/);
1683 case tok::pp_ifndef:
1684 return HandleIfdefDirective(Result, true, ReadAnyTokensBeforeDirective);
1685 case tok::pp_elif:
1686 return HandleElifDirective(Result);
1687 case tok::pp_else:
1688 return HandleElseDirective(Result);
1689 case tok::pp_endif:
1690 return HandleEndifDirective(Result);
1691
1692 // C99 6.10.2 - Source File Inclusion.
1693 case tok::pp_include:
1694 return HandleIncludeDirective(Result); // Handle #include.
1695
1696 // C99 6.10.3 - Macro Replacement.
1697 case tok::pp_define:
1698 return HandleDefineDirective(Result, false);
1699 case tok::pp_undef:
1700 return HandleUndefDirective(Result);
1701
1702 // C99 6.10.4 - Line Control.
1703 case tok::pp_line:
1704 // FIXME: implement #line
1705 DiscardUntilEndOfDirective();
1706 return;
1707
1708 // C99 6.10.5 - Error Directive.
1709 case tok::pp_error:
1710 return HandleUserDiagnosticDirective(Result, false);
1711
1712 // C99 6.10.6 - Pragma Directive.
1713 case tok::pp_pragma:
1714 return HandlePragmaDirective();
1715
1716 // GNU Extensions.
1717 case tok::pp_import:
1718 return HandleImportDirective(Result);
1719 case tok::pp_include_next:
1720 return HandleIncludeNextDirective(Result);
1721
1722 case tok::pp_warning:
1723 Diag(Result, diag::ext_pp_warning_directive);
1724 return HandleUserDiagnosticDirective(Result, true);
1725 case tok::pp_ident:
1726 return HandleIdentSCCSDirective(Result);
1727 case tok::pp_sccs:
1728 return HandleIdentSCCSDirective(Result);
1729 case tok::pp_assert:
1730 //isExtension = true; // FIXME: implement #assert
1731 break;
1732 case tok::pp_unassert:
1733 //isExtension = true; // FIXME: implement #unassert
1734 break;
1735
1736 // clang extensions.
1737 case tok::pp_define_target:
1738 return HandleDefineDirective(Result, true);
1739 case tok::pp_define_other_target:
1740 return HandleDefineOtherTargetDirective(Result);
1741 }
1742 break;
1743 }
1744
1745 // If we reached here, the preprocessing token is not valid!
1746 Diag(Result, diag::err_pp_invalid_directive);
1747
1748 // Read the rest of the PP line.
1749 DiscardUntilEndOfDirective();
1750
1751 // Okay, we're done parsing the directive.
1752}
1753
Chris Lattnerd2177732007-07-20 16:59:19 +00001754void Preprocessor::HandleUserDiagnosticDirective(Token &Tok,
Reid Spencer5f016e22007-07-11 17:01:13 +00001755 bool isWarning) {
1756 // Read the rest of the line raw. We do this because we don't want macros
1757 // to be expanded and we don't require that the tokens be valid preprocessing
1758 // tokens. For example, this is allowed: "#warning ` 'foo". GCC does
1759 // collapse multiple consequtive white space between tokens, but this isn't
1760 // specified by the standard.
1761 std::string Message = CurLexer->ReadToEndOfLine();
1762
1763 unsigned DiagID = isWarning ? diag::pp_hash_warning : diag::err_pp_hash_error;
1764 return Diag(Tok, DiagID, Message);
1765}
1766
1767/// HandleIdentSCCSDirective - Handle a #ident/#sccs directive.
1768///
Chris Lattnerd2177732007-07-20 16:59:19 +00001769void Preprocessor::HandleIdentSCCSDirective(Token &Tok) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001770 // Yes, this directive is an extension.
1771 Diag(Tok, diag::ext_pp_ident_directive);
1772
1773 // Read the string argument.
Chris Lattnerd2177732007-07-20 16:59:19 +00001774 Token StrTok;
Reid Spencer5f016e22007-07-11 17:01:13 +00001775 Lex(StrTok);
1776
1777 // If the token kind isn't a string, it's a malformed directive.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001778 if (StrTok.isNot(tok::string_literal) &&
1779 StrTok.isNot(tok::wide_string_literal))
Reid Spencer5f016e22007-07-11 17:01:13 +00001780 return Diag(StrTok, diag::err_pp_malformed_ident);
1781
1782 // Verify that there is nothing after the string, other than EOM.
1783 CheckEndOfDirective("#ident");
1784
1785 if (Callbacks)
1786 Callbacks->Ident(Tok.getLocation(), getSpelling(StrTok));
1787}
1788
1789//===----------------------------------------------------------------------===//
1790// Preprocessor Include Directive Handling.
1791//===----------------------------------------------------------------------===//
1792
1793/// GetIncludeFilenameSpelling - Turn the specified lexer token into a fully
1794/// checked and spelled filename, e.g. as an operand of #include. This returns
1795/// true if the input filename was in <>'s or false if it were in ""'s. The
1796/// caller is expected to provide a buffer that is large enough to hold the
1797/// spelling of the filename, but is also expected to handle the case when
1798/// this method decides to use a different buffer.
Chris Lattnerf1c99ac2007-07-23 04:15:27 +00001799bool Preprocessor::GetIncludeFilenameSpelling(SourceLocation Loc,
Reid Spencer5f016e22007-07-11 17:01:13 +00001800 const char *&BufStart,
1801 const char *&BufEnd) {
1802 // Get the text form of the filename.
Reid Spencer5f016e22007-07-11 17:01:13 +00001803 assert(BufStart != BufEnd && "Can't have tokens with empty spellings!");
1804
1805 // Make sure the filename is <x> or "x".
1806 bool isAngled;
1807 if (BufStart[0] == '<') {
1808 if (BufEnd[-1] != '>') {
Chris Lattnerf1c99ac2007-07-23 04:15:27 +00001809 Diag(Loc, diag::err_pp_expects_filename);
Reid Spencer5f016e22007-07-11 17:01:13 +00001810 BufStart = 0;
1811 return true;
1812 }
1813 isAngled = true;
1814 } else if (BufStart[0] == '"') {
1815 if (BufEnd[-1] != '"') {
Chris Lattnerf1c99ac2007-07-23 04:15:27 +00001816 Diag(Loc, diag::err_pp_expects_filename);
Reid Spencer5f016e22007-07-11 17:01:13 +00001817 BufStart = 0;
1818 return true;
1819 }
1820 isAngled = false;
1821 } else {
Chris Lattnerf1c99ac2007-07-23 04:15:27 +00001822 Diag(Loc, diag::err_pp_expects_filename);
Reid Spencer5f016e22007-07-11 17:01:13 +00001823 BufStart = 0;
1824 return true;
1825 }
1826
1827 // Diagnose #include "" as invalid.
1828 if (BufEnd-BufStart <= 2) {
Chris Lattnerf1c99ac2007-07-23 04:15:27 +00001829 Diag(Loc, diag::err_pp_empty_filename);
Reid Spencer5f016e22007-07-11 17:01:13 +00001830 BufStart = 0;
1831 return "";
1832 }
1833
1834 // Skip the brackets.
1835 ++BufStart;
1836 --BufEnd;
1837 return isAngled;
1838}
1839
Chris Lattner706ab502007-07-23 04:56:47 +00001840/// ConcatenateIncludeName - Handle cases where the #include name is expanded
1841/// from a macro as multiple tokens, which need to be glued together. This
1842/// occurs for code like:
1843/// #define FOO <a/b.h>
1844/// #include FOO
1845/// because in this case, "<a/b.h>" is returned as 7 tokens, not one.
1846///
1847/// This code concatenates and consumes tokens up to the '>' token. It returns
1848/// false if the > was found, otherwise it returns true if it finds and consumes
1849/// the EOM marker.
1850static bool ConcatenateIncludeName(llvm::SmallVector<char, 128> &FilenameBuffer,
1851 Preprocessor &PP) {
1852 Token CurTok;
1853
1854 PP.Lex(CurTok);
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001855 while (CurTok.isNot(tok::eom)) {
Chris Lattner706ab502007-07-23 04:56:47 +00001856 // Append the spelling of this token to the buffer. If there was a space
1857 // before it, add it now.
1858 if (CurTok.hasLeadingSpace())
1859 FilenameBuffer.push_back(' ');
1860
1861 // Get the spelling of the token, directly into FilenameBuffer if possible.
1862 unsigned PreAppendSize = FilenameBuffer.size();
1863 FilenameBuffer.resize(PreAppendSize+CurTok.getLength());
1864
1865 const char *BufPtr = &FilenameBuffer[PreAppendSize];
1866 unsigned ActualLen = PP.getSpelling(CurTok, BufPtr);
1867
1868 // If the token was spelled somewhere else, copy it into FilenameBuffer.
1869 if (BufPtr != &FilenameBuffer[PreAppendSize])
1870 memcpy(&FilenameBuffer[PreAppendSize], BufPtr, ActualLen);
1871
1872 // Resize FilenameBuffer to the correct size.
1873 if (CurTok.getLength() != ActualLen)
1874 FilenameBuffer.resize(PreAppendSize+ActualLen);
1875
1876 // If we found the '>' marker, return success.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00001877 if (CurTok.is(tok::greater))
Chris Lattner706ab502007-07-23 04:56:47 +00001878 return false;
1879
1880 PP.Lex(CurTok);
1881 }
1882
1883 // If we hit the eom marker, emit an error and return true so that the caller
1884 // knows the EOM has been read.
1885 PP.Diag(CurTok.getLocation(), diag::err_pp_expects_filename);
1886 return true;
1887}
1888
Reid Spencer5f016e22007-07-11 17:01:13 +00001889/// HandleIncludeDirective - The "#include" tokens have just been read, read the
1890/// file to be included from the lexer, then include it! This is a common
1891/// routine with functionality shared between #include, #include_next and
1892/// #import.
Chris Lattnerd2177732007-07-20 16:59:19 +00001893void Preprocessor::HandleIncludeDirective(Token &IncludeTok,
Reid Spencer5f016e22007-07-11 17:01:13 +00001894 const DirectoryLookup *LookupFrom,
1895 bool isImport) {
1896
Chris Lattnerd2177732007-07-20 16:59:19 +00001897 Token FilenameTok;
Reid Spencer5f016e22007-07-11 17:01:13 +00001898 CurLexer->LexIncludeFilename(FilenameTok);
1899
Reid Spencer5f016e22007-07-11 17:01:13 +00001900 // Reserve a buffer to get the spelling.
1901 llvm::SmallVector<char, 128> FilenameBuffer;
Chris Lattner706ab502007-07-23 04:56:47 +00001902 const char *FilenameStart, *FilenameEnd;
1903
1904 switch (FilenameTok.getKind()) {
1905 case tok::eom:
1906 // If the token kind is EOM, the error has already been diagnosed.
1907 return;
Reid Spencer5f016e22007-07-11 17:01:13 +00001908
Chris Lattner706ab502007-07-23 04:56:47 +00001909 case tok::angle_string_literal:
Chris Lattnerf11ccfc2007-07-23 22:23:52 +00001910 case tok::string_literal: {
Chris Lattner706ab502007-07-23 04:56:47 +00001911 FilenameBuffer.resize(FilenameTok.getLength());
1912 FilenameStart = &FilenameBuffer[0];
1913 unsigned Len = getSpelling(FilenameTok, FilenameStart);
1914 FilenameEnd = FilenameStart+Len;
1915 break;
Chris Lattnerf11ccfc2007-07-23 22:23:52 +00001916 }
Chris Lattner706ab502007-07-23 04:56:47 +00001917
1918 case tok::less:
1919 // This could be a <foo/bar.h> file coming from a macro expansion. In this
1920 // case, glue the tokens together into FilenameBuffer and interpret those.
1921 FilenameBuffer.push_back('<');
1922 if (ConcatenateIncludeName(FilenameBuffer, *this))
1923 return; // Found <eom> but no ">"? Diagnostic already emitted.
1924 FilenameStart = &FilenameBuffer[0];
1925 FilenameEnd = &FilenameBuffer[FilenameBuffer.size()];
1926 break;
1927 default:
1928 Diag(FilenameTok.getLocation(), diag::err_pp_expects_filename);
1929 DiscardUntilEndOfDirective();
1930 return;
1931 }
1932
Chris Lattnerf1c99ac2007-07-23 04:15:27 +00001933 bool isAngled = GetIncludeFilenameSpelling(FilenameTok.getLocation(),
Reid Spencer5f016e22007-07-11 17:01:13 +00001934 FilenameStart, FilenameEnd);
1935 // If GetIncludeFilenameSpelling set the start ptr to null, there was an
1936 // error.
Chris Lattner706ab502007-07-23 04:56:47 +00001937 if (FilenameStart == 0) {
1938 DiscardUntilEndOfDirective();
Reid Spencer5f016e22007-07-11 17:01:13 +00001939 return;
Chris Lattner706ab502007-07-23 04:56:47 +00001940 }
Reid Spencer5f016e22007-07-11 17:01:13 +00001941
1942 // Verify that there is nothing after the filename, other than EOM. Use the
1943 // preprocessor to lex this in case lexing the filename entered a macro.
1944 CheckEndOfDirective("#include");
1945
1946 // Check that we don't have infinite #include recursion.
1947 if (IncludeMacroStack.size() == MaxAllowedIncludeStackDepth-1)
1948 return Diag(FilenameTok, diag::err_pp_include_too_deep);
1949
1950 // Search include directories.
1951 const DirectoryLookup *CurDir;
1952 const FileEntry *File = LookupFile(FilenameStart, FilenameEnd,
1953 isAngled, LookupFrom, CurDir);
1954 if (File == 0)
1955 return Diag(FilenameTok, diag::err_pp_file_not_found,
1956 std::string(FilenameStart, FilenameEnd));
1957
1958 // Ask HeaderInfo if we should enter this #include file.
1959 if (!HeaderInfo.ShouldEnterIncludeFile(File, isImport)) {
1960 // If it returns true, #including this file will have no effect.
1961 return;
1962 }
1963
1964 // Look up the file, create a File ID for it.
1965 unsigned FileID = SourceMgr.createFileID(File, FilenameTok.getLocation());
1966 if (FileID == 0)
1967 return Diag(FilenameTok, diag::err_pp_file_not_found,
1968 std::string(FilenameStart, FilenameEnd));
1969
1970 // Finally, if all is good, enter the new file!
1971 EnterSourceFile(FileID, CurDir);
1972}
1973
1974/// HandleIncludeNextDirective - Implements #include_next.
1975///
Chris Lattnerd2177732007-07-20 16:59:19 +00001976void Preprocessor::HandleIncludeNextDirective(Token &IncludeNextTok) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001977 Diag(IncludeNextTok, diag::ext_pp_include_next_directive);
1978
1979 // #include_next is like #include, except that we start searching after
1980 // the current found directory. If we can't do this, issue a
1981 // diagnostic.
1982 const DirectoryLookup *Lookup = CurDirLookup;
1983 if (isInPrimaryFile()) {
1984 Lookup = 0;
1985 Diag(IncludeNextTok, diag::pp_include_next_in_primary);
1986 } else if (Lookup == 0) {
1987 Diag(IncludeNextTok, diag::pp_include_next_absolute_path);
1988 } else {
1989 // Start looking up in the next directory.
1990 ++Lookup;
1991 }
1992
1993 return HandleIncludeDirective(IncludeNextTok, Lookup);
1994}
1995
1996/// HandleImportDirective - Implements #import.
1997///
Chris Lattnerd2177732007-07-20 16:59:19 +00001998void Preprocessor::HandleImportDirective(Token &ImportTok) {
Reid Spencer5f016e22007-07-11 17:01:13 +00001999 Diag(ImportTok, diag::ext_pp_import_directive);
2000
2001 return HandleIncludeDirective(ImportTok, 0, true);
2002}
2003
2004//===----------------------------------------------------------------------===//
2005// Preprocessor Macro Directive Handling.
2006//===----------------------------------------------------------------------===//
2007
2008/// ReadMacroDefinitionArgList - The ( starting an argument list of a macro
2009/// definition has just been read. Lex the rest of the arguments and the
2010/// closing ), updating MI with what we learn. Return true if an error occurs
2011/// parsing the arg list.
2012bool Preprocessor::ReadMacroDefinitionArgList(MacroInfo *MI) {
Chris Lattner25c96482007-07-14 22:46:43 +00002013 llvm::SmallVector<IdentifierInfo*, 32> Arguments;
2014
Chris Lattnerd2177732007-07-20 16:59:19 +00002015 Token Tok;
Reid Spencer5f016e22007-07-11 17:01:13 +00002016 while (1) {
2017 LexUnexpandedToken(Tok);
2018 switch (Tok.getKind()) {
2019 case tok::r_paren:
2020 // Found the end of the argument list.
Chris Lattner25c96482007-07-14 22:46:43 +00002021 if (Arguments.empty()) { // #define FOO()
2022 MI->setArgumentList(Arguments.begin(), Arguments.end());
2023 return false;
2024 }
Reid Spencer5f016e22007-07-11 17:01:13 +00002025 // Otherwise we have #define FOO(A,)
2026 Diag(Tok, diag::err_pp_expected_ident_in_arg_list);
2027 return true;
2028 case tok::ellipsis: // #define X(... -> C99 varargs
2029 // Warn if use of C99 feature in non-C99 mode.
2030 if (!Features.C99) Diag(Tok, diag::ext_variadic_macro);
2031
2032 // Lex the token after the identifier.
2033 LexUnexpandedToken(Tok);
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002034 if (Tok.isNot(tok::r_paren)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002035 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2036 return true;
2037 }
2038 // Add the __VA_ARGS__ identifier as an argument.
Chris Lattner25c96482007-07-14 22:46:43 +00002039 Arguments.push_back(Ident__VA_ARGS__);
Reid Spencer5f016e22007-07-11 17:01:13 +00002040 MI->setIsC99Varargs();
Chris Lattner25c96482007-07-14 22:46:43 +00002041 MI->setArgumentList(Arguments.begin(), Arguments.end());
Reid Spencer5f016e22007-07-11 17:01:13 +00002042 return false;
2043 case tok::eom: // #define X(
2044 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2045 return true;
2046 default:
2047 // Handle keywords and identifiers here to accept things like
2048 // #define Foo(for) for.
2049 IdentifierInfo *II = Tok.getIdentifierInfo();
2050 if (II == 0) {
2051 // #define X(1
2052 Diag(Tok, diag::err_pp_invalid_tok_in_arg_list);
2053 return true;
2054 }
2055
2056 // If this is already used as an argument, it is used multiple times (e.g.
2057 // #define X(A,A.
Chris Lattner25c96482007-07-14 22:46:43 +00002058 if (std::find(Arguments.begin(), Arguments.end(), II) !=
2059 Arguments.end()) { // C99 6.10.3p6
Reid Spencer5f016e22007-07-11 17:01:13 +00002060 Diag(Tok, diag::err_pp_duplicate_name_in_arg_list, II->getName());
2061 return true;
2062 }
2063
2064 // Add the argument to the macro info.
Chris Lattner25c96482007-07-14 22:46:43 +00002065 Arguments.push_back(II);
Reid Spencer5f016e22007-07-11 17:01:13 +00002066
2067 // Lex the token after the identifier.
2068 LexUnexpandedToken(Tok);
2069
2070 switch (Tok.getKind()) {
2071 default: // #define X(A B
2072 Diag(Tok, diag::err_pp_expected_comma_in_arg_list);
2073 return true;
2074 case tok::r_paren: // #define X(A)
Chris Lattner25c96482007-07-14 22:46:43 +00002075 MI->setArgumentList(Arguments.begin(), Arguments.end());
Reid Spencer5f016e22007-07-11 17:01:13 +00002076 return false;
2077 case tok::comma: // #define X(A,
2078 break;
2079 case tok::ellipsis: // #define X(A... -> GCC extension
2080 // Diagnose extension.
2081 Diag(Tok, diag::ext_named_variadic_macro);
2082
2083 // Lex the token after the identifier.
2084 LexUnexpandedToken(Tok);
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002085 if (Tok.isNot(tok::r_paren)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002086 Diag(Tok, diag::err_pp_missing_rparen_in_macro_def);
2087 return true;
2088 }
2089
2090 MI->setIsGNUVarargs();
Chris Lattner25c96482007-07-14 22:46:43 +00002091 MI->setArgumentList(Arguments.begin(), Arguments.end());
Reid Spencer5f016e22007-07-11 17:01:13 +00002092 return false;
2093 }
2094 }
2095 }
2096}
2097
2098/// HandleDefineDirective - Implements #define. This consumes the entire macro
2099/// line then lets the caller lex the next real token. If 'isTargetSpecific' is
2100/// true, then this is a "#define_target", otherwise this is a "#define".
2101///
Chris Lattnerd2177732007-07-20 16:59:19 +00002102void Preprocessor::HandleDefineDirective(Token &DefineTok,
Reid Spencer5f016e22007-07-11 17:01:13 +00002103 bool isTargetSpecific) {
2104 ++NumDefined;
2105
Chris Lattnerd2177732007-07-20 16:59:19 +00002106 Token MacroNameTok;
Reid Spencer5f016e22007-07-11 17:01:13 +00002107 ReadMacroName(MacroNameTok, 1);
2108
2109 // Error reading macro name? If so, diagnostic already issued.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002110 if (MacroNameTok.is(tok::eom))
Reid Spencer5f016e22007-07-11 17:01:13 +00002111 return;
Chris Lattnerc215bd62007-07-14 22:11:41 +00002112
Reid Spencer5f016e22007-07-11 17:01:13 +00002113 // If we are supposed to keep comments in #defines, reenable comment saving
2114 // mode.
2115 CurLexer->KeepCommentMode = KeepMacroComments;
2116
2117 // Create the new macro.
2118 MacroInfo *MI = new MacroInfo(MacroNameTok.getLocation());
2119 if (isTargetSpecific) MI->setIsTargetSpecific();
2120
2121 // If the identifier is an 'other target' macro, clear this bit.
2122 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro(false);
2123
2124
Chris Lattnerd2177732007-07-20 16:59:19 +00002125 Token Tok;
Reid Spencer5f016e22007-07-11 17:01:13 +00002126 LexUnexpandedToken(Tok);
2127
2128 // If this is a function-like macro definition, parse the argument list,
2129 // marking each of the identifiers as being used as macro arguments. Also,
2130 // check other constraints on the first token of the macro body.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002131 if (Tok.is(tok::eom)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002132 // If there is no body to this macro, we have no special handling here.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002133 } else if (Tok.is(tok::l_paren) && !Tok.hasLeadingSpace()) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002134 // This is a function-like macro definition. Read the argument list.
2135 MI->setIsFunctionLike();
2136 if (ReadMacroDefinitionArgList(MI)) {
2137 // Forget about MI.
2138 delete MI;
2139 // Throw away the rest of the line.
2140 if (CurLexer->ParsingPreprocessorDirective)
2141 DiscardUntilEndOfDirective();
2142 return;
2143 }
2144
2145 // Read the first token after the arg list for down below.
2146 LexUnexpandedToken(Tok);
2147 } else if (!Tok.hasLeadingSpace()) {
2148 // C99 requires whitespace between the macro definition and the body. Emit
2149 // a diagnostic for something like "#define X+".
2150 if (Features.C99) {
2151 Diag(Tok, diag::ext_c99_whitespace_required_after_macro_name);
2152 } else {
2153 // FIXME: C90/C++ do not get this diagnostic, but it does get a similar
2154 // one in some cases!
2155 }
2156 } else {
2157 // This is a normal token with leading space. Clear the leading space
2158 // marker on the first token to get proper expansion.
Chris Lattnerd2177732007-07-20 16:59:19 +00002159 Tok.clearFlag(Token::LeadingSpace);
Reid Spencer5f016e22007-07-11 17:01:13 +00002160 }
2161
2162 // If this is a definition of a variadic C99 function-like macro, not using
2163 // the GNU named varargs extension, enabled __VA_ARGS__.
2164
2165 // "Poison" __VA_ARGS__, which can only appear in the expansion of a macro.
2166 // This gets unpoisoned where it is allowed.
2167 assert(Ident__VA_ARGS__->isPoisoned() && "__VA_ARGS__ should be poisoned!");
2168 if (MI->isC99Varargs())
2169 Ident__VA_ARGS__->setIsPoisoned(false);
2170
2171 // Read the rest of the macro body.
Chris Lattnerb5e240f2007-07-14 21:54:03 +00002172 if (MI->isObjectLike()) {
2173 // Object-like macros are very simple, just read their body.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002174 while (Tok.isNot(tok::eom)) {
Chris Lattnerb5e240f2007-07-14 21:54:03 +00002175 MI->AddTokenToBody(Tok);
Reid Spencer5f016e22007-07-11 17:01:13 +00002176 // Get the next token of the macro.
2177 LexUnexpandedToken(Tok);
Reid Spencer5f016e22007-07-11 17:01:13 +00002178 }
2179
Chris Lattnerb5e240f2007-07-14 21:54:03 +00002180 } else {
2181 // Otherwise, read the body of a function-like macro. This has to validate
2182 // the # (stringize) operator.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002183 while (Tok.isNot(tok::eom)) {
Chris Lattnerb5e240f2007-07-14 21:54:03 +00002184 MI->AddTokenToBody(Tok);
Reid Spencer5f016e22007-07-11 17:01:13 +00002185
Chris Lattnerb5e240f2007-07-14 21:54:03 +00002186 // Check C99 6.10.3.2p1: ensure that # operators are followed by macro
2187 // parameters in function-like macro expansions.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002188 if (Tok.isNot(tok::hash)) {
Chris Lattnerb5e240f2007-07-14 21:54:03 +00002189 // Get the next token of the macro.
2190 LexUnexpandedToken(Tok);
2191 continue;
2192 }
2193
2194 // Get the next token of the macro.
2195 LexUnexpandedToken(Tok);
2196
2197 // Not a macro arg identifier?
2198 if (!Tok.getIdentifierInfo() ||
2199 MI->getArgumentNum(Tok.getIdentifierInfo()) == -1) {
2200 Diag(Tok, diag::err_pp_stringize_not_parameter);
2201 delete MI;
2202
2203 // Disable __VA_ARGS__ again.
2204 Ident__VA_ARGS__->setIsPoisoned(true);
2205 return;
2206 }
2207
2208 // Things look ok, add the param name token to the macro.
2209 MI->AddTokenToBody(Tok);
2210
2211 // Get the next token of the macro.
2212 LexUnexpandedToken(Tok);
2213 }
Reid Spencer5f016e22007-07-11 17:01:13 +00002214 }
2215
Chris Lattnerc215bd62007-07-14 22:11:41 +00002216
Reid Spencer5f016e22007-07-11 17:01:13 +00002217 // Disable __VA_ARGS__ again.
2218 Ident__VA_ARGS__->setIsPoisoned(true);
2219
2220 // Check that there is no paste (##) operator at the begining or end of the
2221 // replacement list.
2222 unsigned NumTokens = MI->getNumTokens();
2223 if (NumTokens != 0) {
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002224 if (MI->getReplacementToken(0).is(tok::hashhash)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002225 Diag(MI->getReplacementToken(0), diag::err_paste_at_start);
2226 delete MI;
2227 return;
2228 }
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002229 if (MI->getReplacementToken(NumTokens-1).is(tok::hashhash)) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002230 Diag(MI->getReplacementToken(NumTokens-1), diag::err_paste_at_end);
2231 delete MI;
2232 return;
2233 }
2234 }
2235
2236 // If this is the primary source file, remember that this macro hasn't been
2237 // used yet.
2238 if (isInPrimaryFile())
2239 MI->setIsUsed(false);
2240
2241 // Finally, if this identifier already had a macro defined for it, verify that
2242 // the macro bodies are identical and free the old definition.
Chris Lattnercc1a8752007-10-07 08:44:20 +00002243 if (MacroInfo *OtherMI = getMacroInfo(MacroNameTok.getIdentifierInfo())) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002244 if (!OtherMI->isUsed())
2245 Diag(OtherMI->getDefinitionLoc(), diag::pp_macro_not_used);
2246
2247 // Macros must be identical. This means all tokes and whitespace separation
2248 // must be the same. C99 6.10.3.2.
2249 if (!MI->isIdenticalTo(*OtherMI, *this)) {
2250 Diag(MI->getDefinitionLoc(), diag::ext_pp_macro_redef,
2251 MacroNameTok.getIdentifierInfo()->getName());
2252 Diag(OtherMI->getDefinitionLoc(), diag::ext_pp_macro_redef2);
2253 }
2254 delete OtherMI;
2255 }
2256
Chris Lattnercc1a8752007-10-07 08:44:20 +00002257 setMacroInfo(MacroNameTok.getIdentifierInfo(), MI);
Reid Spencer5f016e22007-07-11 17:01:13 +00002258}
2259
2260/// HandleDefineOtherTargetDirective - Implements #define_other_target.
Chris Lattnerd2177732007-07-20 16:59:19 +00002261void Preprocessor::HandleDefineOtherTargetDirective(Token &Tok) {
2262 Token MacroNameTok;
Reid Spencer5f016e22007-07-11 17:01:13 +00002263 ReadMacroName(MacroNameTok, 1);
2264
2265 // Error reading macro name? If so, diagnostic already issued.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002266 if (MacroNameTok.is(tok::eom))
Reid Spencer5f016e22007-07-11 17:01:13 +00002267 return;
2268
2269 // Check to see if this is the last token on the #undef line.
2270 CheckEndOfDirective("#define_other_target");
2271
2272 // If there is already a macro defined by this name, turn it into a
2273 // target-specific define.
Chris Lattnercc1a8752007-10-07 08:44:20 +00002274 if (MacroInfo *MI = getMacroInfo(MacroNameTok.getIdentifierInfo())) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002275 MI->setIsTargetSpecific(true);
2276 return;
2277 }
2278
2279 // Mark the identifier as being a macro on some other target.
2280 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro();
2281}
2282
2283
2284/// HandleUndefDirective - Implements #undef.
2285///
Chris Lattnerd2177732007-07-20 16:59:19 +00002286void Preprocessor::HandleUndefDirective(Token &UndefTok) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002287 ++NumUndefined;
2288
Chris Lattnerd2177732007-07-20 16:59:19 +00002289 Token MacroNameTok;
Reid Spencer5f016e22007-07-11 17:01:13 +00002290 ReadMacroName(MacroNameTok, 2);
2291
2292 // Error reading macro name? If so, diagnostic already issued.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002293 if (MacroNameTok.is(tok::eom))
Reid Spencer5f016e22007-07-11 17:01:13 +00002294 return;
2295
2296 // Check to see if this is the last token on the #undef line.
2297 CheckEndOfDirective("#undef");
2298
2299 // Okay, we finally have a valid identifier to undef.
Chris Lattnercc1a8752007-10-07 08:44:20 +00002300 MacroInfo *MI = getMacroInfo(MacroNameTok.getIdentifierInfo());
Reid Spencer5f016e22007-07-11 17:01:13 +00002301
2302 // #undef untaints an identifier if it were marked by define_other_target.
2303 MacroNameTok.getIdentifierInfo()->setIsOtherTargetMacro(false);
2304
2305 // If the macro is not defined, this is a noop undef, just return.
2306 if (MI == 0) return;
2307
2308 if (!MI->isUsed())
2309 Diag(MI->getDefinitionLoc(), diag::pp_macro_not_used);
2310
2311 // Free macro definition.
2312 delete MI;
Chris Lattnercc1a8752007-10-07 08:44:20 +00002313 setMacroInfo(MacroNameTok.getIdentifierInfo(), 0);
Reid Spencer5f016e22007-07-11 17:01:13 +00002314}
2315
2316
2317//===----------------------------------------------------------------------===//
2318// Preprocessor Conditional Directive Handling.
2319//===----------------------------------------------------------------------===//
2320
2321/// HandleIfdefDirective - Implements the #ifdef/#ifndef directive. isIfndef is
2322/// true when this is a #ifndef directive. ReadAnyTokensBeforeDirective is true
2323/// if any tokens have been returned or pp-directives activated before this
2324/// #ifndef has been lexed.
2325///
Chris Lattnerd2177732007-07-20 16:59:19 +00002326void Preprocessor::HandleIfdefDirective(Token &Result, bool isIfndef,
Reid Spencer5f016e22007-07-11 17:01:13 +00002327 bool ReadAnyTokensBeforeDirective) {
2328 ++NumIf;
Chris Lattnerd2177732007-07-20 16:59:19 +00002329 Token DirectiveTok = Result;
Reid Spencer5f016e22007-07-11 17:01:13 +00002330
Chris Lattnerd2177732007-07-20 16:59:19 +00002331 Token MacroNameTok;
Reid Spencer5f016e22007-07-11 17:01:13 +00002332 ReadMacroName(MacroNameTok);
2333
2334 // Error reading macro name? If so, diagnostic already issued.
Chris Lattner22f6bbc2007-10-09 18:02:16 +00002335 if (MacroNameTok.is(tok::eom)) {
Chris Lattnerf37bb252007-09-24 05:14:57 +00002336 // Skip code until we get to #endif. This helps with recovery by not
2337 // emitting an error when the #endif is reached.
2338 SkipExcludedConditionalBlock(DirectiveTok.getLocation(),
2339 /*Foundnonskip*/false, /*FoundElse*/false);
Reid Spencer5f016e22007-07-11 17:01:13 +00002340 return;
Chris Lattnerf37bb252007-09-24 05:14:57 +00002341 }
Reid Spencer5f016e22007-07-11 17:01:13 +00002342
2343 // Check to see if this is the last token on the #if[n]def line.
2344 CheckEndOfDirective(isIfndef ? "#ifndef" : "#ifdef");
2345
2346 // If the start of a top-level #ifdef, inform MIOpt.
2347 if (!ReadAnyTokensBeforeDirective &&
2348 CurLexer->getConditionalStackDepth() == 0) {
2349 assert(isIfndef && "#ifdef shouldn't reach here");
2350 CurLexer->MIOpt.EnterTopLevelIFNDEF(MacroNameTok.getIdentifierInfo());
2351 }
2352
2353 IdentifierInfo *MII = MacroNameTok.getIdentifierInfo();
Chris Lattnercc1a8752007-10-07 08:44:20 +00002354 MacroInfo *MI = getMacroInfo(MII);
Reid Spencer5f016e22007-07-11 17:01:13 +00002355
2356 // If there is a macro, process it.
2357 if (MI) {
2358 // Mark it used.
2359 MI->setIsUsed(true);
2360
2361 // If this is the first use of a target-specific macro, warn about it.
2362 if (MI->isTargetSpecific()) {
2363 MI->setIsTargetSpecific(false); // Don't warn on second use.
Ted Kremenek9c728dc2007-12-12 22:39:36 +00002364 getTargetInfo().DiagnoseNonPortability(
2365 getFullLoc(MacroNameTok.getLocation()),
2366 diag::port_target_macro_use);
Reid Spencer5f016e22007-07-11 17:01:13 +00002367 }
2368 } else {
2369 // Use of a target-specific macro for some other target? If so, warn.
2370 if (MII->isOtherTargetMacro()) {
2371 MII->setIsOtherTargetMacro(false); // Don't warn on second use.
Ted Kremenek9c728dc2007-12-12 22:39:36 +00002372 getTargetInfo().DiagnoseNonPortability(
2373 getFullLoc(MacroNameTok.getLocation()),
2374 diag::port_target_macro_use);
Reid Spencer5f016e22007-07-11 17:01:13 +00002375 }
2376 }
2377
2378 // Should we include the stuff contained by this directive?
2379 if (!MI == isIfndef) {
2380 // Yes, remember that we are inside a conditional, then lex the next token.
2381 CurLexer->pushConditionalLevel(DirectiveTok.getLocation(), /*wasskip*/false,
2382 /*foundnonskip*/true, /*foundelse*/false);
2383 } else {
2384 // No, skip the contents of this block and return the first token after it.
2385 SkipExcludedConditionalBlock(DirectiveTok.getLocation(),
2386 /*Foundnonskip*/false,
2387 /*FoundElse*/false);
2388 }
2389}
2390
2391/// HandleIfDirective - Implements the #if directive.
2392///
Chris Lattnerd2177732007-07-20 16:59:19 +00002393void Preprocessor::HandleIfDirective(Token &IfToken,
Reid Spencer5f016e22007-07-11 17:01:13 +00002394 bool ReadAnyTokensBeforeDirective) {
2395 ++NumIf;
2396
2397 // Parse and evaluation the conditional expression.
2398 IdentifierInfo *IfNDefMacro = 0;
2399 bool ConditionalTrue = EvaluateDirectiveExpression(IfNDefMacro);
2400
2401 // Should we include the stuff contained by this directive?
2402 if (ConditionalTrue) {
2403 // If this condition is equivalent to #ifndef X, and if this is the first
2404 // directive seen, handle it for the multiple-include optimization.
2405 if (!ReadAnyTokensBeforeDirective &&
2406 CurLexer->getConditionalStackDepth() == 0 && IfNDefMacro)
2407 CurLexer->MIOpt.EnterTopLevelIFNDEF(IfNDefMacro);
2408
2409 // Yes, remember that we are inside a conditional, then lex the next token.
2410 CurLexer->pushConditionalLevel(IfToken.getLocation(), /*wasskip*/false,
2411 /*foundnonskip*/true, /*foundelse*/false);
2412 } else {
2413 // No, skip the contents of this block and return the first token after it.
2414 SkipExcludedConditionalBlock(IfToken.getLocation(), /*Foundnonskip*/false,
2415 /*FoundElse*/false);
2416 }
2417}
2418
2419/// HandleEndifDirective - Implements the #endif directive.
2420///
Chris Lattnerd2177732007-07-20 16:59:19 +00002421void Preprocessor::HandleEndifDirective(Token &EndifToken) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002422 ++NumEndif;
2423
2424 // Check that this is the whole directive.
2425 CheckEndOfDirective("#endif");
2426
2427 PPConditionalInfo CondInfo;
2428 if (CurLexer->popConditionalLevel(CondInfo)) {
2429 // No conditionals on the stack: this is an #endif without an #if.
2430 return Diag(EndifToken, diag::err_pp_endif_without_if);
2431 }
2432
2433 // If this the end of a top-level #endif, inform MIOpt.
2434 if (CurLexer->getConditionalStackDepth() == 0)
2435 CurLexer->MIOpt.ExitTopLevelConditional();
2436
2437 assert(!CondInfo.WasSkipping && !CurLexer->LexingRawMode &&
2438 "This code should only be reachable in the non-skipping case!");
2439}
2440
2441
Chris Lattnerd2177732007-07-20 16:59:19 +00002442void Preprocessor::HandleElseDirective(Token &Result) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002443 ++NumElse;
2444
2445 // #else directive in a non-skipping conditional... start skipping.
2446 CheckEndOfDirective("#else");
2447
2448 PPConditionalInfo CI;
2449 if (CurLexer->popConditionalLevel(CI))
2450 return Diag(Result, diag::pp_err_else_without_if);
2451
2452 // If this is a top-level #else, inform the MIOpt.
2453 if (CurLexer->getConditionalStackDepth() == 0)
2454 CurLexer->MIOpt.FoundTopLevelElse();
2455
2456 // If this is a #else with a #else before it, report the error.
2457 if (CI.FoundElse) Diag(Result, diag::pp_err_else_after_else);
2458
2459 // Finally, skip the rest of the contents of this block and return the first
2460 // token after it.
2461 return SkipExcludedConditionalBlock(CI.IfLoc, /*Foundnonskip*/true,
2462 /*FoundElse*/true);
2463}
2464
Chris Lattnerd2177732007-07-20 16:59:19 +00002465void Preprocessor::HandleElifDirective(Token &ElifToken) {
Reid Spencer5f016e22007-07-11 17:01:13 +00002466 ++NumElse;
2467
2468 // #elif directive in a non-skipping conditional... start skipping.
2469 // We don't care what the condition is, because we will always skip it (since
2470 // the block immediately before it was included).
2471 DiscardUntilEndOfDirective();
2472
2473 PPConditionalInfo CI;
2474 if (CurLexer->popConditionalLevel(CI))
2475 return Diag(ElifToken, diag::pp_err_elif_without_if);
2476
2477 // If this is a top-level #elif, inform the MIOpt.
2478 if (CurLexer->getConditionalStackDepth() == 0)
2479 CurLexer->MIOpt.FoundTopLevelElse();
2480
2481 // If this is a #elif with a #else before it, report the error.
2482 if (CI.FoundElse) Diag(ElifToken, diag::pp_err_elif_after_else);
2483
2484 // Finally, skip the rest of the contents of this block and return the first
2485 // token after it.
2486 return SkipExcludedConditionalBlock(CI.IfLoc, /*Foundnonskip*/true,
2487 /*FoundElse*/CI.FoundElse);
2488}
2489