blob: 1a210ce172b069751bf455e52246f82e737421ff [file] [log] [blame]
Chris Lattnereb8a28f2006-08-10 18:43:39 +00001//===--- Parser.cpp - C Language Family Parser ----------------------------===//
Chris Lattner0bb5f832006-07-31 01:59:18 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the Parser interfaces.
11//
12//===----------------------------------------------------------------------===//
13
14#include "clang/Parse/Parser.h"
Chris Lattnerb9093cd2006-08-04 04:39:53 +000015#include "clang/Parse/Declarations.h"
Chris Lattner971c6b62006-08-05 22:46:42 +000016#include "clang/Parse/Scope.h"
Chris Lattner0bb5f832006-07-31 01:59:18 +000017using namespace llvm;
18using namespace clang;
19
Chris Lattner685ed1e2006-08-14 00:22:04 +000020Parser::Parser(Preprocessor &pp, Action &actions)
Chris Lattner971c6b62006-08-05 22:46:42 +000021 : PP(pp), Actions(actions), Diags(PP.getDiagnostics()) {
Chris Lattneracd58a32006-08-06 17:24:14 +000022 Tok.SetKind(tok::eof);
Chris Lattnere4e38592006-08-14 00:15:05 +000023 CurScope = 0;
Chris Lattnereec40f92006-08-06 21:55:29 +000024
25 ParenCount = BracketCount = BraceCount = 0;
Chris Lattner971c6b62006-08-05 22:46:42 +000026}
27
28Parser::~Parser() {
Chris Lattnere4e38592006-08-14 00:15:05 +000029 // If we still have scopes active, delete the scope tree.
Chris Lattner971c6b62006-08-05 22:46:42 +000030 delete CurScope;
31}
32
Chris Lattner685ed1e2006-08-14 00:22:04 +000033/// Out-of-line virtual destructor to provide home for Action class.
34Action::~Action() {}
Chris Lattnere4e38592006-08-14 00:15:05 +000035
Chris Lattner0bb5f832006-07-31 01:59:18 +000036
Chris Lattnerb9093cd2006-08-04 04:39:53 +000037void Parser::Diag(SourceLocation Loc, unsigned DiagID,
Chris Lattner0bb5f832006-07-31 01:59:18 +000038 const std::string &Msg) {
Chris Lattnerb9093cd2006-08-04 04:39:53 +000039 Diags.Report(Loc, DiagID, Msg);
Chris Lattner0bb5f832006-07-31 01:59:18 +000040}
41
Chris Lattner4564bc12006-08-10 23:14:52 +000042/// MatchRHSPunctuation - For punctuation with a LHS and RHS (e.g. '['/']'),
43/// this helper function matches and consumes the specified RHS token if
44/// present. If not present, it emits the specified diagnostic indicating
45/// that the parser failed to match the RHS of the token at LHSLoc. LHSName
46/// should be the name of the unmatched LHS token.
Chris Lattner04f80192006-08-15 04:55:54 +000047void Parser::MatchRHSPunctuation(tok::TokenKind RHSTok, SourceLocation LHSLoc) {
Chris Lattner4564bc12006-08-10 23:14:52 +000048
49 if (Tok.getKind() == RHSTok) {
Chris Lattnerdbb2a462006-08-12 19:26:13 +000050 ConsumeAnyToken();
Chris Lattner4564bc12006-08-10 23:14:52 +000051 } else {
Chris Lattner04f80192006-08-15 04:55:54 +000052 const char *LHSName = "unknown";
53 diag::kind DID = diag::err_parse_error;
54 switch (RHSTok) {
55 default: break;
56 case tok::r_paren : LHSName = "("; DID = diag::err_expected_rparen; break;
57 case tok::r_brace : LHSName = "{"; DID = diag::err_expected_rbrace; break;
58 case tok::r_square: LHSName = "["; DID = diag::err_expected_rsquare; break;
59 }
60 Diag(Tok, DID);
Chris Lattner4564bc12006-08-10 23:14:52 +000061 Diag(LHSLoc, diag::err_matching, LHSName);
62 SkipUntil(RHSTok);
63 }
64}
65
Chris Lattnerdbb2a462006-08-12 19:26:13 +000066/// ExpectAndConsume - The parser expects that 'ExpectedTok' is next in the
67/// input. If so, it is consumed and false is returned.
68///
69/// If the input is malformed, this emits the specified diagnostic. Next, if
70/// SkipToTok is specified, it calls SkipUntil(SkipToTok). Finally, true is
71/// returned.
72bool Parser::ExpectAndConsume(tok::TokenKind ExpectedTok, unsigned DiagID,
Chris Lattner6d7e6342006-08-15 03:41:14 +000073 const char *Msg, tok::TokenKind SkipToTok) {
Chris Lattnerdbb2a462006-08-12 19:26:13 +000074 if (Tok.getKind() == ExpectedTok) {
Chris Lattner15a00da2006-08-15 04:10:31 +000075 ConsumeAnyToken();
Chris Lattnerdbb2a462006-08-12 19:26:13 +000076 return false;
77 }
78
Chris Lattner6d7e6342006-08-15 03:41:14 +000079 Diag(Tok, DiagID, Msg);
Chris Lattnerdbb2a462006-08-12 19:26:13 +000080 if (SkipToTok != tok::unknown)
81 SkipUntil(SkipToTok);
82 return true;
83}
84
Chris Lattner70f32b72006-07-31 05:09:04 +000085//===----------------------------------------------------------------------===//
Chris Lattnereec40f92006-08-06 21:55:29 +000086// Error recovery.
87//===----------------------------------------------------------------------===//
88
89/// SkipUntil - Read tokens until we get to the specified token, then consume
90/// it (unless DontConsume is false). Because we cannot guarantee that the
91/// token will ever occur, this skips to the next token, or to some likely
92/// good stopping point. If StopAtSemi is true, skipping will stop at a ';'
93/// character.
94///
95/// If SkipUntil finds the specified token, it returns true, otherwise it
96/// returns false.
97bool Parser::SkipUntil(tok::TokenKind T, bool StopAtSemi, bool DontConsume) {
Chris Lattner5bd57e02006-08-11 06:40:25 +000098 // We always want this function to skip at least one token if the first token
99 // isn't T and if not at EOF.
100 bool isFirstTokenSkipped = true;
Chris Lattnereec40f92006-08-06 21:55:29 +0000101 while (1) {
102 // If we found the token, stop and return true.
103 if (Tok.getKind() == T) {
104 if (DontConsume) {
105 // Noop, don't consume the token.
Chris Lattnereec40f92006-08-06 21:55:29 +0000106 } else {
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000107 ConsumeAnyToken();
Chris Lattnereec40f92006-08-06 21:55:29 +0000108 }
109 return true;
110 }
111
112 switch (Tok.getKind()) {
113 case tok::eof:
114 // Ran out of tokens.
115 return false;
116
117 case tok::l_paren:
118 // Recursively skip properly-nested parens.
119 ConsumeParen();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000120 SkipUntil(tok::r_paren, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000121 break;
122 case tok::l_square:
123 // Recursively skip properly-nested square brackets.
124 ConsumeBracket();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000125 SkipUntil(tok::r_square, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000126 break;
127 case tok::l_brace:
128 // Recursively skip properly-nested braces.
129 ConsumeBrace();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000130 SkipUntil(tok::r_brace, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000131 break;
132
133 // Okay, we found a ']' or '}' or ')', which we think should be balanced.
134 // Since the user wasn't looking for this token (if they were, it would
135 // already be handled), this isn't balanced. If there is a LHS token at a
136 // higher level, we will assume that this matches the unbalanced token
137 // and return it. Otherwise, this is a spurious RHS token, which we skip.
138 case tok::r_paren:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000139 if (ParenCount && !isFirstTokenSkipped)
140 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000141 ConsumeParen();
142 break;
143 case tok::r_square:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000144 if (BracketCount && !isFirstTokenSkipped)
145 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000146 ConsumeBracket();
147 break;
148 case tok::r_brace:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000149 if (BraceCount && !isFirstTokenSkipped)
150 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000151 ConsumeBrace();
152 break;
153
154 case tok::string_literal:
Chris Lattnerd3e98952006-10-06 05:22:26 +0000155 case tok::wide_string_literal:
Chris Lattnereec40f92006-08-06 21:55:29 +0000156 ConsumeStringToken();
157 break;
158 case tok::semi:
159 if (StopAtSemi)
160 return false;
161 // FALL THROUGH.
162 default:
163 // Skip this token.
164 ConsumeToken();
165 break;
166 }
Chris Lattner5bd57e02006-08-11 06:40:25 +0000167 isFirstTokenSkipped = false;
Chris Lattnereec40f92006-08-06 21:55:29 +0000168 }
169}
170
171//===----------------------------------------------------------------------===//
Chris Lattnere4e38592006-08-14 00:15:05 +0000172// Scope manipulation
173//===----------------------------------------------------------------------===//
174
175/// EnterScope - Start a new scope.
176void Parser::EnterScope() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000177 CurScope = new Scope(CurScope);
178}
179
180/// ExitScope - Pop a scope off the scope stack.
181void Parser::ExitScope() {
182 assert(CurScope && "Scope imbalance!");
183
184 // Inform the actions module that this scope is going away.
185 Actions.PopScope(Tok.getLocation(), CurScope);
186
187 Scope *Old = CurScope;
188 CurScope = Old->getParent();
189 delete Old;
190}
191
192
193
194
195//===----------------------------------------------------------------------===//
Chris Lattner70f32b72006-07-31 05:09:04 +0000196// C99 6.9: External Definitions.
197//===----------------------------------------------------------------------===//
Chris Lattner0bb5f832006-07-31 01:59:18 +0000198
Chris Lattner38ba3362006-08-17 07:04:37 +0000199/// Initialize - Warm up the parser.
200///
201void Parser::Initialize() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000202 // Prime the lexer look-ahead.
203 ConsumeToken();
204
205 // Create the global scope, install it as the current scope.
206 assert(CurScope == 0 && "A scope is already active?");
207 EnterScope();
Chris Lattner38ba3362006-08-17 07:04:37 +0000208
Chris Lattner6d7e6342006-08-15 03:41:14 +0000209
210 // Install builtin types.
211 // TODO: Move this someplace more useful.
212 {
213 //__builtin_va_list
214 DeclSpec DS;
215 DS.StorageClassSpec = DeclSpec::SCS_typedef;
216
217 // TODO: add a 'TST_builtin' type?
218 DS.TypeSpecType = DeclSpec::TST_typedef;
Chris Lattner38ba3362006-08-17 07:04:37 +0000219
Chris Lattner6d7e6342006-08-15 03:41:14 +0000220 Declarator D(DS, Declarator::FileContext);
221 D.SetIdentifier(PP.getIdentifierInfo("__builtin_va_list"),SourceLocation());
222 Actions.ParseDeclarator(SourceLocation(), CurScope, D, 0);
223 }
224
Chris Lattner0bb5f832006-07-31 01:59:18 +0000225 if (Tok.getKind() == tok::eof) // Empty source file is an extension.
226 Diag(diag::ext_empty_source_file);
Chris Lattner38ba3362006-08-17 07:04:37 +0000227}
228
229/// ParseTopLevelDecl - Parse one top-level declaration, return whatever the
230/// action tells us to. This returns true if the EOF was encountered.
231bool Parser::ParseTopLevelDecl(DeclTy*& Result) {
232 Result = 0;
233 if (Tok.getKind() == tok::eof) return true;
Chris Lattner0bb5f832006-07-31 01:59:18 +0000234
Chris Lattner38ba3362006-08-17 07:04:37 +0000235 ParseExternalDeclaration();
236 return false;
237}
238
239/// Finalize - Shut down the parser.
240///
241void Parser::Finalize() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000242 ExitScope();
243 assert(CurScope == 0 && "Scope imbalance!");
Chris Lattner0bb5f832006-07-31 01:59:18 +0000244}
245
Chris Lattner38ba3362006-08-17 07:04:37 +0000246/// ParseTranslationUnit:
247/// translation-unit: [C99 6.9]
248/// external-declaration
249/// translation-unit external-declaration
250void Parser::ParseTranslationUnit() {
251 Initialize();
252
253 DeclTy *Res;
254 while (!ParseTopLevelDecl(Res))
255 /*parse them all*/;
256
257 Finalize();
258}
259
Chris Lattner0bb5f832006-07-31 01:59:18 +0000260/// ParseExternalDeclaration:
Chris Lattner70f32b72006-07-31 05:09:04 +0000261/// external-declaration: [C99 6.9]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000262/// function-definition [TODO]
263/// declaration [TODO]
264/// [EXT] ';'
Chris Lattner6d7e6342006-08-15 03:41:14 +0000265/// [GNU] asm-definition
Chris Lattner0bb5f832006-07-31 01:59:18 +0000266/// [GNU] __extension__ external-declaration [TODO]
267/// [OBJC] objc-class-definition [TODO]
268/// [OBJC] objc-class-declaration [TODO]
269/// [OBJC] objc-alias-declaration [TODO]
270/// [OBJC] objc-protocol-definition [TODO]
271/// [OBJC] objc-method-definition [TODO]
272/// [OBJC] @end [TODO]
273///
Chris Lattner6d7e6342006-08-15 03:41:14 +0000274/// [GNU] asm-definition:
275/// simple-asm-expr ';'
276///
Chris Lattner0bb5f832006-07-31 01:59:18 +0000277void Parser::ParseExternalDeclaration() {
278 switch (Tok.getKind()) {
279 case tok::semi:
280 Diag(diag::ext_top_level_semi);
281 ConsumeToken();
282 break;
Chris Lattner6d7e6342006-08-15 03:41:14 +0000283 case tok::kw_asm:
284 ParseSimpleAsm();
285 ExpectAndConsume(tok::semi, diag::err_expected_semi_after,
286 "top-level asm block");
287 break;
Chris Lattner0bb5f832006-07-31 01:59:18 +0000288 default:
289 // We can't tell whether this is a function-definition or declaration yet.
290 ParseDeclarationOrFunctionDefinition();
291 break;
292 }
293}
294
295/// ParseDeclarationOrFunctionDefinition - Parse either a function-definition or
Chris Lattner70f32b72006-07-31 05:09:04 +0000296/// a declaration. We can't tell which we have until we read up to the
297/// compound-statement in function-definition.
Chris Lattner0bb5f832006-07-31 01:59:18 +0000298///
Chris Lattner70f32b72006-07-31 05:09:04 +0000299/// function-definition: [C99 6.9.1]
300/// declaration-specifiers[opt] declarator declaration-list[opt]
301/// compound-statement [TODO]
302/// declaration: [C99 6.7]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000303/// declaration-specifiers init-declarator-list[opt] ';' [TODO]
Chris Lattnerd9c3c592006-08-05 06:26:47 +0000304/// [!C99] init-declarator-list ';' [TODO]
Chris Lattner70f32b72006-07-31 05:09:04 +0000305/// [OMP] threadprivate-directive [TODO]
306///
Chris Lattner0bb5f832006-07-31 01:59:18 +0000307void Parser::ParseDeclarationOrFunctionDefinition() {
Chris Lattner70f32b72006-07-31 05:09:04 +0000308 // Parse the common declaration-specifiers piece.
Chris Lattnerb9093cd2006-08-04 04:39:53 +0000309 DeclSpec DS;
310 ParseDeclarationSpecifiers(DS);
Chris Lattnerd2864882006-08-05 08:09:44 +0000311
312 // C99 6.7.2.3p6: Handle "struct-or-union identifier;", "enum { X };"
Chris Lattner53361ac2006-08-10 05:19:57 +0000313 // declaration-specifiers init-declarator-list[opt] ';'
Chris Lattner0e894622006-08-13 19:58:17 +0000314 if (Tok.getKind() == tok::semi) {
315 // TODO: emit error on 'int;' or 'const enum foo;'.
316 // if (!DS.isMissingDeclaratorOk()) Diag(...);
317
318 ConsumeToken();
319 return;
320 }
Chris Lattner70f32b72006-07-31 05:09:04 +0000321
Chris Lattnerfff824f2006-08-07 06:31:38 +0000322 // Parse the first declarator.
323 Declarator DeclaratorInfo(DS, Declarator::FileContext);
324 ParseDeclarator(DeclaratorInfo);
325 // Error parsing the declarator?
326 if (DeclaratorInfo.getIdentifier() == 0) {
327 // If so, skip until the semi-colon or a }.
328 SkipUntil(tok::r_brace, true);
329 if (Tok.getKind() == tok::semi)
330 ConsumeToken();
331 return;
332 }
Chris Lattner70f32b72006-07-31 05:09:04 +0000333
Chris Lattnerfff824f2006-08-07 06:31:38 +0000334 // If the declarator is the start of a function definition, handle it.
335 if (Tok.getKind() == tok::equal || // int X()= -> not a function def
336 Tok.getKind() == tok::comma || // int X(), -> not a function def
337 Tok.getKind() == tok::semi || // int X(); -> not a function def
338 Tok.getKind() == tok::kw_asm || // int X() __asm__ -> not a fn def
339 Tok.getKind() == tok::kw___attribute) {// int X() __attr__ -> not a fn def
340 // FALL THROUGH.
341 } else if (DeclaratorInfo.isInnermostFunctionType() &&
342 (Tok.getKind() == tok::l_brace || // int X() {}
343 isDeclarationSpecifier())) { // int X(f) int f; {}
344 ParseFunctionDefinition(DeclaratorInfo);
345 return;
346 } else {
347 if (DeclaratorInfo.isInnermostFunctionType())
348 Diag(Tok, diag::err_expected_fn_body);
349 else
350 Diag(Tok, diag::err_expected_after_declarator);
Chris Lattnere4e38592006-08-14 00:15:05 +0000351 SkipUntil(tok::semi);
Chris Lattnerfff824f2006-08-07 06:31:38 +0000352 return;
353 }
Chris Lattnerd9c3c592006-08-05 06:26:47 +0000354
Chris Lattner53361ac2006-08-10 05:19:57 +0000355 // Parse the init-declarator-list for a normal declaration.
356 ParseInitDeclaratorListAfterFirstDeclarator(DeclaratorInfo);
Chris Lattner70f32b72006-07-31 05:09:04 +0000357}
358
Chris Lattnerfff824f2006-08-07 06:31:38 +0000359/// ParseFunctionDefinition - We parsed and verified that the specified
360/// Declarator is well formed. If this is a K&R-style function, read the
361/// parameters declaration-list, then start the compound-statement.
362///
363/// declaration-specifiers[opt] declarator declaration-list[opt]
364/// compound-statement [TODO]
365///
366void Parser::ParseFunctionDefinition(Declarator &D) {
367 const DeclaratorTypeInfo &FnTypeInfo = D.getTypeObject(0);
368 assert(FnTypeInfo.Kind == DeclaratorTypeInfo::Function &&
369 "This isn't a function declarator!");
370
371 // If this declaration was formed with a K&R-style identifier list for the
372 // arguments, parse declarations for all of the args next.
373 // int foo(a,b) int a; float b; {}
374 if (!FnTypeInfo.Fun.hasPrototype && !FnTypeInfo.Fun.isEmpty) {
375 // Read all the argument declarations.
Chris Lattner53361ac2006-08-10 05:19:57 +0000376 while (isDeclarationSpecifier())
377 ParseDeclaration(Declarator::KNRTypeListContext);
Chris Lattnerfff824f2006-08-07 06:31:38 +0000378
379 // Note, check that we got them all.
380 } else {
381 //if (isDeclarationSpecifier())
382 // Diag('k&r declspecs with prototype?');
383
Chris Lattner8693a512006-08-13 21:54:02 +0000384 // TODO: Install the arguments into the current scope.
Chris Lattnerfff824f2006-08-07 06:31:38 +0000385 }
386
Chris Lattner0ccd51e2006-08-09 05:47:47 +0000387 // We should have an opening brace now.
388 if (Tok.getKind() != tok::l_brace) {
389 Diag(Tok, diag::err_expected_fn_body);
390
391 // Skip over garbage, until we get to '{'. Don't eat the '{'.
392 SkipUntil(tok::l_brace, true, true);
393
394 // If we didn't find the '{', bail out.
395 if (Tok.getKind() != tok::l_brace)
396 return;
397 }
Chris Lattnerfff824f2006-08-07 06:31:38 +0000398
Chris Lattner0ccd51e2006-08-09 05:47:47 +0000399 ParseCompoundStatement();
Chris Lattnerfff824f2006-08-07 06:31:38 +0000400}
401
Chris Lattner0116c472006-08-15 06:03:28 +0000402/// ParseAsmStringLiteral - This is just a normal string-literal, but is not
403/// allowed to be a wide string, and is not subject to character translation.
404///
405/// [GNU] asm-string-literal:
406/// string-literal
407///
408void Parser::ParseAsmStringLiteral() {
Chris Lattnerd3e98952006-10-06 05:22:26 +0000409 if (!isTokenStringLiteral()) {
Chris Lattner0116c472006-08-15 06:03:28 +0000410 Diag(Tok, diag::err_expected_string_literal);
411 return;
412 }
413
414 ExprResult Res = ParseStringLiteralExpression();
415 if (Res.isInvalid) return;
416
417 // TODO: Diagnose: wide string literal in 'asm'
418}
419
Chris Lattner6d7e6342006-08-15 03:41:14 +0000420/// ParseSimpleAsm
421///
422/// [GNU] simple-asm-expr:
423/// 'asm' '(' asm-string-literal ')'
Chris Lattner6d7e6342006-08-15 03:41:14 +0000424///
425void Parser::ParseSimpleAsm() {
426 assert(Tok.getKind() == tok::kw_asm && "Not an asm!");
427 ConsumeToken();
428
429 if (Tok.getKind() != tok::l_paren) {
430 Diag(Tok, diag::err_expected_lparen_after, "asm");
431 return;
432 }
433
434 SourceLocation Loc = Tok.getLocation();
435 ConsumeParen();
436
Chris Lattner0116c472006-08-15 06:03:28 +0000437 ParseAsmStringLiteral();
Chris Lattner6d7e6342006-08-15 03:41:14 +0000438
Chris Lattner04f80192006-08-15 04:55:54 +0000439 MatchRHSPunctuation(tok::r_paren, Loc);
Chris Lattner6d7e6342006-08-15 03:41:14 +0000440}