blob: c74c634632c87e4035a2b49c9d804be9a9a32bd9 [file] [log] [blame]
//===--- Parser.cpp - C Language Family Parser ----------------------------===//
//
// The LLVM Compiler Infrastructure
//
// This file was developed by Chris Lattner and is distributed under
// the University of Illinois Open Source License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements the Parser interfaces.
//
//===----------------------------------------------------------------------===//
13
14#include "clang/Parse/Parser.h"
Chris Lattnerb9093cd2006-08-04 04:39:53 +000015#include "clang/Parse/Declarations.h"
Chris Lattner971c6b62006-08-05 22:46:42 +000016#include "clang/Parse/Scope.h"
Chris Lattner0bb5f832006-07-31 01:59:18 +000017using namespace llvm;
18using namespace clang;
19
Chris Lattner685ed1e2006-08-14 00:22:04 +000020Parser::Parser(Preprocessor &pp, Action &actions)
Chris Lattner971c6b62006-08-05 22:46:42 +000021 : PP(pp), Actions(actions), Diags(PP.getDiagnostics()) {
Chris Lattneracd58a32006-08-06 17:24:14 +000022 Tok.SetKind(tok::eof);
Chris Lattnere4e38592006-08-14 00:15:05 +000023 CurScope = 0;
Chris Lattnereec40f92006-08-06 21:55:29 +000024
25 ParenCount = BracketCount = BraceCount = 0;
Chris Lattner971c6b62006-08-05 22:46:42 +000026}
27
28Parser::~Parser() {
Chris Lattnere4e38592006-08-14 00:15:05 +000029 // If we still have scopes active, delete the scope tree.
Chris Lattner971c6b62006-08-05 22:46:42 +000030 delete CurScope;
31}
32
Chris Lattner685ed1e2006-08-14 00:22:04 +000033/// Out-of-line virtual destructor to provide home for Action class.
34Action::~Action() {}
Chris Lattnere4e38592006-08-14 00:15:05 +000035
Chris Lattner0bb5f832006-07-31 01:59:18 +000036
Chris Lattnerb9093cd2006-08-04 04:39:53 +000037void Parser::Diag(SourceLocation Loc, unsigned DiagID,
Chris Lattner0bb5f832006-07-31 01:59:18 +000038 const std::string &Msg) {
Chris Lattnerb9093cd2006-08-04 04:39:53 +000039 Diags.Report(Loc, DiagID, Msg);
Chris Lattner0bb5f832006-07-31 01:59:18 +000040}
41
Chris Lattner4564bc12006-08-10 23:14:52 +000042/// MatchRHSPunctuation - For punctuation with a LHS and RHS (e.g. '['/']'),
43/// this helper function matches and consumes the specified RHS token if
44/// present. If not present, it emits the specified diagnostic indicating
45/// that the parser failed to match the RHS of the token at LHSLoc. LHSName
46/// should be the name of the unmatched LHS token.
Chris Lattner04f80192006-08-15 04:55:54 +000047void Parser::MatchRHSPunctuation(tok::TokenKind RHSTok, SourceLocation LHSLoc) {
Chris Lattner4564bc12006-08-10 23:14:52 +000048
49 if (Tok.getKind() == RHSTok) {
Chris Lattnerdbb2a462006-08-12 19:26:13 +000050 ConsumeAnyToken();
Chris Lattner4564bc12006-08-10 23:14:52 +000051 } else {
Chris Lattner04f80192006-08-15 04:55:54 +000052 const char *LHSName = "unknown";
53 diag::kind DID = diag::err_parse_error;
54 switch (RHSTok) {
55 default: break;
56 case tok::r_paren : LHSName = "("; DID = diag::err_expected_rparen; break;
57 case tok::r_brace : LHSName = "{"; DID = diag::err_expected_rbrace; break;
58 case tok::r_square: LHSName = "["; DID = diag::err_expected_rsquare; break;
59 }
60 Diag(Tok, DID);
Chris Lattner4564bc12006-08-10 23:14:52 +000061 Diag(LHSLoc, diag::err_matching, LHSName);
62 SkipUntil(RHSTok);
63 }
64}
65
Chris Lattnerdbb2a462006-08-12 19:26:13 +000066/// ExpectAndConsume - The parser expects that 'ExpectedTok' is next in the
67/// input. If so, it is consumed and false is returned.
68///
69/// If the input is malformed, this emits the specified diagnostic. Next, if
70/// SkipToTok is specified, it calls SkipUntil(SkipToTok). Finally, true is
71/// returned.
72bool Parser::ExpectAndConsume(tok::TokenKind ExpectedTok, unsigned DiagID,
Chris Lattner6d7e6342006-08-15 03:41:14 +000073 const char *Msg, tok::TokenKind SkipToTok) {
Chris Lattnerdbb2a462006-08-12 19:26:13 +000074 if (Tok.getKind() == ExpectedTok) {
Chris Lattner15a00da2006-08-15 04:10:31 +000075 ConsumeAnyToken();
Chris Lattnerdbb2a462006-08-12 19:26:13 +000076 return false;
77 }
78
Chris Lattner6d7e6342006-08-15 03:41:14 +000079 Diag(Tok, DiagID, Msg);
Chris Lattnerdbb2a462006-08-12 19:26:13 +000080 if (SkipToTok != tok::unknown)
81 SkipUntil(SkipToTok);
82 return true;
83}
84
//===----------------------------------------------------------------------===//
// Error recovery.
//===----------------------------------------------------------------------===//
88
89/// SkipUntil - Read tokens until we get to the specified token, then consume
90/// it (unless DontConsume is false). Because we cannot guarantee that the
91/// token will ever occur, this skips to the next token, or to some likely
92/// good stopping point. If StopAtSemi is true, skipping will stop at a ';'
93/// character.
94///
95/// If SkipUntil finds the specified token, it returns true, otherwise it
96/// returns false.
97bool Parser::SkipUntil(tok::TokenKind T, bool StopAtSemi, bool DontConsume) {
Chris Lattner5bd57e02006-08-11 06:40:25 +000098 // We always want this function to skip at least one token if the first token
99 // isn't T and if not at EOF.
100 bool isFirstTokenSkipped = true;
Chris Lattnereec40f92006-08-06 21:55:29 +0000101 while (1) {
102 // If we found the token, stop and return true.
103 if (Tok.getKind() == T) {
104 if (DontConsume) {
105 // Noop, don't consume the token.
Chris Lattnereec40f92006-08-06 21:55:29 +0000106 } else {
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000107 ConsumeAnyToken();
Chris Lattnereec40f92006-08-06 21:55:29 +0000108 }
109 return true;
110 }
111
112 switch (Tok.getKind()) {
113 case tok::eof:
114 // Ran out of tokens.
115 return false;
116
117 case tok::l_paren:
118 // Recursively skip properly-nested parens.
119 ConsumeParen();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000120 SkipUntil(tok::r_paren, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000121 break;
122 case tok::l_square:
123 // Recursively skip properly-nested square brackets.
124 ConsumeBracket();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000125 SkipUntil(tok::r_square, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000126 break;
127 case tok::l_brace:
128 // Recursively skip properly-nested braces.
129 ConsumeBrace();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000130 SkipUntil(tok::r_brace, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000131 break;
132
133 // Okay, we found a ']' or '}' or ')', which we think should be balanced.
134 // Since the user wasn't looking for this token (if they were, it would
135 // already be handled), this isn't balanced. If there is a LHS token at a
136 // higher level, we will assume that this matches the unbalanced token
137 // and return it. Otherwise, this is a spurious RHS token, which we skip.
138 case tok::r_paren:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000139 if (ParenCount && !isFirstTokenSkipped)
140 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000141 ConsumeParen();
142 break;
143 case tok::r_square:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000144 if (BracketCount && !isFirstTokenSkipped)
145 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000146 ConsumeBracket();
147 break;
148 case tok::r_brace:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000149 if (BraceCount && !isFirstTokenSkipped)
150 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000151 ConsumeBrace();
152 break;
153
154 case tok::string_literal:
155 ConsumeStringToken();
156 break;
157 case tok::semi:
158 if (StopAtSemi)
159 return false;
160 // FALL THROUGH.
161 default:
162 // Skip this token.
163 ConsumeToken();
164 break;
165 }
Chris Lattner5bd57e02006-08-11 06:40:25 +0000166 isFirstTokenSkipped = false;
Chris Lattnereec40f92006-08-06 21:55:29 +0000167 }
168}
169
//===----------------------------------------------------------------------===//
// Scope manipulation
//===----------------------------------------------------------------------===//
173
174/// EnterScope - Start a new scope.
175void Parser::EnterScope() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000176 CurScope = new Scope(CurScope);
177}
178
179/// ExitScope - Pop a scope off the scope stack.
180void Parser::ExitScope() {
181 assert(CurScope && "Scope imbalance!");
182
183 // Inform the actions module that this scope is going away.
184 Actions.PopScope(Tok.getLocation(), CurScope);
185
186 Scope *Old = CurScope;
187 CurScope = Old->getParent();
188 delete Old;
189}
190
191
192
193
//===----------------------------------------------------------------------===//
// C99 6.9: External Definitions.
//===----------------------------------------------------------------------===//
Chris Lattner0bb5f832006-07-31 01:59:18 +0000197
Chris Lattner38ba3362006-08-17 07:04:37 +0000198/// Initialize - Warm up the parser.
199///
200void Parser::Initialize() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000201 // Prime the lexer look-ahead.
202 ConsumeToken();
203
204 // Create the global scope, install it as the current scope.
205 assert(CurScope == 0 && "A scope is already active?");
206 EnterScope();
Chris Lattner38ba3362006-08-17 07:04:37 +0000207
Chris Lattner6d7e6342006-08-15 03:41:14 +0000208
209 // Install builtin types.
210 // TODO: Move this someplace more useful.
211 {
212 //__builtin_va_list
213 DeclSpec DS;
214 DS.StorageClassSpec = DeclSpec::SCS_typedef;
215
216 // TODO: add a 'TST_builtin' type?
217 DS.TypeSpecType = DeclSpec::TST_typedef;
Chris Lattner38ba3362006-08-17 07:04:37 +0000218
Chris Lattner6d7e6342006-08-15 03:41:14 +0000219 Declarator D(DS, Declarator::FileContext);
220 D.SetIdentifier(PP.getIdentifierInfo("__builtin_va_list"),SourceLocation());
221 Actions.ParseDeclarator(SourceLocation(), CurScope, D, 0);
222 }
223
Chris Lattner0bb5f832006-07-31 01:59:18 +0000224 if (Tok.getKind() == tok::eof) // Empty source file is an extension.
225 Diag(diag::ext_empty_source_file);
Chris Lattner38ba3362006-08-17 07:04:37 +0000226}
227
228/// ParseTopLevelDecl - Parse one top-level declaration, return whatever the
229/// action tells us to. This returns true if the EOF was encountered.
230bool Parser::ParseTopLevelDecl(DeclTy*& Result) {
231 Result = 0;
232 if (Tok.getKind() == tok::eof) return true;
Chris Lattner0bb5f832006-07-31 01:59:18 +0000233
Chris Lattner38ba3362006-08-17 07:04:37 +0000234 ParseExternalDeclaration();
235 return false;
236}
237
238/// Finalize - Shut down the parser.
239///
240void Parser::Finalize() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000241 ExitScope();
242 assert(CurScope == 0 && "Scope imbalance!");
Chris Lattner0bb5f832006-07-31 01:59:18 +0000243}
244
Chris Lattner38ba3362006-08-17 07:04:37 +0000245/// ParseTranslationUnit:
246/// translation-unit: [C99 6.9]
247/// external-declaration
248/// translation-unit external-declaration
249void Parser::ParseTranslationUnit() {
250 Initialize();
251
252 DeclTy *Res;
253 while (!ParseTopLevelDecl(Res))
254 /*parse them all*/;
255
256 Finalize();
257}
258
Chris Lattner0bb5f832006-07-31 01:59:18 +0000259/// ParseExternalDeclaration:
Chris Lattner70f32b72006-07-31 05:09:04 +0000260/// external-declaration: [C99 6.9]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000261/// function-definition [TODO]
262/// declaration [TODO]
263/// [EXT] ';'
Chris Lattner6d7e6342006-08-15 03:41:14 +0000264/// [GNU] asm-definition
Chris Lattner0bb5f832006-07-31 01:59:18 +0000265/// [GNU] __extension__ external-declaration [TODO]
266/// [OBJC] objc-class-definition [TODO]
267/// [OBJC] objc-class-declaration [TODO]
268/// [OBJC] objc-alias-declaration [TODO]
269/// [OBJC] objc-protocol-definition [TODO]
270/// [OBJC] objc-method-definition [TODO]
271/// [OBJC] @end [TODO]
272///
Chris Lattner6d7e6342006-08-15 03:41:14 +0000273/// [GNU] asm-definition:
274/// simple-asm-expr ';'
275///
Chris Lattner0bb5f832006-07-31 01:59:18 +0000276void Parser::ParseExternalDeclaration() {
277 switch (Tok.getKind()) {
278 case tok::semi:
279 Diag(diag::ext_top_level_semi);
280 ConsumeToken();
281 break;
Chris Lattner6d7e6342006-08-15 03:41:14 +0000282 case tok::kw_asm:
283 ParseSimpleAsm();
284 ExpectAndConsume(tok::semi, diag::err_expected_semi_after,
285 "top-level asm block");
286 break;
Chris Lattner0bb5f832006-07-31 01:59:18 +0000287 default:
288 // We can't tell whether this is a function-definition or declaration yet.
289 ParseDeclarationOrFunctionDefinition();
290 break;
291 }
292}
293
294/// ParseDeclarationOrFunctionDefinition - Parse either a function-definition or
Chris Lattner70f32b72006-07-31 05:09:04 +0000295/// a declaration. We can't tell which we have until we read up to the
296/// compound-statement in function-definition.
Chris Lattner0bb5f832006-07-31 01:59:18 +0000297///
Chris Lattner70f32b72006-07-31 05:09:04 +0000298/// function-definition: [C99 6.9.1]
299/// declaration-specifiers[opt] declarator declaration-list[opt]
300/// compound-statement [TODO]
301/// declaration: [C99 6.7]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000302/// declaration-specifiers init-declarator-list[opt] ';' [TODO]
Chris Lattnerd9c3c592006-08-05 06:26:47 +0000303/// [!C99] init-declarator-list ';' [TODO]
Chris Lattner70f32b72006-07-31 05:09:04 +0000304/// [OMP] threadprivate-directive [TODO]
305///
Chris Lattner0bb5f832006-07-31 01:59:18 +0000306void Parser::ParseDeclarationOrFunctionDefinition() {
Chris Lattner70f32b72006-07-31 05:09:04 +0000307 // Parse the common declaration-specifiers piece.
Chris Lattnerb9093cd2006-08-04 04:39:53 +0000308 DeclSpec DS;
309 ParseDeclarationSpecifiers(DS);
Chris Lattnerd2864882006-08-05 08:09:44 +0000310
311 // C99 6.7.2.3p6: Handle "struct-or-union identifier;", "enum { X };"
Chris Lattner53361ac2006-08-10 05:19:57 +0000312 // declaration-specifiers init-declarator-list[opt] ';'
Chris Lattner0e894622006-08-13 19:58:17 +0000313 if (Tok.getKind() == tok::semi) {
314 // TODO: emit error on 'int;' or 'const enum foo;'.
315 // if (!DS.isMissingDeclaratorOk()) Diag(...);
316
317 ConsumeToken();
318 return;
319 }
Chris Lattner70f32b72006-07-31 05:09:04 +0000320
Chris Lattnerfff824f2006-08-07 06:31:38 +0000321 // Parse the first declarator.
322 Declarator DeclaratorInfo(DS, Declarator::FileContext);
323 ParseDeclarator(DeclaratorInfo);
324 // Error parsing the declarator?
325 if (DeclaratorInfo.getIdentifier() == 0) {
326 // If so, skip until the semi-colon or a }.
327 SkipUntil(tok::r_brace, true);
328 if (Tok.getKind() == tok::semi)
329 ConsumeToken();
330 return;
331 }
Chris Lattner70f32b72006-07-31 05:09:04 +0000332
Chris Lattnerfff824f2006-08-07 06:31:38 +0000333 // If the declarator is the start of a function definition, handle it.
334 if (Tok.getKind() == tok::equal || // int X()= -> not a function def
335 Tok.getKind() == tok::comma || // int X(), -> not a function def
336 Tok.getKind() == tok::semi || // int X(); -> not a function def
337 Tok.getKind() == tok::kw_asm || // int X() __asm__ -> not a fn def
338 Tok.getKind() == tok::kw___attribute) {// int X() __attr__ -> not a fn def
339 // FALL THROUGH.
340 } else if (DeclaratorInfo.isInnermostFunctionType() &&
341 (Tok.getKind() == tok::l_brace || // int X() {}
342 isDeclarationSpecifier())) { // int X(f) int f; {}
343 ParseFunctionDefinition(DeclaratorInfo);
344 return;
345 } else {
346 if (DeclaratorInfo.isInnermostFunctionType())
347 Diag(Tok, diag::err_expected_fn_body);
348 else
349 Diag(Tok, diag::err_expected_after_declarator);
Chris Lattnere4e38592006-08-14 00:15:05 +0000350 SkipUntil(tok::semi);
Chris Lattnerfff824f2006-08-07 06:31:38 +0000351 return;
352 }
Chris Lattnerd9c3c592006-08-05 06:26:47 +0000353
Chris Lattner53361ac2006-08-10 05:19:57 +0000354 // Parse the init-declarator-list for a normal declaration.
355 ParseInitDeclaratorListAfterFirstDeclarator(DeclaratorInfo);
Chris Lattner70f32b72006-07-31 05:09:04 +0000356}
357
Chris Lattnerfff824f2006-08-07 06:31:38 +0000358/// ParseFunctionDefinition - We parsed and verified that the specified
359/// Declarator is well formed. If this is a K&R-style function, read the
360/// parameters declaration-list, then start the compound-statement.
361///
362/// declaration-specifiers[opt] declarator declaration-list[opt]
363/// compound-statement [TODO]
364///
365void Parser::ParseFunctionDefinition(Declarator &D) {
366 const DeclaratorTypeInfo &FnTypeInfo = D.getTypeObject(0);
367 assert(FnTypeInfo.Kind == DeclaratorTypeInfo::Function &&
368 "This isn't a function declarator!");
369
370 // If this declaration was formed with a K&R-style identifier list for the
371 // arguments, parse declarations for all of the args next.
372 // int foo(a,b) int a; float b; {}
373 if (!FnTypeInfo.Fun.hasPrototype && !FnTypeInfo.Fun.isEmpty) {
374 // Read all the argument declarations.
Chris Lattner53361ac2006-08-10 05:19:57 +0000375 while (isDeclarationSpecifier())
376 ParseDeclaration(Declarator::KNRTypeListContext);
Chris Lattnerfff824f2006-08-07 06:31:38 +0000377
378 // Note, check that we got them all.
379 } else {
380 //if (isDeclarationSpecifier())
381 // Diag('k&r declspecs with prototype?');
382
Chris Lattner8693a512006-08-13 21:54:02 +0000383 // TODO: Install the arguments into the current scope.
Chris Lattnerfff824f2006-08-07 06:31:38 +0000384 }
385
Chris Lattner0ccd51e2006-08-09 05:47:47 +0000386 // We should have an opening brace now.
387 if (Tok.getKind() != tok::l_brace) {
388 Diag(Tok, diag::err_expected_fn_body);
389
390 // Skip over garbage, until we get to '{'. Don't eat the '{'.
391 SkipUntil(tok::l_brace, true, true);
392
393 // If we didn't find the '{', bail out.
394 if (Tok.getKind() != tok::l_brace)
395 return;
396 }
Chris Lattnerfff824f2006-08-07 06:31:38 +0000397
Chris Lattner0ccd51e2006-08-09 05:47:47 +0000398 ParseCompoundStatement();
Chris Lattnerfff824f2006-08-07 06:31:38 +0000399}
400
Chris Lattner0116c472006-08-15 06:03:28 +0000401/// ParseAsmStringLiteral - This is just a normal string-literal, but is not
402/// allowed to be a wide string, and is not subject to character translation.
403///
404/// [GNU] asm-string-literal:
405/// string-literal
406///
407void Parser::ParseAsmStringLiteral() {
408 if (Tok.getKind() != tok::string_literal) {
409 Diag(Tok, diag::err_expected_string_literal);
410 return;
411 }
412
413 ExprResult Res = ParseStringLiteralExpression();
414 if (Res.isInvalid) return;
415
416 // TODO: Diagnose: wide string literal in 'asm'
417}
418
Chris Lattner6d7e6342006-08-15 03:41:14 +0000419/// ParseSimpleAsm
420///
421/// [GNU] simple-asm-expr:
422/// 'asm' '(' asm-string-literal ')'
Chris Lattner6d7e6342006-08-15 03:41:14 +0000423///
424void Parser::ParseSimpleAsm() {
425 assert(Tok.getKind() == tok::kw_asm && "Not an asm!");
426 ConsumeToken();
427
428 if (Tok.getKind() != tok::l_paren) {
429 Diag(Tok, diag::err_expected_lparen_after, "asm");
430 return;
431 }
432
433 SourceLocation Loc = Tok.getLocation();
434 ConsumeParen();
435
Chris Lattner0116c472006-08-15 06:03:28 +0000436 ParseAsmStringLiteral();
Chris Lattner6d7e6342006-08-15 03:41:14 +0000437
Chris Lattner04f80192006-08-15 04:55:54 +0000438 MatchRHSPunctuation(tok::r_paren, Loc);
Chris Lattner6d7e6342006-08-15 03:41:14 +0000439}