blob: 228551dcb114596e8457af78b093ef55c2da27cf [file] [log] [blame]
//===--- Parser.cpp - C Language Family Parser ----------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file was developed by Chris Lattner and is distributed under
// the University of Illinois Open Source License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
//  This file implements the Parser interfaces.
//
//===----------------------------------------------------------------------===//
13
14#include "clang/Parse/Parser.h"
Chris Lattnerb9093cd2006-08-04 04:39:53 +000015#include "clang/Parse/Declarations.h"
Chris Lattner971c6b62006-08-05 22:46:42 +000016#include "clang/Parse/Scope.h"
Chris Lattner0bb5f832006-07-31 01:59:18 +000017using namespace llvm;
18using namespace clang;
19
Chris Lattner685ed1e2006-08-14 00:22:04 +000020Parser::Parser(Preprocessor &pp, Action &actions)
Chris Lattner971c6b62006-08-05 22:46:42 +000021 : PP(pp), Actions(actions), Diags(PP.getDiagnostics()) {
Chris Lattneracd58a32006-08-06 17:24:14 +000022 Tok.SetKind(tok::eof);
Chris Lattnere4e38592006-08-14 00:15:05 +000023 CurScope = 0;
Chris Lattnereec40f92006-08-06 21:55:29 +000024
25 ParenCount = BracketCount = BraceCount = 0;
Chris Lattner971c6b62006-08-05 22:46:42 +000026}
27
28Parser::~Parser() {
Chris Lattnere4e38592006-08-14 00:15:05 +000029 // If we still have scopes active, delete the scope tree.
Chris Lattner971c6b62006-08-05 22:46:42 +000030 delete CurScope;
31}
32
Chris Lattner685ed1e2006-08-14 00:22:04 +000033/// Out-of-line virtual destructor to provide home for Action class.
34Action::~Action() {}
Chris Lattnere4e38592006-08-14 00:15:05 +000035
Chris Lattner0bb5f832006-07-31 01:59:18 +000036
Chris Lattnerb9093cd2006-08-04 04:39:53 +000037void Parser::Diag(SourceLocation Loc, unsigned DiagID,
Chris Lattner0bb5f832006-07-31 01:59:18 +000038 const std::string &Msg) {
Chris Lattnerb9093cd2006-08-04 04:39:53 +000039 Diags.Report(Loc, DiagID, Msg);
Chris Lattner0bb5f832006-07-31 01:59:18 +000040}
41
Chris Lattner4564bc12006-08-10 23:14:52 +000042/// MatchRHSPunctuation - For punctuation with a LHS and RHS (e.g. '['/']'),
43/// this helper function matches and consumes the specified RHS token if
44/// present. If not present, it emits the specified diagnostic indicating
45/// that the parser failed to match the RHS of the token at LHSLoc. LHSName
46/// should be the name of the unmatched LHS token.
Chris Lattner04f80192006-08-15 04:55:54 +000047void Parser::MatchRHSPunctuation(tok::TokenKind RHSTok, SourceLocation LHSLoc) {
Chris Lattner4564bc12006-08-10 23:14:52 +000048
49 if (Tok.getKind() == RHSTok) {
Chris Lattnerdbb2a462006-08-12 19:26:13 +000050 ConsumeAnyToken();
Chris Lattner4564bc12006-08-10 23:14:52 +000051 } else {
Chris Lattner04f80192006-08-15 04:55:54 +000052 const char *LHSName = "unknown";
53 diag::kind DID = diag::err_parse_error;
54 switch (RHSTok) {
55 default: break;
56 case tok::r_paren : LHSName = "("; DID = diag::err_expected_rparen; break;
57 case tok::r_brace : LHSName = "{"; DID = diag::err_expected_rbrace; break;
58 case tok::r_square: LHSName = "["; DID = diag::err_expected_rsquare; break;
59 }
60 Diag(Tok, DID);
Chris Lattner4564bc12006-08-10 23:14:52 +000061 Diag(LHSLoc, diag::err_matching, LHSName);
62 SkipUntil(RHSTok);
63 }
64}
65
Chris Lattnerdbb2a462006-08-12 19:26:13 +000066/// ExpectAndConsume - The parser expects that 'ExpectedTok' is next in the
67/// input. If so, it is consumed and false is returned.
68///
69/// If the input is malformed, this emits the specified diagnostic. Next, if
70/// SkipToTok is specified, it calls SkipUntil(SkipToTok). Finally, true is
71/// returned.
72bool Parser::ExpectAndConsume(tok::TokenKind ExpectedTok, unsigned DiagID,
Chris Lattner6d7e6342006-08-15 03:41:14 +000073 const char *Msg, tok::TokenKind SkipToTok) {
Chris Lattnerdbb2a462006-08-12 19:26:13 +000074 if (Tok.getKind() == ExpectedTok) {
Chris Lattner15a00da2006-08-15 04:10:31 +000075 ConsumeAnyToken();
Chris Lattnerdbb2a462006-08-12 19:26:13 +000076 return false;
77 }
78
Chris Lattner6d7e6342006-08-15 03:41:14 +000079 Diag(Tok, DiagID, Msg);
Chris Lattnerdbb2a462006-08-12 19:26:13 +000080 if (SkipToTok != tok::unknown)
81 SkipUntil(SkipToTok);
82 return true;
83}
84
Chris Lattner70f32b72006-07-31 05:09:04 +000085//===----------------------------------------------------------------------===//
Chris Lattnereec40f92006-08-06 21:55:29 +000086// Error recovery.
87//===----------------------------------------------------------------------===//
88
89/// SkipUntil - Read tokens until we get to the specified token, then consume
90/// it (unless DontConsume is false). Because we cannot guarantee that the
91/// token will ever occur, this skips to the next token, or to some likely
92/// good stopping point. If StopAtSemi is true, skipping will stop at a ';'
93/// character.
94///
95/// If SkipUntil finds the specified token, it returns true, otherwise it
96/// returns false.
97bool Parser::SkipUntil(tok::TokenKind T, bool StopAtSemi, bool DontConsume) {
Chris Lattner5bd57e02006-08-11 06:40:25 +000098 // We always want this function to skip at least one token if the first token
99 // isn't T and if not at EOF.
100 bool isFirstTokenSkipped = true;
Chris Lattnereec40f92006-08-06 21:55:29 +0000101 while (1) {
102 // If we found the token, stop and return true.
103 if (Tok.getKind() == T) {
104 if (DontConsume) {
105 // Noop, don't consume the token.
Chris Lattnereec40f92006-08-06 21:55:29 +0000106 } else {
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000107 ConsumeAnyToken();
Chris Lattnereec40f92006-08-06 21:55:29 +0000108 }
109 return true;
110 }
111
112 switch (Tok.getKind()) {
113 case tok::eof:
114 // Ran out of tokens.
115 return false;
116
117 case tok::l_paren:
118 // Recursively skip properly-nested parens.
119 ConsumeParen();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000120 SkipUntil(tok::r_paren, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000121 break;
122 case tok::l_square:
123 // Recursively skip properly-nested square brackets.
124 ConsumeBracket();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000125 SkipUntil(tok::r_square, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000126 break;
127 case tok::l_brace:
128 // Recursively skip properly-nested braces.
129 ConsumeBrace();
Chris Lattner5bd57e02006-08-11 06:40:25 +0000130 SkipUntil(tok::r_brace, false);
Chris Lattnereec40f92006-08-06 21:55:29 +0000131 break;
132
133 // Okay, we found a ']' or '}' or ')', which we think should be balanced.
134 // Since the user wasn't looking for this token (if they were, it would
135 // already be handled), this isn't balanced. If there is a LHS token at a
136 // higher level, we will assume that this matches the unbalanced token
137 // and return it. Otherwise, this is a spurious RHS token, which we skip.
138 case tok::r_paren:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000139 if (ParenCount && !isFirstTokenSkipped)
140 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000141 ConsumeParen();
142 break;
143 case tok::r_square:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000144 if (BracketCount && !isFirstTokenSkipped)
145 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000146 ConsumeBracket();
147 break;
148 case tok::r_brace:
Chris Lattner5bd57e02006-08-11 06:40:25 +0000149 if (BraceCount && !isFirstTokenSkipped)
150 return false; // Matches something.
Chris Lattnereec40f92006-08-06 21:55:29 +0000151 ConsumeBrace();
152 break;
153
154 case tok::string_literal:
155 ConsumeStringToken();
156 break;
157 case tok::semi:
158 if (StopAtSemi)
159 return false;
160 // FALL THROUGH.
161 default:
162 // Skip this token.
163 ConsumeToken();
164 break;
165 }
Chris Lattner5bd57e02006-08-11 06:40:25 +0000166 isFirstTokenSkipped = false;
Chris Lattnereec40f92006-08-06 21:55:29 +0000167 }
168}
169
170//===----------------------------------------------------------------------===//
Chris Lattnere4e38592006-08-14 00:15:05 +0000171// Scope manipulation
172//===----------------------------------------------------------------------===//
173
174/// EnterScope - Start a new scope.
175void Parser::EnterScope() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000176 CurScope = new Scope(CurScope);
177}
178
179/// ExitScope - Pop a scope off the scope stack.
180void Parser::ExitScope() {
181 assert(CurScope && "Scope imbalance!");
182
183 // Inform the actions module that this scope is going away.
184 Actions.PopScope(Tok.getLocation(), CurScope);
185
186 Scope *Old = CurScope;
187 CurScope = Old->getParent();
188 delete Old;
189}
190
191
192
193
194//===----------------------------------------------------------------------===//
Chris Lattner70f32b72006-07-31 05:09:04 +0000195// C99 6.9: External Definitions.
196//===----------------------------------------------------------------------===//
Chris Lattner0bb5f832006-07-31 01:59:18 +0000197
198/// ParseTranslationUnit:
Chris Lattner70f32b72006-07-31 05:09:04 +0000199/// translation-unit: [C99 6.9]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000200/// external-declaration
201/// translation-unit external-declaration
202void Parser::ParseTranslationUnit() {
Chris Lattnere4e38592006-08-14 00:15:05 +0000203 // Prime the lexer look-ahead.
204 ConsumeToken();
205
206 // Create the global scope, install it as the current scope.
207 assert(CurScope == 0 && "A scope is already active?");
208 EnterScope();
Chris Lattner0bb5f832006-07-31 01:59:18 +0000209
Chris Lattner6d7e6342006-08-15 03:41:14 +0000210
211 // Install builtin types.
212 // TODO: Move this someplace more useful.
213 {
214 //__builtin_va_list
215 DeclSpec DS;
216 DS.StorageClassSpec = DeclSpec::SCS_typedef;
217
218 // TODO: add a 'TST_builtin' type?
219 DS.TypeSpecType = DeclSpec::TST_typedef;
220
221 Declarator D(DS, Declarator::FileContext);
222 D.SetIdentifier(PP.getIdentifierInfo("__builtin_va_list"),SourceLocation());
223 Actions.ParseDeclarator(SourceLocation(), CurScope, D, 0);
224 }
225
226
Chris Lattner0bb5f832006-07-31 01:59:18 +0000227 if (Tok.getKind() == tok::eof) // Empty source file is an extension.
228 Diag(diag::ext_empty_source_file);
229
230 while (Tok.getKind() != tok::eof)
231 ParseExternalDeclaration();
Chris Lattnere4e38592006-08-14 00:15:05 +0000232
233 ExitScope();
234 assert(CurScope == 0 && "Scope imbalance!");
Chris Lattner0bb5f832006-07-31 01:59:18 +0000235}
236
237/// ParseExternalDeclaration:
Chris Lattner70f32b72006-07-31 05:09:04 +0000238/// external-declaration: [C99 6.9]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000239/// function-definition [TODO]
240/// declaration [TODO]
241/// [EXT] ';'
Chris Lattner6d7e6342006-08-15 03:41:14 +0000242/// [GNU] asm-definition
Chris Lattner0bb5f832006-07-31 01:59:18 +0000243/// [GNU] __extension__ external-declaration [TODO]
244/// [OBJC] objc-class-definition [TODO]
245/// [OBJC] objc-class-declaration [TODO]
246/// [OBJC] objc-alias-declaration [TODO]
247/// [OBJC] objc-protocol-definition [TODO]
248/// [OBJC] objc-method-definition [TODO]
249/// [OBJC] @end [TODO]
250///
Chris Lattner6d7e6342006-08-15 03:41:14 +0000251/// [GNU] asm-definition:
252/// simple-asm-expr ';'
253///
Chris Lattner0bb5f832006-07-31 01:59:18 +0000254void Parser::ParseExternalDeclaration() {
255 switch (Tok.getKind()) {
256 case tok::semi:
257 Diag(diag::ext_top_level_semi);
258 ConsumeToken();
259 break;
Chris Lattner6d7e6342006-08-15 03:41:14 +0000260 case tok::kw_asm:
261 ParseSimpleAsm();
262 ExpectAndConsume(tok::semi, diag::err_expected_semi_after,
263 "top-level asm block");
264 break;
Chris Lattner0bb5f832006-07-31 01:59:18 +0000265 default:
266 // We can't tell whether this is a function-definition or declaration yet.
267 ParseDeclarationOrFunctionDefinition();
268 break;
269 }
270}
271
272/// ParseDeclarationOrFunctionDefinition - Parse either a function-definition or
Chris Lattner70f32b72006-07-31 05:09:04 +0000273/// a declaration. We can't tell which we have until we read up to the
274/// compound-statement in function-definition.
Chris Lattner0bb5f832006-07-31 01:59:18 +0000275///
Chris Lattner70f32b72006-07-31 05:09:04 +0000276/// function-definition: [C99 6.9.1]
277/// declaration-specifiers[opt] declarator declaration-list[opt]
278/// compound-statement [TODO]
279/// declaration: [C99 6.7]
Chris Lattner0bb5f832006-07-31 01:59:18 +0000280/// declaration-specifiers init-declarator-list[opt] ';' [TODO]
Chris Lattnerd9c3c592006-08-05 06:26:47 +0000281/// [!C99] init-declarator-list ';' [TODO]
Chris Lattner70f32b72006-07-31 05:09:04 +0000282/// [OMP] threadprivate-directive [TODO]
283///
Chris Lattner0bb5f832006-07-31 01:59:18 +0000284void Parser::ParseDeclarationOrFunctionDefinition() {
Chris Lattner70f32b72006-07-31 05:09:04 +0000285 // Parse the common declaration-specifiers piece.
Chris Lattnerb9093cd2006-08-04 04:39:53 +0000286 DeclSpec DS;
287 ParseDeclarationSpecifiers(DS);
Chris Lattnerd2864882006-08-05 08:09:44 +0000288
289 // C99 6.7.2.3p6: Handle "struct-or-union identifier;", "enum { X };"
Chris Lattner53361ac2006-08-10 05:19:57 +0000290 // declaration-specifiers init-declarator-list[opt] ';'
Chris Lattner0e894622006-08-13 19:58:17 +0000291 if (Tok.getKind() == tok::semi) {
292 // TODO: emit error on 'int;' or 'const enum foo;'.
293 // if (!DS.isMissingDeclaratorOk()) Diag(...);
294
295 ConsumeToken();
296 return;
297 }
Chris Lattner70f32b72006-07-31 05:09:04 +0000298
Chris Lattnerfff824f2006-08-07 06:31:38 +0000299 // Parse the first declarator.
300 Declarator DeclaratorInfo(DS, Declarator::FileContext);
301 ParseDeclarator(DeclaratorInfo);
302 // Error parsing the declarator?
303 if (DeclaratorInfo.getIdentifier() == 0) {
304 // If so, skip until the semi-colon or a }.
305 SkipUntil(tok::r_brace, true);
306 if (Tok.getKind() == tok::semi)
307 ConsumeToken();
308 return;
309 }
Chris Lattner70f32b72006-07-31 05:09:04 +0000310
Chris Lattnerfff824f2006-08-07 06:31:38 +0000311 // If the declarator is the start of a function definition, handle it.
312 if (Tok.getKind() == tok::equal || // int X()= -> not a function def
313 Tok.getKind() == tok::comma || // int X(), -> not a function def
314 Tok.getKind() == tok::semi || // int X(); -> not a function def
315 Tok.getKind() == tok::kw_asm || // int X() __asm__ -> not a fn def
316 Tok.getKind() == tok::kw___attribute) {// int X() __attr__ -> not a fn def
317 // FALL THROUGH.
318 } else if (DeclaratorInfo.isInnermostFunctionType() &&
319 (Tok.getKind() == tok::l_brace || // int X() {}
320 isDeclarationSpecifier())) { // int X(f) int f; {}
321 ParseFunctionDefinition(DeclaratorInfo);
322 return;
323 } else {
324 if (DeclaratorInfo.isInnermostFunctionType())
325 Diag(Tok, diag::err_expected_fn_body);
326 else
327 Diag(Tok, diag::err_expected_after_declarator);
Chris Lattnere4e38592006-08-14 00:15:05 +0000328 SkipUntil(tok::semi);
Chris Lattnerfff824f2006-08-07 06:31:38 +0000329 return;
330 }
Chris Lattnerd9c3c592006-08-05 06:26:47 +0000331
Chris Lattner53361ac2006-08-10 05:19:57 +0000332 // Parse the init-declarator-list for a normal declaration.
333 ParseInitDeclaratorListAfterFirstDeclarator(DeclaratorInfo);
Chris Lattner70f32b72006-07-31 05:09:04 +0000334}
335
Chris Lattnerfff824f2006-08-07 06:31:38 +0000336/// ParseFunctionDefinition - We parsed and verified that the specified
337/// Declarator is well formed. If this is a K&R-style function, read the
338/// parameters declaration-list, then start the compound-statement.
339///
340/// declaration-specifiers[opt] declarator declaration-list[opt]
341/// compound-statement [TODO]
342///
343void Parser::ParseFunctionDefinition(Declarator &D) {
344 const DeclaratorTypeInfo &FnTypeInfo = D.getTypeObject(0);
345 assert(FnTypeInfo.Kind == DeclaratorTypeInfo::Function &&
346 "This isn't a function declarator!");
347
348 // If this declaration was formed with a K&R-style identifier list for the
349 // arguments, parse declarations for all of the args next.
350 // int foo(a,b) int a; float b; {}
351 if (!FnTypeInfo.Fun.hasPrototype && !FnTypeInfo.Fun.isEmpty) {
352 // Read all the argument declarations.
Chris Lattner53361ac2006-08-10 05:19:57 +0000353 while (isDeclarationSpecifier())
354 ParseDeclaration(Declarator::KNRTypeListContext);
Chris Lattnerfff824f2006-08-07 06:31:38 +0000355
356 // Note, check that we got them all.
357 } else {
358 //if (isDeclarationSpecifier())
359 // Diag('k&r declspecs with prototype?');
360
Chris Lattner8693a512006-08-13 21:54:02 +0000361 // TODO: Install the arguments into the current scope.
Chris Lattnerfff824f2006-08-07 06:31:38 +0000362 }
363
Chris Lattner0ccd51e2006-08-09 05:47:47 +0000364 // We should have an opening brace now.
365 if (Tok.getKind() != tok::l_brace) {
366 Diag(Tok, diag::err_expected_fn_body);
367
368 // Skip over garbage, until we get to '{'. Don't eat the '{'.
369 SkipUntil(tok::l_brace, true, true);
370
371 // If we didn't find the '{', bail out.
372 if (Tok.getKind() != tok::l_brace)
373 return;
374 }
Chris Lattnerfff824f2006-08-07 06:31:38 +0000375
Chris Lattner0ccd51e2006-08-09 05:47:47 +0000376 ParseCompoundStatement();
Chris Lattnerfff824f2006-08-07 06:31:38 +0000377}
378
Chris Lattner6d7e6342006-08-15 03:41:14 +0000379/// ParseSimpleAsm
380///
381/// [GNU] simple-asm-expr:
382/// 'asm' '(' asm-string-literal ')'
383/// [GNU] asm-string-literal:
384/// string-literal
385///
386void Parser::ParseSimpleAsm() {
387 assert(Tok.getKind() == tok::kw_asm && "Not an asm!");
388 ConsumeToken();
389
390 if (Tok.getKind() != tok::l_paren) {
391 Diag(Tok, diag::err_expected_lparen_after, "asm");
392 return;
393 }
394
395 SourceLocation Loc = Tok.getLocation();
396 ConsumeParen();
397
398 if (Tok.getKind() != tok::string_literal) {
399 Diag(Tok, diag::err_expected_string_literal);
400 SkipUntil(tok::r_paren);
401 return;
402 }
403
404 ExprResult Res = ParseStringLiteralExpression();
405 if (Res.isInvalid) {
406 Diag(Tok, diag::err_expected_string_literal);
407 SkipUntil(tok::r_paren);
408 return;
409 }
410
411 // TODO: Diagnose: wide string literal in 'asm'
412
Chris Lattner04f80192006-08-15 04:55:54 +0000413 MatchRHSPunctuation(tok::r_paren, Loc);
Chris Lattner6d7e6342006-08-15 03:41:14 +0000414}