blob: 8f400b370776541da8775f65211a7eb6079ee266 [file] [log] [blame]
Chris Lattner7ad0fbe2006-11-05 07:46:30 +00001//===--- ParseExpr.cpp - Expression Parsing -------------------------------===//
Chris Lattnerc951dae2006-08-10 04:23:57 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Chris Lattnercde626a2006-08-12 08:13:25 +000010// This file implements the Expression parsing implementation. Expressions in
11// C99 basically consist of a bunch of binary operators with unary operators and
12// other random stuff at the leaves.
13//
14// In the C99 grammar, these unary operators bind tightest and are represented
15// as the 'cast-expression' production. Everything else is either a binary
Chris Lattnerb7f1fc92006-08-12 16:45:01 +000016// operator (e.g. '/') or a ternary operator ("?:"). The unary leaves are
Chris Lattnercde626a2006-08-12 08:13:25 +000017// handled by ParseCastExpression, the higher level pieces are handled by
18// ParseBinaryExpression.
Chris Lattnerc951dae2006-08-10 04:23:57 +000019//
20//===----------------------------------------------------------------------===//
21
22#include "clang/Parse/Parser.h"
23#include "clang/Basic/Diagnostic.h"
Chris Lattner02dffbd2006-10-14 07:50:21 +000024#include "clang/Basic/TargetInfo.h"
Chris Lattner6d28d9b2006-08-24 03:51:22 +000025#include "llvm/ADT/SmallVector.h"
Chris Lattner834618d2006-11-03 07:48:41 +000026#include "llvm/ADT/SmallString.h"
Chris Lattnerd3e98952006-10-06 05:22:26 +000027#include "llvm/ADT/StringExtras.h"
Chris Lattnerc951dae2006-08-10 04:23:57 +000028using namespace llvm;
29using namespace clang;
30
/// prec - Precedence levels of the binary and ternary operators of the C99
/// grammar.  Each level is named after the C99 grammar production it belongs
/// to.  A numerically smaller level binds more weakly than a larger one.
///
/// The enumerators are listed from weakest to tightest and are numbered
/// implicitly, so every level is exactly one greater than the one before it.
namespace prec {
  enum Level {
    Unknown = 0,     //  0: Not a binary operator.
    Comma,           //  1: ,
    Assignment,      //  2: =, *=, /=, %=, +=, -=, <<=, >>=, &=, ^=, |=
    Conditional,     //  3: ?
    LogicalOr,       //  4: ||
    LogicalAnd,      //  5: &&
    InclusiveOr,     //  6: |
    ExclusiveOr,     //  7: ^
    And,             //  8: &
    Equality,        //  9: ==, !=
    Relational,      // 10: >=, <=, >, <
    Shift,           // 11: <<, >>
    Additive,        // 12: -, +
    Multiplicative   // 13: *, /, %
  };
}
52
53
54/// getBinOpPrecedence - Return the precedence of the specified binary operator
55/// token. This returns:
56///
57static prec::Level getBinOpPrecedence(tok::TokenKind Kind) {
58 switch (Kind) {
59 default: return prec::Unknown;
60 case tok::comma: return prec::Comma;
61 case tok::equal:
62 case tok::starequal:
63 case tok::slashequal:
64 case tok::percentequal:
65 case tok::plusequal:
66 case tok::minusequal:
67 case tok::lesslessequal:
68 case tok::greatergreaterequal:
69 case tok::ampequal:
70 case tok::caretequal:
71 case tok::pipeequal: return prec::Assignment;
72 case tok::question: return prec::Conditional;
73 case tok::pipepipe: return prec::LogicalOr;
74 case tok::ampamp: return prec::LogicalAnd;
75 case tok::pipe: return prec::InclusiveOr;
76 case tok::caret: return prec::ExclusiveOr;
77 case tok::amp: return prec::And;
Chris Lattnercde626a2006-08-12 08:13:25 +000078 case tok::exclaimequal:
79 case tok::equalequal: return prec::Equality;
80 case tok::lessequal:
81 case tok::less:
82 case tok::greaterequal:
83 case tok::greater: return prec::Relational;
84 case tok::lessless:
85 case tok::greatergreater: return prec::Shift;
86 case tok::plus:
87 case tok::minus: return prec::Additive;
88 case tok::percent:
89 case tok::slash:
90 case tok::star: return prec::Multiplicative;
91 }
92}
93
94
Chris Lattnerce7e21d2006-08-12 17:22:40 +000095/// ParseExpression - Simple precedence-based parser for binary/ternary
Chris Lattnercde626a2006-08-12 08:13:25 +000096/// operators.
97///
Chris Lattnerb7f1fc92006-08-12 16:45:01 +000098/// Note: we diverge from the C99 grammar when parsing the assignment-expression
99/// production. C99 specifies that the LHS of an assignment operator should be
100/// parsed as a unary-expression, but consistency dictates that it be a
101/// conditional-expression. In practice, the important thing here is that the
102/// LHS of an assignment has to be an l-value, which productions between
103/// unary-expression and conditional-expression don't produce. Because we want
104/// consistency, we parse the LHS as a conditional-expression, then check for
105/// l-value-ness in semantic analysis stages.
106///
Chris Lattnercde626a2006-08-12 08:13:25 +0000107/// multiplicative-expression: [C99 6.5.5]
108/// cast-expression
109/// multiplicative-expression '*' cast-expression
110/// multiplicative-expression '/' cast-expression
111/// multiplicative-expression '%' cast-expression
112///
113/// additive-expression: [C99 6.5.6]
114/// multiplicative-expression
115/// additive-expression '+' multiplicative-expression
116/// additive-expression '-' multiplicative-expression
117///
118/// shift-expression: [C99 6.5.7]
119/// additive-expression
120/// shift-expression '<<' additive-expression
121/// shift-expression '>>' additive-expression
122///
123/// relational-expression: [C99 6.5.8]
124/// shift-expression
125/// relational-expression '<' shift-expression
126/// relational-expression '>' shift-expression
127/// relational-expression '<=' shift-expression
128/// relational-expression '>=' shift-expression
129///
130/// equality-expression: [C99 6.5.9]
131/// relational-expression
132/// equality-expression '==' relational-expression
133/// equality-expression '!=' relational-expression
134///
135/// AND-expression: [C99 6.5.10]
136/// equality-expression
137/// AND-expression '&' equality-expression
138///
139/// exclusive-OR-expression: [C99 6.5.11]
140/// AND-expression
141/// exclusive-OR-expression '^' AND-expression
142///
143/// inclusive-OR-expression: [C99 6.5.12]
144/// exclusive-OR-expression
145/// inclusive-OR-expression '|' exclusive-OR-expression
146///
147/// logical-AND-expression: [C99 6.5.13]
148/// inclusive-OR-expression
149/// logical-AND-expression '&&' inclusive-OR-expression
150///
151/// logical-OR-expression: [C99 6.5.14]
152/// logical-AND-expression
153/// logical-OR-expression '||' logical-AND-expression
154///
155/// conditional-expression: [C99 6.5.15]
156/// logical-OR-expression
157/// logical-OR-expression '?' expression ':' conditional-expression
158/// [GNU] logical-OR-expression '?' ':' conditional-expression
159///
160/// assignment-expression: [C99 6.5.16]
161/// conditional-expression
162/// unary-expression assignment-operator assignment-expression
163///
164/// assignment-operator: one of
165/// = *= /= %= += -= <<= >>= &= ^= |=
166///
167/// expression: [C99 6.5.17]
168/// assignment-expression
169/// expression ',' assignment-expression
170///
Chris Lattnerd35c34f2006-08-12 17:04:50 +0000171Parser::ExprResult Parser::ParseExpression() {
Chris Lattnercde626a2006-08-12 08:13:25 +0000172 ExprResult LHS = ParseCastExpression(false);
173 if (LHS.isInvalid) return LHS;
174
175 return ParseRHSOfBinaryExpression(LHS, prec::Comma);
176}
177
Chris Lattner0c6c0342006-08-12 18:12:45 +0000178/// ParseAssignmentExpression - Parse an expr that doesn't include commas.
179///
Chris Lattnerce7e21d2006-08-12 17:22:40 +0000180Parser::ExprResult Parser::ParseAssignmentExpression() {
181 ExprResult LHS = ParseCastExpression(false);
182 if (LHS.isInvalid) return LHS;
183
184 return ParseRHSOfBinaryExpression(LHS, prec::Assignment);
185}
186
Chris Lattner3b561a32006-08-13 00:12:11 +0000187Parser::ExprResult Parser::ParseConstantExpression() {
188 ExprResult LHS = ParseCastExpression(false);
189 if (LHS.isInvalid) return LHS;
190
191 // TODO: Validate that this is a constant expr!
192 return ParseRHSOfBinaryExpression(LHS, prec::Conditional);
193}
194
Chris Lattner0c6c0342006-08-12 18:12:45 +0000195/// ParseExpressionWithLeadingIdentifier - This special purpose method is used
196/// in contexts where we have already consumed an identifier (which we saved in
197/// 'Tok'), then discovered that the identifier was really the leading token of
198/// part of an expression. For example, in "A[1]+B", we consumed "A" (which is
199/// now in 'Tok') and the current token is "[".
200Parser::ExprResult Parser::
201ParseExpressionWithLeadingIdentifier(const LexerToken &Tok) {
202 // We know that 'Tok' must correspond to this production:
203 // primary-expression: identifier
204
Chris Lattnereb2feef2006-11-04 19:14:32 +0000205 // Let the actions module handle the identifier.
206 ExprResult Res = Actions.ParseSimplePrimaryExpr(Tok.getLocation(),
207 Tok.getKind());
Chris Lattner0c6c0342006-08-12 18:12:45 +0000208
209 // Because we have to parse an entire cast-expression before starting the
210 // ParseRHSOfBinaryExpression method (which parses any trailing binops), we
211 // need to handle the 'postfix-expression' rules. We do this by invoking
212 // ParsePostfixExpressionSuffix to consume any postfix-expression suffixes:
213 Res = ParsePostfixExpressionSuffix(Res);
214 if (Res.isInvalid) return Res;
215
216 // At this point, the "A[1]" part of "A[1]+B" has been consumed. Once this is
217 // done, we know we don't have to do anything for cast-expression, because the
218 // only non-postfix-expression production starts with a '(' token, and we know
219 // we have an identifier. As such, we can invoke ParseRHSOfBinaryExpression
220 // to consume any trailing operators (e.g. "+" in this example) and connected
221 // chunks of the expression.
222 return ParseRHSOfBinaryExpression(Res, prec::Comma);
223}
224
Chris Lattner8693a512006-08-13 21:54:02 +0000225/// ParseExpressionWithLeadingIdentifier - This special purpose method is used
226/// in contexts where we have already consumed an identifier (which we saved in
227/// 'Tok'), then discovered that the identifier was really the leading token of
228/// part of an assignment-expression. For example, in "A[1]+B", we consumed "A"
229/// (which is now in 'Tok') and the current token is "[".
230Parser::ExprResult Parser::
231ParseAssignmentExprWithLeadingIdentifier(const LexerToken &Tok) {
232 // We know that 'Tok' must correspond to this production:
233 // primary-expression: identifier
234
Chris Lattnereb2feef2006-11-04 19:14:32 +0000235 // Let the actions module handle the identifier.
236 ExprResult Res = Actions.ParseSimplePrimaryExpr(Tok.getLocation(),
237 Tok.getKind());
Chris Lattner8693a512006-08-13 21:54:02 +0000238
239 // Because we have to parse an entire cast-expression before starting the
240 // ParseRHSOfBinaryExpression method (which parses any trailing binops), we
241 // need to handle the 'postfix-expression' rules. We do this by invoking
242 // ParsePostfixExpressionSuffix to consume any postfix-expression suffixes:
243 Res = ParsePostfixExpressionSuffix(Res);
244 if (Res.isInvalid) return Res;
245
246 // At this point, the "A[1]" part of "A[1]+B" has been consumed. Once this is
247 // done, we know we don't have to do anything for cast-expression, because the
248 // only non-postfix-expression production starts with a '(' token, and we know
249 // we have an identifier. As such, we can invoke ParseRHSOfBinaryExpression
250 // to consume any trailing operators (e.g. "+" in this example) and connected
251 // chunks of the expression.
252 return ParseRHSOfBinaryExpression(Res, prec::Assignment);
253}
254
255
Chris Lattner62591722006-08-12 18:40:58 +0000256/// ParseAssignmentExpressionWithLeadingStar - This special purpose method is
257/// used in contexts where we have already consumed a '*' (which we saved in
258/// 'Tok'), then discovered that the '*' was really the leading token of an
259/// expression. For example, in "*(int*)P+B", we consumed "*" (which is
260/// now in 'Tok') and the current token is "(".
261Parser::ExprResult Parser::
262ParseAssignmentExpressionWithLeadingStar(const LexerToken &Tok) {
263 // We know that 'Tok' must correspond to this production:
264 // unary-expression: unary-operator cast-expression
265 // where 'unary-operator' is '*'.
266
267 // Parse the cast-expression that follows the '*'. This will parse the
268 // "*(int*)P" part of "*(int*)P+B".
269 ExprResult Res = ParseCastExpression(false);
270 if (Res.isInvalid) return Res;
271
272 // TODO: Combine Tok + Res to get the new AST.
273
274 // We have to parse an entire cast-expression before starting the
275 // ParseRHSOfBinaryExpression method (which parses any trailing binops). Since
276 // we know that the only production above us is the cast-expression
277 // production, and because the only alternative productions start with a '('
278 // token (we know we had a '*'), there is no work to do to get a whole
279 // cast-expression.
280
281 // At this point, the "*(int*)P" part of "*(int*)P+B" has been consumed. Once
282 // this is done, we can invoke ParseRHSOfBinaryExpression to consume any
283 // trailing operators (e.g. "+" in this example) and connected chunks of the
284 // assignment-expression.
285 return ParseRHSOfBinaryExpression(Res, prec::Assignment);
286}
287
288
Chris Lattnercde626a2006-08-12 08:13:25 +0000289/// ParseRHSOfBinaryExpression - Parse a binary expression that starts with
290/// LHS and has a precedence of at least MinPrec.
291Parser::ExprResult
292Parser::ParseRHSOfBinaryExpression(ExprResult LHS, unsigned MinPrec) {
293 unsigned NextTokPrec = getBinOpPrecedence(Tok.getKind());
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000294 SourceLocation ColonLoc;
295
Chris Lattnercde626a2006-08-12 08:13:25 +0000296 while (1) {
297 // If this token has a lower precedence than we are allowed to parse (e.g.
298 // because we are called recursively, or because the token is not a binop),
299 // then we are done!
300 if (NextTokPrec < MinPrec)
301 return LHS;
302
303 // Consume the operator, saving the operator token for error reporting.
304 LexerToken OpToken = Tok;
305 ConsumeToken();
306
Chris Lattner96c3deb2006-08-12 17:13:08 +0000307 // Special case handling for the ternary operator.
Chris Lattnerb5600a62006-10-06 05:40:05 +0000308 ExprResult TernaryMiddle(true);
Chris Lattner96c3deb2006-08-12 17:13:08 +0000309 if (NextTokPrec == prec::Conditional) {
310 if (Tok.getKind() != tok::colon) {
311 // Handle this production specially:
312 // logical-OR-expression '?' expression ':' conditional-expression
313 // In particular, the RHS of the '?' is 'expression', not
314 // 'logical-OR-expression' as we might expect.
315 TernaryMiddle = ParseExpression();
316 if (TernaryMiddle.isInvalid) return TernaryMiddle;
317 } else {
318 // Special case handling of "X ? Y : Z" where Y is empty:
319 // logical-OR-expression '?' ':' conditional-expression [GNU]
320 TernaryMiddle = ExprResult(false);
321 Diag(Tok, diag::ext_gnu_conditional_expr);
322 }
323
324 if (Tok.getKind() != tok::colon) {
325 Diag(Tok, diag::err_expected_colon);
326 Diag(OpToken, diag::err_matching, "?");
327 return ExprResult(true);
328 }
329
330 // Eat the colon.
Chris Lattneraf635312006-10-16 06:06:51 +0000331 ColonLoc = ConsumeToken();
Chris Lattnercde626a2006-08-12 08:13:25 +0000332 }
Chris Lattner96c3deb2006-08-12 17:13:08 +0000333
334 // Parse another leaf here for the RHS of the operator.
335 ExprResult RHS = ParseCastExpression(false);
336 if (RHS.isInvalid) return RHS;
Chris Lattnercde626a2006-08-12 08:13:25 +0000337
338 // Remember the precedence of this operator and get the precedence of the
339 // operator immediately to the right of the RHS.
340 unsigned ThisPrec = NextTokPrec;
341 NextTokPrec = getBinOpPrecedence(Tok.getKind());
Chris Lattner89d53752006-08-12 17:18:19 +0000342
343 // Assignment and conditional expressions are right-associative.
344 bool isRightAssoc = NextTokPrec == prec::Conditional ||
345 NextTokPrec == prec::Assignment;
Chris Lattnercde626a2006-08-12 08:13:25 +0000346
347 // Get the precedence of the operator to the right of the RHS. If it binds
348 // more tightly with RHS than we do, evaluate it completely first.
Chris Lattnercde626a2006-08-12 08:13:25 +0000349 if (ThisPrec < NextTokPrec ||
350 (ThisPrec == NextTokPrec && isRightAssoc)) {
Chris Lattner89d53752006-08-12 17:18:19 +0000351 // If this is left-associative, only parse things on the RHS that bind
352 // more tightly than the current operator. If it is left-associative, it
353 // is okay, to bind exactly as tightly. For example, compile A=B=C=D as
354 // A=(B=(C=D)), where each paren is a level of recursion here.
355 RHS = ParseRHSOfBinaryExpression(RHS, ThisPrec + !isRightAssoc);
Chris Lattnercde626a2006-08-12 08:13:25 +0000356 if (RHS.isInvalid) return RHS;
357
358 NextTokPrec = getBinOpPrecedence(Tok.getKind());
359 }
360 assert(NextTokPrec <= ThisPrec && "Recursion didn't work!");
361
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000362 // Combine the LHS and RHS into the LHS (e.g. build AST).
Chris Lattnerb5600a62006-10-06 05:40:05 +0000363 if (TernaryMiddle.isInvalid)
Chris Lattnerae319692006-10-25 03:49:28 +0000364 LHS = Actions.ParseBinOp(OpToken.getLocation(), OpToken.getKind(),
365 LHS.Val, RHS.Val);
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000366 else
367 LHS = Actions.ParseConditionalOp(OpToken.getLocation(), ColonLoc,
368 LHS.Val, TernaryMiddle.Val, RHS.Val);
Chris Lattnercde626a2006-08-12 08:13:25 +0000369 }
370}
371
Chris Lattnereaf06592006-08-11 02:02:23 +0000372/// ParseCastExpression - Parse a cast-expression, or, if isUnaryExpression is
373/// true, parse a unary-expression.
374///
Chris Lattner4564bc12006-08-10 23:14:52 +0000375/// cast-expression: [C99 6.5.4]
376/// unary-expression
377/// '(' type-name ')' cast-expression
Chris Lattner81b576e2006-08-11 02:13:20 +0000378///
Chris Lattnerc2dd85a2006-08-10 22:57:16 +0000379/// unary-expression: [C99 6.5.3]
380/// postfix-expression
381/// '++' unary-expression
382/// '--' unary-expression
383/// unary-operator cast-expression
384/// 'sizeof' unary-expression
385/// 'sizeof' '(' type-name ')'
386/// [GNU] '__alignof' unary-expression
387/// [GNU] '__alignof' '(' type-name ')'
388/// [GNU] '&&' identifier
Chris Lattner81b576e2006-08-11 02:13:20 +0000389///
Chris Lattnerc2dd85a2006-08-10 22:57:16 +0000390/// unary-operator: one of
391/// '&' '*' '+' '-' '~' '!'
392/// [GNU] '__extension__' '__real' '__imag'
393///
Chris Lattner52a99e52006-08-10 20:56:00 +0000394/// primary-expression: [C99 6.5.1]
Chris Lattnerc5e0d4a2006-08-10 19:06:03 +0000395/// identifier
396/// constant
397/// string-literal
398/// '(' expression ')'
Chris Lattner52a99e52006-08-10 20:56:00 +0000399/// '__func__' [C99 6.4.2.2]
400/// [GNU] '__FUNCTION__'
401/// [GNU] '__PRETTY_FUNCTION__'
402/// [GNU] '(' compound-statement ')'
403/// [GNU] '__builtin_va_arg' '(' assignment-expression ',' type-name ')'
404/// [GNU] '__builtin_offsetof' '(' type-name ',' offsetof-member-designator')'
405/// [GNU] '__builtin_choose_expr' '(' assign-expr ',' assign-expr ','
406/// assign-expr ')'
407/// [GNU] '__builtin_types_compatible_p' '(' type-name ',' type-name ')'
408/// [OBC] '[' objc-receiver objc-message-args ']' [TODO]
409/// [OBC] '@selector' '(' objc-selector-arg ')' [TODO]
410/// [OBC] '@protocol' '(' identifier ')' [TODO]
411/// [OBC] '@encode' '(' type-name ')' [TODO]
412/// [OBC] objc-string-literal [TODO]
413///
414/// constant: [C99 6.4.4]
415/// integer-constant
416/// floating-constant
417/// enumeration-constant -> identifier
418/// character-constant
Chris Lattner52a99e52006-08-10 20:56:00 +0000419///
Chris Lattner89c50c62006-08-11 06:41:18 +0000420Parser::ExprResult Parser::ParseCastExpression(bool isUnaryExpression) {
421 ExprResult Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000422 tok::TokenKind SavedKind = Tok.getKind();
Chris Lattner89c50c62006-08-11 06:41:18 +0000423
Chris Lattner81b576e2006-08-11 02:13:20 +0000424 // This handles all of cast-expression, unary-expression, postfix-expression,
425 // and primary-expression. We handle them together like this for efficiency
426 // and to simplify handling of an expression starting with a '(' token: which
427 // may be one of a parenthesized expression, cast-expression, compound literal
428 // expression, or statement expression.
429 //
430 // If the parsed tokens consist of a primary-expression, the cases below
Chris Lattner20c6a452006-08-12 17:40:43 +0000431 // call ParsePostfixExpressionSuffix to handle the postfix expression
432 // suffixes. Cases that cannot be followed by postfix exprs should
433 // return without invoking ParsePostfixExpressionSuffix.
Chris Lattnerae319692006-10-25 03:49:28 +0000434 switch (SavedKind) {
Chris Lattnere550a4e2006-08-24 06:37:51 +0000435 case tok::l_paren: {
Chris Lattner81b576e2006-08-11 02:13:20 +0000436 // If this expression is limited to being a unary-expression, the parent can
437 // not start a cast expression.
438 ParenParseOption ParenExprType =
439 isUnaryExpression ? CompoundLiteral : CastExpr;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000440 TypeTy *CastTy;
441 SourceLocation LParenLoc = Tok.getLocation();
442 SourceLocation RParenLoc;
443 Res = ParseParenExpression(ParenExprType, CastTy, RParenLoc);
Chris Lattner89c50c62006-08-11 06:41:18 +0000444 if (Res.isInvalid) return Res;
445
Chris Lattner81b576e2006-08-11 02:13:20 +0000446 switch (ParenExprType) {
447 case SimpleExpr: break; // Nothing else to do.
448 case CompoundStmt: break; // Nothing else to do.
449 case CompoundLiteral:
450 // We parsed '(' type-name ')' '{' ... '}'. If any suffixes of
451 // postfix-expression exist, parse them now.
452 break;
453 case CastExpr:
454 // We parsed '(' type-name ')' and the thing after it wasn't a '{'. Parse
455 // the cast-expression that follows it next.
Chris Lattnere550a4e2006-08-24 06:37:51 +0000456 // TODO: For cast expression with CastTy.
457 Res = ParseCastExpression(false);
458 if (!Res.isInvalid)
459 Res = Actions.ParseCastExpr(LParenLoc, CastTy, RParenLoc, Res.Val);
460 return Res;
Chris Lattner81b576e2006-08-11 02:13:20 +0000461 }
Chris Lattner20c6a452006-08-12 17:40:43 +0000462
463 // These can be followed by postfix-expr pieces.
464 return ParsePostfixExpressionSuffix(Res);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000465 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000466
Chris Lattner52a99e52006-08-10 20:56:00 +0000467 // primary-expression
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000468 case tok::numeric_constant:
469 // constant: integer-constant
470 // constant: floating-constant
471
472 // TODO: Validate whether this is an integer or floating-constant or
473 // neither.
474 if (1) {
Chris Lattnerae319692006-10-25 03:49:28 +0000475 Res = Actions.ParseIntegerConstant(Tok.getLocation());
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000476 } else {
Chris Lattnerae319692006-10-25 03:49:28 +0000477 Res = Actions.ParseFloatingConstant(Tok.getLocation());
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000478 }
479 ConsumeToken();
480
481 // These can be followed by postfix-expr pieces.
482 return ParsePostfixExpressionSuffix(Res);
483
Chris Lattner52a99e52006-08-10 20:56:00 +0000484 case tok::identifier: // primary-expression: identifier
485 // constant: enumeration-constant
Chris Lattner52a99e52006-08-10 20:56:00 +0000486 case tok::char_constant: // constant: character-constant
487 case tok::kw___func__: // primary-expression: __func__ [C99 6.4.2.2]
488 case tok::kw___FUNCTION__: // primary-expression: __FUNCTION__ [GNU]
489 case tok::kw___PRETTY_FUNCTION__: // primary-expression: __P..Y_F..N__ [GNU]
Chris Lattnerae319692006-10-25 03:49:28 +0000490 Res = Actions.ParseSimplePrimaryExpr(Tok.getLocation(), SavedKind);
Chris Lattner52a99e52006-08-10 20:56:00 +0000491 ConsumeToken();
Chris Lattner20c6a452006-08-12 17:40:43 +0000492 // These can be followed by postfix-expr pieces.
493 return ParsePostfixExpressionSuffix(Res);
Chris Lattner52a99e52006-08-10 20:56:00 +0000494 case tok::string_literal: // primary-expression: string-literal
Chris Lattnerd3e98952006-10-06 05:22:26 +0000495 case tok::wide_string_literal:
Chris Lattner89c50c62006-08-11 06:41:18 +0000496 Res = ParseStringLiteralExpression();
497 if (Res.isInvalid) return Res;
Chris Lattner20c6a452006-08-12 17:40:43 +0000498 // This can be followed by postfix-expr pieces (e.g. "foo"[1]).
499 return ParsePostfixExpressionSuffix(Res);
Chris Lattnerf8339772006-08-10 22:01:51 +0000500 case tok::kw___builtin_va_arg:
501 case tok::kw___builtin_offsetof:
502 case tok::kw___builtin_choose_expr:
503 case tok::kw___builtin_types_compatible_p:
Chris Lattner11124352006-08-12 19:16:08 +0000504 return ParseBuiltinPrimaryExpression();
Chris Lattner81b576e2006-08-11 02:13:20 +0000505 case tok::plusplus: // unary-expression: '++' unary-expression
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000506 case tok::minusminus: { // unary-expression: '--' unary-expression
507 SourceLocation SavedLoc = ConsumeToken();
Chris Lattner1b926492006-08-23 06:42:10 +0000508 Res = ParseCastExpression(true);
509 if (!Res.isInvalid)
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000510 Res = Actions.ParseUnaryOp(SavedLoc, SavedKind, Res.Val);
Chris Lattner1b926492006-08-23 06:42:10 +0000511 return Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000512 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000513 case tok::amp: // unary-expression: '&' cast-expression
514 case tok::star: // unary-expression: '*' cast-expression
515 case tok::plus: // unary-expression: '+' cast-expression
516 case tok::minus: // unary-expression: '-' cast-expression
517 case tok::tilde: // unary-expression: '~' cast-expression
518 case tok::exclaim: // unary-expression: '!' cast-expression
519 case tok::kw___real: // unary-expression: '__real' cast-expression [GNU]
Chris Lattner1b926492006-08-23 06:42:10 +0000520 case tok::kw___imag: // unary-expression: '__imag' cast-expression [GNU]
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000521 case tok::kw___extension__:{//unary-expression:'__extension__' cast-expr [GNU]
Chris Lattner4daa0772006-10-20 05:03:44 +0000522 // FIXME: Extension not handled correctly here!
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000523 SourceLocation SavedLoc = ConsumeToken();
Chris Lattner1b926492006-08-23 06:42:10 +0000524 Res = ParseCastExpression(false);
525 if (!Res.isInvalid)
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000526 Res = Actions.ParseUnaryOp(SavedLoc, SavedKind, Res.Val);
Chris Lattner1b926492006-08-23 06:42:10 +0000527 return Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000528 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000529 case tok::kw_sizeof: // unary-expression: 'sizeof' unary-expression
530 // unary-expression: 'sizeof' '(' type-name ')'
531 case tok::kw___alignof: // unary-expression: '__alignof' unary-expression
532 // unary-expression: '__alignof' '(' type-name ')'
Chris Lattner89c50c62006-08-11 06:41:18 +0000533 return ParseSizeofAlignofExpression();
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000534 case tok::ampamp: { // unary-expression: '&&' identifier
Chris Lattner81b576e2006-08-11 02:13:20 +0000535 Diag(Tok, diag::ext_gnu_address_of_label);
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000536 SourceLocation SavedLoc = ConsumeToken();
Chris Lattner14a1b642006-10-15 22:33:58 +0000537
538 if (Tok.getKind() != tok::identifier) {
Chris Lattner81b576e2006-08-11 02:13:20 +0000539 Diag(Tok, diag::err_expected_ident);
Chris Lattner89c50c62006-08-11 06:41:18 +0000540 return ExprResult(true);
Chris Lattner81b576e2006-08-11 02:13:20 +0000541 }
Chris Lattner14a1b642006-10-15 22:33:58 +0000542 // FIXME: Create a label ref for Tok.Ident.
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000543 Res = Actions.ParseUnaryOp(SavedLoc, SavedKind, 0);
Chris Lattner14a1b642006-10-15 22:33:58 +0000544 ConsumeToken();
545
546 return Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000547 }
Chris Lattner52a99e52006-08-10 20:56:00 +0000548 default:
549 Diag(Tok, diag::err_expected_expression);
Chris Lattner89c50c62006-08-11 06:41:18 +0000550 return ExprResult(true);
Chris Lattnerf8339772006-08-10 22:01:51 +0000551 }
552
Chris Lattner20c6a452006-08-12 17:40:43 +0000553 // unreachable.
554 abort();
555}
556
557/// ParsePostfixExpressionSuffix - Once the leading part of a postfix-expression
558/// is parsed, this method parses any suffixes that apply.
559///
560/// postfix-expression: [C99 6.5.2]
561/// primary-expression
562/// postfix-expression '[' expression ']'
563/// postfix-expression '(' argument-expression-list[opt] ')'
564/// postfix-expression '.' identifier
565/// postfix-expression '->' identifier
566/// postfix-expression '++'
567/// postfix-expression '--'
568/// '(' type-name ')' '{' initializer-list '}'
569/// '(' type-name ')' '{' initializer-list ',' '}'
570///
571/// argument-expression-list: [C99 6.5.2]
572/// argument-expression
573/// argument-expression-list ',' assignment-expression
574///
575Parser::ExprResult Parser::ParsePostfixExpressionSuffix(ExprResult LHS) {
Chris Lattner20c6a452006-08-12 17:40:43 +0000576
Chris Lattnerf8339772006-08-10 22:01:51 +0000577 // Now that the primary-expression piece of the postfix-expression has been
578 // parsed, see if there are any postfix-expression pieces here.
579 SourceLocation Loc;
580 while (1) {
581 switch (Tok.getKind()) {
Chris Lattner20c6a452006-08-12 17:40:43 +0000582 default: // Not a postfix-expression suffix.
583 return LHS;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000584 case tok::l_square: { // postfix-expression: p-e '[' expression ']'
Chris Lattner04132372006-10-16 06:12:55 +0000585 Loc = ConsumeBracket();
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000586 ExprResult Idx = ParseExpression();
587
588 SourceLocation RLoc = Tok.getLocation();
589
590 if (!LHS.isInvalid && !Idx.isInvalid && Tok.getKind() == tok::r_square)
591 LHS = Actions.ParseArraySubscriptExpr(LHS.Val, Loc, Idx.Val, RLoc);
592 else
593 LHS = ExprResult(true);
594
Chris Lattner89c50c62006-08-11 06:41:18 +0000595 // Match the ']'.
Chris Lattner04f80192006-08-15 04:55:54 +0000596 MatchRHSPunctuation(tok::r_square, Loc);
Chris Lattner89c50c62006-08-11 06:41:18 +0000597 break;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000598 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000599
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000600 case tok::l_paren: { // p-e: p-e '(' argument-expression-list[opt] ')'
601 SmallVector<ExprTy*, 8> ArgExprs;
602 SmallVector<SourceLocation, 8> CommaLocs;
603 bool ArgExprsOk = true;
604
Chris Lattner04132372006-10-16 06:12:55 +0000605 Loc = ConsumeParen();
Chris Lattner89c50c62006-08-11 06:41:18 +0000606
Chris Lattner0c6c0342006-08-12 18:12:45 +0000607 if (Tok.getKind() != tok::r_paren) {
608 while (1) {
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000609 ExprResult ArgExpr = ParseAssignmentExpression();
610 if (ArgExpr.isInvalid)
611 ArgExprsOk = false;
612 else
613 ArgExprs.push_back(ArgExpr.Val);
614
Chris Lattner0c6c0342006-08-12 18:12:45 +0000615 if (Tok.getKind() != tok::comma)
616 break;
Chris Lattneraf635312006-10-16 06:06:51 +0000617 // Move to the next argument, remember where the comma was.
618 CommaLocs.push_back(ConsumeToken());
Chris Lattner0c6c0342006-08-12 18:12:45 +0000619 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000620 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000621
Chris Lattner89c50c62006-08-11 06:41:18 +0000622 // Match the ')'.
Chris Lattnere165d942006-08-24 04:40:38 +0000623 if (!LHS.isInvalid && ArgExprsOk && Tok.getKind() == tok::r_paren) {
624 assert((ArgExprs.size() == 0 || ArgExprs.size()-1 == CommaLocs.size())&&
625 "Unexpected number of commas!");
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000626 LHS = Actions.ParseCallExpr(LHS.Val, Loc, &ArgExprs[0], ArgExprs.size(),
Chris Lattnere165d942006-08-24 04:40:38 +0000627 &CommaLocs[0], Tok.getLocation());
628 }
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000629
Chris Lattner04f80192006-08-15 04:55:54 +0000630 MatchRHSPunctuation(tok::r_paren, Loc);
Chris Lattner89c50c62006-08-11 06:41:18 +0000631 break;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000632 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000633 case tok::arrow: // postfix-expression: p-e '->' identifier
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000634 case tok::period: { // postfix-expression: p-e '.' identifier
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000635 tok::TokenKind OpKind = Tok.getKind();
Chris Lattneraf635312006-10-16 06:06:51 +0000636 SourceLocation OpLoc = ConsumeToken(); // Eat the "." or "->" token.
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000637
Chris Lattner89c50c62006-08-11 06:41:18 +0000638 if (Tok.getKind() != tok::identifier) {
639 Diag(Tok, diag::err_expected_ident);
640 return ExprResult(true);
641 }
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000642
643 if (!LHS.isInvalid)
644 LHS = Actions.ParseMemberReferenceExpr(LHS.Val, OpLoc, OpKind,
645 Tok.getLocation(),
646 *Tok.getIdentifierInfo());
Chris Lattner89c50c62006-08-11 06:41:18 +0000647 ConsumeToken();
648 break;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000649 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000650 case tok::plusplus: // postfix-expression: postfix-expression '++'
651 case tok::minusminus: // postfix-expression: postfix-expression '--'
Chris Lattner1b926492006-08-23 06:42:10 +0000652 if (!LHS.isInvalid)
Chris Lattnerae319692006-10-25 03:49:28 +0000653 LHS = Actions.ParsePostfixUnaryOp(Tok.getLocation(), Tok.getKind(),
654 LHS.Val);
Chris Lattner89c50c62006-08-11 06:41:18 +0000655 ConsumeToken();
656 break;
Chris Lattnerf8339772006-08-10 22:01:51 +0000657 }
658 }
Chris Lattner52a99e52006-08-10 20:56:00 +0000659}
660
Chris Lattner20c6a452006-08-12 17:40:43 +0000661
Chris Lattner81b576e2006-08-11 02:13:20 +0000662/// ParseSizeofAlignofExpression - Parse a sizeof or alignof expression.
663/// unary-expression: [C99 6.5.3]
664/// 'sizeof' unary-expression
665/// 'sizeof' '(' type-name ')'
666/// [GNU] '__alignof' unary-expression
667/// [GNU] '__alignof' '(' type-name ')'
Chris Lattner89c50c62006-08-11 06:41:18 +0000668Parser::ExprResult Parser::ParseSizeofAlignofExpression() {
Chris Lattner81b576e2006-08-11 02:13:20 +0000669 assert((Tok.getKind() == tok::kw_sizeof ||
670 Tok.getKind() == tok::kw___alignof) &&
671 "Not a sizeof/alignof expression!");
Chris Lattner26115ac2006-08-24 06:10:04 +0000672 LexerToken OpTok = Tok;
Chris Lattner81b576e2006-08-11 02:13:20 +0000673 ConsumeToken();
674
675 // If the operand doesn't start with an '(', it must be an expression.
Chris Lattner26115ac2006-08-24 06:10:04 +0000676 ExprResult Operand;
677 if (Tok.getKind() != tok::l_paren) {
678 Operand = ParseCastExpression(true);
679 } else {
680 // If it starts with a '(', we know that it is either a parenthesized
681 // type-name, or it is a unary-expression that starts with a compound
682 // literal, or starts with a primary-expression that is a parenthesized
683 // expression.
684 ParenParseOption ExprType = CastExpr;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000685 TypeTy *CastTy;
Chris Lattner26da7302006-08-24 06:49:19 +0000686 SourceLocation LParenLoc = Tok.getLocation(), RParenLoc;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000687 Operand = ParseParenExpression(ExprType, CastTy, RParenLoc);
Chris Lattner26115ac2006-08-24 06:10:04 +0000688
689 // If ParseParenExpression parsed a '(typename)' sequence only, the this is
690 // sizeof/alignof a type. Otherwise, it is sizeof/alignof an expression.
691 if (ExprType == CastExpr) {
Chris Lattner26da7302006-08-24 06:49:19 +0000692 return Actions.ParseSizeOfAlignOfTypeExpr(OpTok.getLocation(),
693 OpTok.getKind() == tok::kw_sizeof,
694 LParenLoc, CastTy, RParenLoc);
Chris Lattner26115ac2006-08-24 06:10:04 +0000695 }
696 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000697
Chris Lattner26115ac2006-08-24 06:10:04 +0000698 // If we get here, the operand to the sizeof/alignof was an expresion.
699 if (!Operand.isInvalid)
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000700 Operand = Actions.ParseUnaryOp(OpTok.getLocation(), OpTok.getKind(),
701 Operand.Val);
Chris Lattner26115ac2006-08-24 06:10:04 +0000702 return Operand;
Chris Lattner81b576e2006-08-11 02:13:20 +0000703}
704
Chris Lattner11124352006-08-12 19:16:08 +0000705/// ParseBuiltinPrimaryExpression
706///
707/// primary-expression: [C99 6.5.1]
708/// [GNU] '__builtin_va_arg' '(' assignment-expression ',' type-name ')'
709/// [GNU] '__builtin_offsetof' '(' type-name ',' offsetof-member-designator')'
710/// [GNU] '__builtin_choose_expr' '(' assign-expr ',' assign-expr ','
711/// assign-expr ')'
712/// [GNU] '__builtin_types_compatible_p' '(' type-name ',' type-name ')'
713///
714/// [GNU] offsetof-member-designator:
715/// [GNU] identifier
716/// [GNU] offsetof-member-designator '.' identifier
717/// [GNU] offsetof-member-designator '[' expression ']'
718///
719Parser::ExprResult Parser::ParseBuiltinPrimaryExpression() {
720 ExprResult Res(false);
Chris Lattner11124352006-08-12 19:16:08 +0000721 const IdentifierInfo *BuiltinII = Tok.getIdentifierInfo();
722
723 tok::TokenKind T = Tok.getKind();
Chris Lattneraf635312006-10-16 06:06:51 +0000724 SourceLocation StartLoc = ConsumeToken(); // Eat the builtin identifier.
Chris Lattner11124352006-08-12 19:16:08 +0000725
726 // All of these start with an open paren.
727 if (Tok.getKind() != tok::l_paren) {
728 Diag(Tok, diag::err_expected_lparen_after, BuiltinII->getName());
729 return ExprResult(true);
730 }
731
Chris Lattner04132372006-10-16 06:12:55 +0000732 SourceLocation LParenLoc = ConsumeParen();
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000733 // TODO: Build AST.
734
Chris Lattner11124352006-08-12 19:16:08 +0000735 switch (T) {
736 default: assert(0 && "Not a builtin primary expression!");
737 case tok::kw___builtin_va_arg:
738 Res = ParseAssignmentExpression();
739 if (Res.isInvalid) {
740 SkipUntil(tok::r_paren);
741 return Res;
742 }
Chris Lattner0be454e2006-08-12 19:30:51 +0000743
Chris Lattner6d7e6342006-08-15 03:41:14 +0000744 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000745 return ExprResult(true);
Chris Lattner0be454e2006-08-12 19:30:51 +0000746
Chris Lattner11124352006-08-12 19:16:08 +0000747 ParseTypeName();
748 break;
749
750 case tok::kw___builtin_offsetof:
751 ParseTypeName();
752
Chris Lattner6d7e6342006-08-15 03:41:14 +0000753 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000754 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000755
756 // We must have at least one identifier here.
Chris Lattner6d7e6342006-08-15 03:41:14 +0000757 if (ExpectAndConsume(tok::identifier, diag::err_expected_ident, "",
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000758 tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000759 return ExprResult(true);
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000760
Chris Lattner11124352006-08-12 19:16:08 +0000761 while (1) {
762 if (Tok.getKind() == tok::period) {
763 // offsetof-member-designator: offsetof-member-designator '.' identifier
764 ConsumeToken();
765
Chris Lattner6d7e6342006-08-15 03:41:14 +0000766 if (ExpectAndConsume(tok::identifier, diag::err_expected_ident, "",
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000767 tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000768 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000769 } else if (Tok.getKind() == tok::l_square) {
770 // offsetof-member-designator: offsetof-member-design '[' expression ']'
Chris Lattner04132372006-10-16 06:12:55 +0000771 SourceLocation LSquareLoc = ConsumeBracket();
Chris Lattner11124352006-08-12 19:16:08 +0000772 Res = ParseExpression();
773 if (Res.isInvalid) {
774 SkipUntil(tok::r_paren);
775 return Res;
776 }
777
Chris Lattner04f80192006-08-15 04:55:54 +0000778 MatchRHSPunctuation(tok::r_square, LSquareLoc);
Chris Lattner11124352006-08-12 19:16:08 +0000779 } else {
780 break;
781 }
782 }
783 break;
784 case tok::kw___builtin_choose_expr:
785 Res = ParseAssignmentExpression();
786
Chris Lattner6d7e6342006-08-15 03:41:14 +0000787 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000788 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000789
790 Res = ParseAssignmentExpression();
791
Chris Lattner6d7e6342006-08-15 03:41:14 +0000792 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000793 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000794
795 Res = ParseAssignmentExpression();
796 break;
797 case tok::kw___builtin_types_compatible_p:
798 ParseTypeName();
799
Chris Lattner6d7e6342006-08-15 03:41:14 +0000800 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000801 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000802
803 ParseTypeName();
804 break;
805 }
806
Chris Lattner04f80192006-08-15 04:55:54 +0000807 MatchRHSPunctuation(tok::r_paren, LParenLoc);
Chris Lattner11124352006-08-12 19:16:08 +0000808
809 // These can be followed by postfix-expr pieces because they are
810 // primary-expressions.
811 return ParsePostfixExpressionSuffix(Res);
812}
813
Chris Lattnerc951dae2006-08-10 04:23:57 +0000814
Chris Lattner4add4e62006-08-11 01:33:00 +0000815/// ParseParenExpression - This parses the unit that starts with a '(' token,
816/// based on what is allowed by ExprType. The actual thing parsed is returned
817/// in ExprType.
818///
819/// primary-expression: [C99 6.5.1]
Chris Lattnerc951dae2006-08-10 04:23:57 +0000820/// '(' expression ')'
Chris Lattnerf8339772006-08-10 22:01:51 +0000821/// [GNU] '(' compound-statement ')' (if !ParenExprOnly)
822/// postfix-expression: [C99 6.5.2]
823/// '(' type-name ')' '{' initializer-list '}'
824/// '(' type-name ')' '{' initializer-list ',' '}'
Chris Lattner4add4e62006-08-11 01:33:00 +0000825/// cast-expression: [C99 6.5.4]
826/// '(' type-name ')' cast-expression
Chris Lattnerf8339772006-08-10 22:01:51 +0000827///
Chris Lattnere550a4e2006-08-24 06:37:51 +0000828Parser::ExprResult Parser::ParseParenExpression(ParenParseOption &ExprType,
829 TypeTy *&CastTy,
830 SourceLocation &RParenLoc) {
Chris Lattnerc951dae2006-08-10 04:23:57 +0000831 assert(Tok.getKind() == tok::l_paren && "Not a paren expr!");
Chris Lattner04132372006-10-16 06:12:55 +0000832 SourceLocation OpenLoc = ConsumeParen();
Chris Lattner89c50c62006-08-11 06:41:18 +0000833 ExprResult Result(false);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000834 CastTy = 0;
Chris Lattnerc951dae2006-08-10 04:23:57 +0000835
Chris Lattner4add4e62006-08-11 01:33:00 +0000836 if (ExprType >= CompoundStmt && Tok.getKind() == tok::l_brace &&
Chris Lattnerf8339772006-08-10 22:01:51 +0000837 !getLang().NoExtensions) {
838 Diag(Tok, diag::ext_gnu_statement_expr);
839 ParseCompoundStatement();
Chris Lattner4add4e62006-08-11 01:33:00 +0000840 ExprType = CompoundStmt;
Chris Lattner1b926492006-08-23 06:42:10 +0000841 // TODO: Build AST for GNU compound stmt.
Chris Lattner4add4e62006-08-11 01:33:00 +0000842 } else if (ExprType >= CompoundLiteral && isTypeSpecifierQualifier()) {
Chris Lattner6c3f05d2006-08-12 16:54:25 +0000843 // Otherwise, this is a compound literal expression or cast expression.
Chris Lattnere550a4e2006-08-24 06:37:51 +0000844 TypeTy *Ty = ParseTypeName();
Chris Lattnerf5fbd792006-08-10 23:56:11 +0000845
846 // Match the ')'.
Chris Lattner04132372006-10-16 06:12:55 +0000847 if (Tok.getKind() == tok::r_paren)
848 RParenLoc = ConsumeParen();
849 else
Chris Lattnere550a4e2006-08-24 06:37:51 +0000850 MatchRHSPunctuation(tok::r_paren, OpenLoc);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000851
Chris Lattner4add4e62006-08-11 01:33:00 +0000852 if (Tok.getKind() == tok::l_brace) {
Chris Lattner6c3f05d2006-08-12 16:54:25 +0000853 if (!getLang().C99) // Compound literals don't exist in C90.
854 Diag(OpenLoc, diag::ext_c99_compound_literal);
Chris Lattner89c50c62006-08-11 06:41:18 +0000855 Result = ParseInitializer();
Chris Lattner4add4e62006-08-11 01:33:00 +0000856 ExprType = CompoundLiteral;
Chris Lattner1b926492006-08-23 06:42:10 +0000857 // TODO: Build AST for compound literal.
Chris Lattner4add4e62006-08-11 01:33:00 +0000858 } else if (ExprType == CastExpr) {
Chris Lattnere550a4e2006-08-24 06:37:51 +0000859 // Note that this doesn't parse the subsequence cast-expression, it just
860 // returns the parsed type to the callee.
Chris Lattner4add4e62006-08-11 01:33:00 +0000861 ExprType = CastExpr;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000862 CastTy = Ty;
863 return ExprResult(false);
Chris Lattner4add4e62006-08-11 01:33:00 +0000864 } else {
Chris Lattnerf5fbd792006-08-10 23:56:11 +0000865 Diag(Tok, diag::err_expected_lbrace_in_compound_literal);
Chris Lattner89c50c62006-08-11 06:41:18 +0000866 return ExprResult(true);
Chris Lattnerf5fbd792006-08-10 23:56:11 +0000867 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000868 return Result;
Chris Lattner4add4e62006-08-11 01:33:00 +0000869 } else {
Chris Lattner89c50c62006-08-11 06:41:18 +0000870 Result = ParseExpression();
Chris Lattner4add4e62006-08-11 01:33:00 +0000871 ExprType = SimpleExpr;
Chris Lattner1b926492006-08-23 06:42:10 +0000872 if (!Result.isInvalid && Tok.getKind() == tok::r_paren)
873 Result = Actions.ParseParenExpr(OpenLoc, Tok.getLocation(), Result.Val);
Chris Lattnerf8339772006-08-10 22:01:51 +0000874 }
Chris Lattnerc951dae2006-08-10 04:23:57 +0000875
Chris Lattner4564bc12006-08-10 23:14:52 +0000876 // Match the ')'.
Chris Lattner89c50c62006-08-11 06:41:18 +0000877 if (Result.isInvalid)
878 SkipUntil(tok::r_paren);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000879 else {
Chris Lattner04132372006-10-16 06:12:55 +0000880 if (Tok.getKind() == tok::r_paren)
881 RParenLoc = ConsumeParen();
882 else
Chris Lattnere550a4e2006-08-24 06:37:51 +0000883 MatchRHSPunctuation(tok::r_paren, OpenLoc);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000884 }
Chris Lattner1b926492006-08-23 06:42:10 +0000885
Chris Lattner89c50c62006-08-11 06:41:18 +0000886 return Result;
Chris Lattnerc951dae2006-08-10 04:23:57 +0000887}
Chris Lattnerd3e98952006-10-06 05:22:26 +0000888
/// HexDigitValue - Convert one hexadecimal digit character ('0'-'9', 'a'-'f'
/// or 'A'-'F') to its numeric value in the range 0-15.  Any other character
/// yields -1.
static int HexDigitValue(char C) {
  int Value = -1;
  if ('0' <= C && C <= '9')
    Value = C - '0';
  else if ('a' <= C && C <= 'f')
    Value = 10 + (C - 'a');
  else if ('A' <= C && C <= 'F')
    Value = 10 + (C - 'A');
  return Value;
}
897
898/// ParseStringLiteralExpression - This handles the various token types that
899/// form string literals, and also handles string concatenation [C99 5.1.1.2,
900/// translation phase #6].
901///
902/// primary-expression: [C99 6.5.1]
903/// string-literal
904Parser::ExprResult Parser::ParseStringLiteralExpression() {
905 assert(isTokenStringLiteral() && "Not a string literal!");
906
907 // String concat. Note that keywords like __func__ and __FUNCTION__ are not
908 // considered to be strings for concatenation purposes.
909 SmallVector<LexerToken, 4> StringToks;
910
911 // While we're looking at all of the string portions, remember the max
912 // individual token length, computing a bound on the concatenated string
913 // length, and see whether any piece is a wide-string. If any of the string
914 // portions is a wide-string literal, the result is also a wide-string literal
915 // [C99 6.4.5p4].
916 unsigned SizeBound = 0, MaxTokenLength = 0;
917 bool AnyWide = false;
918 do {
919 // The string could be shorter than this if it needs cleaning, but this is a
920 // reasonable bound, which is all we need.
921 SizeBound += Tok.getLength()-2; // -2 for "".
922
923 // Find maximum string piece length.
924 if (Tok.getLength() > MaxTokenLength)
925 MaxTokenLength = Tok.getLength();
926
927 // Remember if we see any wide strings.
928 AnyWide |= Tok.getKind() == tok::wide_string_literal;
929
930 // Remember the string token.
931 StringToks.push_back(Tok);
932 ConsumeStringToken();
933 } while (isTokenStringLiteral());
934
935 // Include space for the null terminator.
936 ++SizeBound;
937
938 // TODO: K&R warning: "traditional C rejects string constant concatenation"
939
Chris Lattner02dffbd2006-10-14 07:50:21 +0000940 // Get the width in bytes of wchar_t. If no wchar_t strings are used, do not
941 // query the target. As such, wchar_tByteWidth is only valid if AnyWide=true.
942 unsigned wchar_tByteWidth = ~0U;
943 if (AnyWide)
944 wchar_tByteWidth=getTargetInfo().getWCharWidth(StringToks[0].getLocation());
Chris Lattnerd3e98952006-10-06 05:22:26 +0000945
946 // The output buffer size needs to be large enough to hold wide characters.
947 // This is a worst-case assumption which basically corresponds to L"" "long".
948 if (AnyWide)
949 SizeBound *= wchar_tByteWidth;
950
Chris Lattner834618d2006-11-03 07:48:41 +0000951 // Create a temporary buffer to hold the result string data.
952 SmallString<512> ResultBuf;
953 ResultBuf.resize(SizeBound);
Chris Lattnerd3e98952006-10-06 05:22:26 +0000954
955 // Likewise, but for each string piece.
Chris Lattner834618d2006-11-03 07:48:41 +0000956 SmallString<512> TokenBuf;
957 TokenBuf.resize(MaxTokenLength);
Chris Lattnerd3e98952006-10-06 05:22:26 +0000958
959 // Loop over all the strings, getting their spelling, and expanding them to
960 // wide strings as appropriate.
Chris Lattner834618d2006-11-03 07:48:41 +0000961 char *ResultPtr = &ResultBuf[0]; // Next byte to fill in.
Chris Lattnerd3e98952006-10-06 05:22:26 +0000962
963 for (unsigned i = 0, e = StringToks.size(); i != e; ++i) {
Chris Lattner834618d2006-11-03 07:48:41 +0000964 const char *ThisTokBuf = &TokenBuf[0];
Chris Lattnerd3e98952006-10-06 05:22:26 +0000965 // Get the spelling of the token, which eliminates trigraphs, etc. We know
966 // that ThisTokBuf points to a buffer that is big enough for the whole token
967 // and 'spelled' tokens can only shrink.
968 unsigned ThisTokLen = PP.getSpelling(StringToks[i], ThisTokBuf);
969 const char *ThisTokEnd = ThisTokBuf+ThisTokLen-1; // Skip end quote.
970
971 // TODO: Input character set mapping support.
972
973 // Skip L marker for wide strings.
974 if (ThisTokBuf[0] == 'L') ++ThisTokBuf;
975
976 assert(ThisTokBuf[0] == '"' && "Expected quote, lexer broken?");
977 ++ThisTokBuf;
978
979 while (ThisTokBuf != ThisTokEnd) {
980 // Is this a span of non-escape characters?
981 if (ThisTokBuf[0] != '\\') {
982 const char *InStart = ThisTokBuf;
983 do {
984 ++ThisTokBuf;
985 } while (ThisTokBuf != ThisTokEnd && ThisTokBuf[0] != '\\');
986
987 // Copy the character span over.
988 unsigned Len = ThisTokBuf-InStart;
989 if (!AnyWide) {
990 memcpy(ResultPtr, InStart, Len);
991 ResultPtr += Len;
992 } else {
993 // Note: our internal rep of wide char tokens is always little-endian.
994 for (; Len; --Len, ++InStart) {
995 *ResultPtr++ = InStart[0];
996 // Add zeros at the end.
997 for (unsigned i = 1, e = wchar_tByteWidth; i != e; ++i)
998 *ResultPtr++ = 0;
999 }
1000 }
1001 continue;
1002 }
1003
1004 // Otherwise, this is an escape character. Skip the '\' char.
1005 ++ThisTokBuf;
1006
1007 // We know that this character can't be off the end of the buffer, because
1008 // that would have been \", which would not have been the end of string.
1009 unsigned ResultChar = *ThisTokBuf++;
1010 switch (ResultChar) {
1011 // These map to themselves.
1012 case '\\': case '\'': case '"': case '?': break;
1013
1014 // These have fixed mappings.
1015 case 'a':
1016 // TODO: K&R: the meaning of '\\a' is different in traditional C
1017 ResultChar = 7;
1018 break;
1019 case 'b':
1020 ResultChar = 8;
1021 break;
1022 case 'e':
1023 PP.Diag(StringToks[i], diag::ext_nonstandard_escape, "e");
1024 ResultChar = 27;
1025 break;
1026 case 'f':
1027 ResultChar = 12;
1028 break;
1029 case 'n':
1030 ResultChar = 10;
1031 break;
1032 case 'r':
1033 ResultChar = 13;
1034 break;
1035 case 't':
1036 ResultChar = 9;
1037 break;
1038 case 'v':
1039 ResultChar = 11;
1040 break;
1041
1042 //case 'u': case 'U': // FIXME: UCNs.
1043 case 'x': // Hex escape.
1044 if (ThisTokBuf == ThisTokEnd ||
1045 (ResultChar = HexDigitValue(*ThisTokBuf)) == ~0U) {
1046 PP.Diag(StringToks[i], diag::err_hex_escape_no_digits);
1047 ResultChar = 0;
1048 break;
1049 }
1050 ++ThisTokBuf; // Consumed one hex digit.
1051
1052 assert(0 && "hex escape: unimp!");
1053 break;
1054 case '0': case '1': case '2': case '3':
1055 case '4': case '5': case '6': case '7':
1056 // Octal escapes.
1057 assert(0 && "octal escape: unimp!");
1058 break;
1059
1060 // Otherwise, these are not valid escapes.
1061 case '(': case '{': case '[': case '%':
1062 // GCC accepts these as extensions. We warn about them as such though.
1063 if (!PP.getLangOptions().NoExtensions) {
1064 PP.Diag(StringToks[i], diag::ext_nonstandard_escape,
1065 std::string()+(char)ResultChar);
1066 break;
1067 }
1068 // FALL THROUGH.
1069 default:
1070 if (isgraph(ThisTokBuf[0])) {
1071 PP.Diag(StringToks[i], diag::ext_unknown_escape,
1072 std::string()+(char)ResultChar);
1073 } else {
1074 PP.Diag(StringToks[i], diag::ext_unknown_escape,
1075 "x"+utohexstr(ResultChar));
1076 }
1077 }
1078
1079 // Note: our internal rep of wide char tokens is always little-endian.
Chris Lattner02dffbd2006-10-14 07:50:21 +00001080 *ResultPtr++ = ResultChar & 0xFF;
1081
1082 if (AnyWide) {
1083 for (unsigned i = 1, e = wchar_tByteWidth; i != e; ++i)
1084 *ResultPtr++ = ResultChar >> i*8;
1085 }
Chris Lattnerd3e98952006-10-06 05:22:26 +00001086 }
1087 }
1088
1089 // Add zero terminator.
1090 *ResultPtr = 0;
1091 if (AnyWide) {
1092 for (unsigned i = 1, e = wchar_tByteWidth; i != e; ++i)
1093 *ResultPtr++ = 0;
1094 }
1095
Chris Lattnerae319692006-10-25 03:49:28 +00001096 SmallVector<SourceLocation, 4> StringTokLocs;
1097 for (unsigned i = 0; i != StringToks.size(); ++i)
1098 StringTokLocs.push_back(StringToks[i].getLocation());
1099
Chris Lattnerd3e98952006-10-06 05:22:26 +00001100 // Hand this off to the Actions.
Chris Lattner834618d2006-11-03 07:48:41 +00001101 return Actions.ParseStringExpr(&ResultBuf[0], ResultPtr-&ResultBuf[0],
1102 AnyWide, &StringTokLocs[0],
1103 StringTokLocs.size());
Chris Lattnerd3e98952006-10-06 05:22:26 +00001104}
1105