blob: c6b22e56bc83a9fa049d38958f61d4c604d8f2f7 [file] [log] [blame]
Chris Lattnerc951dae2006-08-10 04:23:57 +00001//===--- Expression.cpp - Expression Parsing ------------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Chris Lattnercde626a2006-08-12 08:13:25 +000010// This file implements the Expression parsing implementation. Expressions in
11// C99 basically consist of a bunch of binary operators with unary operators and
12// other random stuff at the leaves.
13//
14// In the C99 grammar, these unary operators bind tightest and are represented
15// as the 'cast-expression' production. Everything else is either a binary
Chris Lattnerb7f1fc92006-08-12 16:45:01 +000016// operator (e.g. '/') or a ternary operator ("?:"). The unary leaves are
Chris Lattnercde626a2006-08-12 08:13:25 +000017// handled by ParseCastExpression, the higher level pieces are handled by
18// ParseBinaryExpression.
Chris Lattnerc951dae2006-08-10 04:23:57 +000019//
20//===----------------------------------------------------------------------===//
21
22#include "clang/Parse/Parser.h"
23#include "clang/Basic/Diagnostic.h"
Chris Lattner02dffbd2006-10-14 07:50:21 +000024#include "clang/Basic/TargetInfo.h"
Chris Lattner6d28d9b2006-08-24 03:51:22 +000025#include "llvm/ADT/SmallVector.h"
Chris Lattnerd3e98952006-10-06 05:22:26 +000026#include "llvm/ADT/StringExtras.h"
27#include "llvm/Config/Alloca.h"
Chris Lattnerc951dae2006-08-10 04:23:57 +000028using namespace llvm;
29using namespace clang;
30
/// PrecedenceLevels - Binding strengths of the binary and ternary operators of
/// the C99 grammar.  Each level is named after the grammar production it
/// corresponds to.  A numerically smaller level binds more weakly than a
/// numerically larger one.
namespace prec {
  enum Level {
    Unknown = 0,     // Not a binary operator.
    Comma,           // ,
    Assignment,      // =, *=, /=, %=, +=, -=, <<=, >>=, &=, ^=, |=
    Conditional,     // ?
    LogicalOr,       // ||
    LogicalAnd,      // &&
    InclusiveOr,     // |
    ExclusiveOr,     // ^
    And,             // &
    MinMax,          // <?, >?  min, max (GCC extensions)
    Equality,        // ==, !=
    Relational,      // >=, <=, >, <
    Shift,           // <<, >>
    Additive,        // -, +
    Multiplicative   // *, /, %
  };
}
53
54
55/// getBinOpPrecedence - Return the precedence of the specified binary operator
56/// token. This returns:
57///
58static prec::Level getBinOpPrecedence(tok::TokenKind Kind) {
59 switch (Kind) {
60 default: return prec::Unknown;
61 case tok::comma: return prec::Comma;
62 case tok::equal:
63 case tok::starequal:
64 case tok::slashequal:
65 case tok::percentequal:
66 case tok::plusequal:
67 case tok::minusequal:
68 case tok::lesslessequal:
69 case tok::greatergreaterequal:
70 case tok::ampequal:
71 case tok::caretequal:
72 case tok::pipeequal: return prec::Assignment;
73 case tok::question: return prec::Conditional;
74 case tok::pipepipe: return prec::LogicalOr;
75 case tok::ampamp: return prec::LogicalAnd;
76 case tok::pipe: return prec::InclusiveOr;
77 case tok::caret: return prec::ExclusiveOr;
78 case tok::amp: return prec::And;
79 case tok::lessquestion:
80 case tok::greaterquestion: return prec::MinMax;
81 case tok::exclaimequal:
82 case tok::equalequal: return prec::Equality;
83 case tok::lessequal:
84 case tok::less:
85 case tok::greaterequal:
86 case tok::greater: return prec::Relational;
87 case tok::lessless:
88 case tok::greatergreater: return prec::Shift;
89 case tok::plus:
90 case tok::minus: return prec::Additive;
91 case tok::percent:
92 case tok::slash:
93 case tok::star: return prec::Multiplicative;
94 }
95}
96
97
Chris Lattnerce7e21d2006-08-12 17:22:40 +000098/// ParseExpression - Simple precedence-based parser for binary/ternary
Chris Lattnercde626a2006-08-12 08:13:25 +000099/// operators.
100///
Chris Lattnerb7f1fc92006-08-12 16:45:01 +0000101/// Note: we diverge from the C99 grammar when parsing the assignment-expression
102/// production. C99 specifies that the LHS of an assignment operator should be
103/// parsed as a unary-expression, but consistency dictates that it be a
/// conditional-expression.  In practice, the important thing here is that the
105/// LHS of an assignment has to be an l-value, which productions between
106/// unary-expression and conditional-expression don't produce. Because we want
107/// consistency, we parse the LHS as a conditional-expression, then check for
108/// l-value-ness in semantic analysis stages.
109///
Chris Lattnercde626a2006-08-12 08:13:25 +0000110/// multiplicative-expression: [C99 6.5.5]
111/// cast-expression
112/// multiplicative-expression '*' cast-expression
113/// multiplicative-expression '/' cast-expression
114/// multiplicative-expression '%' cast-expression
115///
116/// additive-expression: [C99 6.5.6]
117/// multiplicative-expression
118/// additive-expression '+' multiplicative-expression
119/// additive-expression '-' multiplicative-expression
120///
121/// shift-expression: [C99 6.5.7]
122/// additive-expression
123/// shift-expression '<<' additive-expression
124/// shift-expression '>>' additive-expression
125///
126/// relational-expression: [C99 6.5.8]
127/// shift-expression
128/// relational-expression '<' shift-expression
129/// relational-expression '>' shift-expression
130/// relational-expression '<=' shift-expression
131/// relational-expression '>=' shift-expression
132///
133/// equality-expression: [C99 6.5.9]
134/// relational-expression
135/// equality-expression '==' relational-expression
136/// equality-expression '!=' relational-expression
137///
138/// AND-expression: [C99 6.5.10]
139/// equality-expression
140/// AND-expression '&' equality-expression
141///
142/// exclusive-OR-expression: [C99 6.5.11]
143/// AND-expression
144/// exclusive-OR-expression '^' AND-expression
145///
146/// inclusive-OR-expression: [C99 6.5.12]
147/// exclusive-OR-expression
148/// inclusive-OR-expression '|' exclusive-OR-expression
149///
150/// logical-AND-expression: [C99 6.5.13]
151/// inclusive-OR-expression
152/// logical-AND-expression '&&' inclusive-OR-expression
153///
154/// logical-OR-expression: [C99 6.5.14]
155/// logical-AND-expression
156/// logical-OR-expression '||' logical-AND-expression
157///
158/// conditional-expression: [C99 6.5.15]
159/// logical-OR-expression
160/// logical-OR-expression '?' expression ':' conditional-expression
161/// [GNU] logical-OR-expression '?' ':' conditional-expression
162///
163/// assignment-expression: [C99 6.5.16]
164/// conditional-expression
165/// unary-expression assignment-operator assignment-expression
166///
167/// assignment-operator: one of
168/// = *= /= %= += -= <<= >>= &= ^= |=
169///
170/// expression: [C99 6.5.17]
171/// assignment-expression
172/// expression ',' assignment-expression
173///
Chris Lattnerd35c34f2006-08-12 17:04:50 +0000174Parser::ExprResult Parser::ParseExpression() {
Chris Lattnercde626a2006-08-12 08:13:25 +0000175 ExprResult LHS = ParseCastExpression(false);
176 if (LHS.isInvalid) return LHS;
177
178 return ParseRHSOfBinaryExpression(LHS, prec::Comma);
179}
180
Chris Lattner0c6c0342006-08-12 18:12:45 +0000181/// ParseAssignmentExpression - Parse an expr that doesn't include commas.
182///
Chris Lattnerce7e21d2006-08-12 17:22:40 +0000183Parser::ExprResult Parser::ParseAssignmentExpression() {
184 ExprResult LHS = ParseCastExpression(false);
185 if (LHS.isInvalid) return LHS;
186
187 return ParseRHSOfBinaryExpression(LHS, prec::Assignment);
188}
189
Chris Lattner3b561a32006-08-13 00:12:11 +0000190Parser::ExprResult Parser::ParseConstantExpression() {
191 ExprResult LHS = ParseCastExpression(false);
192 if (LHS.isInvalid) return LHS;
193
194 // TODO: Validate that this is a constant expr!
195 return ParseRHSOfBinaryExpression(LHS, prec::Conditional);
196}
197
Chris Lattner0c6c0342006-08-12 18:12:45 +0000198/// ParseExpressionWithLeadingIdentifier - This special purpose method is used
199/// in contexts where we have already consumed an identifier (which we saved in
200/// 'Tok'), then discovered that the identifier was really the leading token of
201/// part of an expression. For example, in "A[1]+B", we consumed "A" (which is
202/// now in 'Tok') and the current token is "[".
203Parser::ExprResult Parser::
204ParseExpressionWithLeadingIdentifier(const LexerToken &Tok) {
205 // We know that 'Tok' must correspond to this production:
206 // primary-expression: identifier
207
208 // TODO: Pass 'Tok' to the action.
209 ExprResult Res = ExprResult(false);
210
211 // Because we have to parse an entire cast-expression before starting the
212 // ParseRHSOfBinaryExpression method (which parses any trailing binops), we
213 // need to handle the 'postfix-expression' rules. We do this by invoking
214 // ParsePostfixExpressionSuffix to consume any postfix-expression suffixes:
215 Res = ParsePostfixExpressionSuffix(Res);
216 if (Res.isInvalid) return Res;
217
218 // At this point, the "A[1]" part of "A[1]+B" has been consumed. Once this is
219 // done, we know we don't have to do anything for cast-expression, because the
220 // only non-postfix-expression production starts with a '(' token, and we know
221 // we have an identifier. As such, we can invoke ParseRHSOfBinaryExpression
222 // to consume any trailing operators (e.g. "+" in this example) and connected
223 // chunks of the expression.
224 return ParseRHSOfBinaryExpression(Res, prec::Comma);
225}
226
Chris Lattner8693a512006-08-13 21:54:02 +0000227/// ParseExpressionWithLeadingIdentifier - This special purpose method is used
228/// in contexts where we have already consumed an identifier (which we saved in
229/// 'Tok'), then discovered that the identifier was really the leading token of
230/// part of an assignment-expression. For example, in "A[1]+B", we consumed "A"
231/// (which is now in 'Tok') and the current token is "[".
232Parser::ExprResult Parser::
233ParseAssignmentExprWithLeadingIdentifier(const LexerToken &Tok) {
234 // We know that 'Tok' must correspond to this production:
235 // primary-expression: identifier
236
237 // TODO: Pass 'Tok' to the action.
238 ExprResult Res = ExprResult(false);
239
240 // Because we have to parse an entire cast-expression before starting the
241 // ParseRHSOfBinaryExpression method (which parses any trailing binops), we
242 // need to handle the 'postfix-expression' rules. We do this by invoking
243 // ParsePostfixExpressionSuffix to consume any postfix-expression suffixes:
244 Res = ParsePostfixExpressionSuffix(Res);
245 if (Res.isInvalid) return Res;
246
247 // At this point, the "A[1]" part of "A[1]+B" has been consumed. Once this is
248 // done, we know we don't have to do anything for cast-expression, because the
249 // only non-postfix-expression production starts with a '(' token, and we know
250 // we have an identifier. As such, we can invoke ParseRHSOfBinaryExpression
251 // to consume any trailing operators (e.g. "+" in this example) and connected
252 // chunks of the expression.
253 return ParseRHSOfBinaryExpression(Res, prec::Assignment);
254}
255
256
Chris Lattner62591722006-08-12 18:40:58 +0000257/// ParseAssignmentExpressionWithLeadingStar - This special purpose method is
258/// used in contexts where we have already consumed a '*' (which we saved in
259/// 'Tok'), then discovered that the '*' was really the leading token of an
260/// expression. For example, in "*(int*)P+B", we consumed "*" (which is
261/// now in 'Tok') and the current token is "(".
262Parser::ExprResult Parser::
263ParseAssignmentExpressionWithLeadingStar(const LexerToken &Tok) {
264 // We know that 'Tok' must correspond to this production:
265 // unary-expression: unary-operator cast-expression
266 // where 'unary-operator' is '*'.
267
268 // Parse the cast-expression that follows the '*'. This will parse the
269 // "*(int*)P" part of "*(int*)P+B".
270 ExprResult Res = ParseCastExpression(false);
271 if (Res.isInvalid) return Res;
272
273 // TODO: Combine Tok + Res to get the new AST.
274
275 // We have to parse an entire cast-expression before starting the
276 // ParseRHSOfBinaryExpression method (which parses any trailing binops). Since
277 // we know that the only production above us is the cast-expression
278 // production, and because the only alternative productions start with a '('
279 // token (we know we had a '*'), there is no work to do to get a whole
280 // cast-expression.
281
282 // At this point, the "*(int*)P" part of "*(int*)P+B" has been consumed. Once
283 // this is done, we can invoke ParseRHSOfBinaryExpression to consume any
284 // trailing operators (e.g. "+" in this example) and connected chunks of the
285 // assignment-expression.
286 return ParseRHSOfBinaryExpression(Res, prec::Assignment);
287}
288
289
Chris Lattnercde626a2006-08-12 08:13:25 +0000290/// ParseRHSOfBinaryExpression - Parse a binary expression that starts with
291/// LHS and has a precedence of at least MinPrec.
292Parser::ExprResult
293Parser::ParseRHSOfBinaryExpression(ExprResult LHS, unsigned MinPrec) {
294 unsigned NextTokPrec = getBinOpPrecedence(Tok.getKind());
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000295 SourceLocation ColonLoc;
296
Chris Lattnercde626a2006-08-12 08:13:25 +0000297 while (1) {
298 // If this token has a lower precedence than we are allowed to parse (e.g.
299 // because we are called recursively, or because the token is not a binop),
300 // then we are done!
301 if (NextTokPrec < MinPrec)
302 return LHS;
303
304 // Consume the operator, saving the operator token for error reporting.
305 LexerToken OpToken = Tok;
306 ConsumeToken();
307
Chris Lattner96c3deb2006-08-12 17:13:08 +0000308 // Special case handling for the ternary operator.
Chris Lattnerb5600a62006-10-06 05:40:05 +0000309 ExprResult TernaryMiddle(true);
Chris Lattner96c3deb2006-08-12 17:13:08 +0000310 if (NextTokPrec == prec::Conditional) {
311 if (Tok.getKind() != tok::colon) {
312 // Handle this production specially:
313 // logical-OR-expression '?' expression ':' conditional-expression
314 // In particular, the RHS of the '?' is 'expression', not
315 // 'logical-OR-expression' as we might expect.
316 TernaryMiddle = ParseExpression();
317 if (TernaryMiddle.isInvalid) return TernaryMiddle;
318 } else {
319 // Special case handling of "X ? Y : Z" where Y is empty:
320 // logical-OR-expression '?' ':' conditional-expression [GNU]
321 TernaryMiddle = ExprResult(false);
322 Diag(Tok, diag::ext_gnu_conditional_expr);
323 }
324
325 if (Tok.getKind() != tok::colon) {
326 Diag(Tok, diag::err_expected_colon);
327 Diag(OpToken, diag::err_matching, "?");
328 return ExprResult(true);
329 }
330
331 // Eat the colon.
Chris Lattneraf635312006-10-16 06:06:51 +0000332 ColonLoc = ConsumeToken();
Chris Lattnercde626a2006-08-12 08:13:25 +0000333 }
Chris Lattner96c3deb2006-08-12 17:13:08 +0000334
335 // Parse another leaf here for the RHS of the operator.
336 ExprResult RHS = ParseCastExpression(false);
337 if (RHS.isInvalid) return RHS;
Chris Lattnercde626a2006-08-12 08:13:25 +0000338
339 // Remember the precedence of this operator and get the precedence of the
340 // operator immediately to the right of the RHS.
341 unsigned ThisPrec = NextTokPrec;
342 NextTokPrec = getBinOpPrecedence(Tok.getKind());
Chris Lattner89d53752006-08-12 17:18:19 +0000343
344 // Assignment and conditional expressions are right-associative.
345 bool isRightAssoc = NextTokPrec == prec::Conditional ||
346 NextTokPrec == prec::Assignment;
Chris Lattnercde626a2006-08-12 08:13:25 +0000347
348 // Get the precedence of the operator to the right of the RHS. If it binds
349 // more tightly with RHS than we do, evaluate it completely first.
Chris Lattnercde626a2006-08-12 08:13:25 +0000350 if (ThisPrec < NextTokPrec ||
351 (ThisPrec == NextTokPrec && isRightAssoc)) {
Chris Lattner89d53752006-08-12 17:18:19 +0000352 // If this is left-associative, only parse things on the RHS that bind
353 // more tightly than the current operator. If it is left-associative, it
354 // is okay, to bind exactly as tightly. For example, compile A=B=C=D as
355 // A=(B=(C=D)), where each paren is a level of recursion here.
356 RHS = ParseRHSOfBinaryExpression(RHS, ThisPrec + !isRightAssoc);
Chris Lattnercde626a2006-08-12 08:13:25 +0000357 if (RHS.isInvalid) return RHS;
358
359 NextTokPrec = getBinOpPrecedence(Tok.getKind());
360 }
361 assert(NextTokPrec <= ThisPrec && "Recursion didn't work!");
362
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000363 // Combine the LHS and RHS into the LHS (e.g. build AST).
Chris Lattnerb5600a62006-10-06 05:40:05 +0000364 if (TernaryMiddle.isInvalid)
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000365 LHS = Actions.ParseBinOp(OpToken, LHS.Val, RHS.Val);
366 else
367 LHS = Actions.ParseConditionalOp(OpToken.getLocation(), ColonLoc,
368 LHS.Val, TernaryMiddle.Val, RHS.Val);
Chris Lattnercde626a2006-08-12 08:13:25 +0000369 }
370}
371
Chris Lattnereaf06592006-08-11 02:02:23 +0000372/// ParseCastExpression - Parse a cast-expression, or, if isUnaryExpression is
373/// true, parse a unary-expression.
374///
Chris Lattner4564bc12006-08-10 23:14:52 +0000375/// cast-expression: [C99 6.5.4]
376/// unary-expression
377/// '(' type-name ')' cast-expression
Chris Lattner81b576e2006-08-11 02:13:20 +0000378///
Chris Lattnerc2dd85a2006-08-10 22:57:16 +0000379/// unary-expression: [C99 6.5.3]
380/// postfix-expression
381/// '++' unary-expression
382/// '--' unary-expression
383/// unary-operator cast-expression
384/// 'sizeof' unary-expression
385/// 'sizeof' '(' type-name ')'
386/// [GNU] '__alignof' unary-expression
387/// [GNU] '__alignof' '(' type-name ')'
388/// [GNU] '&&' identifier
Chris Lattner81b576e2006-08-11 02:13:20 +0000389///
Chris Lattnerc2dd85a2006-08-10 22:57:16 +0000390/// unary-operator: one of
391/// '&' '*' '+' '-' '~' '!'
392/// [GNU] '__extension__' '__real' '__imag'
393///
Chris Lattner52a99e52006-08-10 20:56:00 +0000394/// primary-expression: [C99 6.5.1]
Chris Lattnerc5e0d4a2006-08-10 19:06:03 +0000395/// identifier
396/// constant
397/// string-literal
398/// '(' expression ')'
Chris Lattner52a99e52006-08-10 20:56:00 +0000399/// '__func__' [C99 6.4.2.2]
400/// [GNU] '__FUNCTION__'
401/// [GNU] '__PRETTY_FUNCTION__'
402/// [GNU] '(' compound-statement ')'
403/// [GNU] '__builtin_va_arg' '(' assignment-expression ',' type-name ')'
404/// [GNU] '__builtin_offsetof' '(' type-name ',' offsetof-member-designator')'
405/// [GNU] '__builtin_choose_expr' '(' assign-expr ',' assign-expr ','
406/// assign-expr ')'
407/// [GNU] '__builtin_types_compatible_p' '(' type-name ',' type-name ')'
408/// [OBC] '[' objc-receiver objc-message-args ']' [TODO]
409/// [OBC] '@selector' '(' objc-selector-arg ')' [TODO]
410/// [OBC] '@protocol' '(' identifier ')' [TODO]
411/// [OBC] '@encode' '(' type-name ')' [TODO]
412/// [OBC] objc-string-literal [TODO]
413///
414/// constant: [C99 6.4.4]
415/// integer-constant
416/// floating-constant
417/// enumeration-constant -> identifier
418/// character-constant
Chris Lattner52a99e52006-08-10 20:56:00 +0000419///
Chris Lattner89c50c62006-08-11 06:41:18 +0000420Parser::ExprResult Parser::ParseCastExpression(bool isUnaryExpression) {
421 ExprResult Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000422 tok::TokenKind SavedKind = Tok.getKind();
Chris Lattner89c50c62006-08-11 06:41:18 +0000423
Chris Lattner81b576e2006-08-11 02:13:20 +0000424 // This handles all of cast-expression, unary-expression, postfix-expression,
425 // and primary-expression. We handle them together like this for efficiency
426 // and to simplify handling of an expression starting with a '(' token: which
427 // may be one of a parenthesized expression, cast-expression, compound literal
428 // expression, or statement expression.
429 //
430 // If the parsed tokens consist of a primary-expression, the cases below
Chris Lattner20c6a452006-08-12 17:40:43 +0000431 // call ParsePostfixExpressionSuffix to handle the postfix expression
432 // suffixes. Cases that cannot be followed by postfix exprs should
433 // return without invoking ParsePostfixExpressionSuffix.
Chris Lattner52a99e52006-08-10 20:56:00 +0000434 switch (Tok.getKind()) {
Chris Lattnere550a4e2006-08-24 06:37:51 +0000435 case tok::l_paren: {
Chris Lattner81b576e2006-08-11 02:13:20 +0000436 // If this expression is limited to being a unary-expression, the parent can
437 // not start a cast expression.
438 ParenParseOption ParenExprType =
439 isUnaryExpression ? CompoundLiteral : CastExpr;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000440 TypeTy *CastTy;
441 SourceLocation LParenLoc = Tok.getLocation();
442 SourceLocation RParenLoc;
443 Res = ParseParenExpression(ParenExprType, CastTy, RParenLoc);
Chris Lattner89c50c62006-08-11 06:41:18 +0000444 if (Res.isInvalid) return Res;
445
Chris Lattner81b576e2006-08-11 02:13:20 +0000446 switch (ParenExprType) {
447 case SimpleExpr: break; // Nothing else to do.
448 case CompoundStmt: break; // Nothing else to do.
449 case CompoundLiteral:
450 // We parsed '(' type-name ')' '{' ... '}'. If any suffixes of
451 // postfix-expression exist, parse them now.
452 break;
453 case CastExpr:
454 // We parsed '(' type-name ')' and the thing after it wasn't a '{'. Parse
455 // the cast-expression that follows it next.
Chris Lattnere550a4e2006-08-24 06:37:51 +0000456 // TODO: For cast expression with CastTy.
457 Res = ParseCastExpression(false);
458 if (!Res.isInvalid)
459 Res = Actions.ParseCastExpr(LParenLoc, CastTy, RParenLoc, Res.Val);
460 return Res;
Chris Lattner81b576e2006-08-11 02:13:20 +0000461 }
Chris Lattner20c6a452006-08-12 17:40:43 +0000462
463 // These can be followed by postfix-expr pieces.
464 return ParsePostfixExpressionSuffix(Res);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000465 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000466
Chris Lattner52a99e52006-08-10 20:56:00 +0000467 // primary-expression
Chris Lattner9b6d4cb2006-08-23 05:17:46 +0000468 case tok::numeric_constant:
469 // constant: integer-constant
470 // constant: floating-constant
471
472 // TODO: Validate whether this is an integer or floating-constant or
473 // neither.
474 if (1) {
475 Res = Actions.ParseIntegerConstant(Tok);
476 } else {
477 Res = Actions.ParseFloatingConstant(Tok);
478 }
479 ConsumeToken();
480
481 // These can be followed by postfix-expr pieces.
482 return ParsePostfixExpressionSuffix(Res);
483
Chris Lattner52a99e52006-08-10 20:56:00 +0000484 case tok::identifier: // primary-expression: identifier
485 // constant: enumeration-constant
Chris Lattner52a99e52006-08-10 20:56:00 +0000486 case tok::char_constant: // constant: character-constant
487 case tok::kw___func__: // primary-expression: __func__ [C99 6.4.2.2]
488 case tok::kw___FUNCTION__: // primary-expression: __FUNCTION__ [GNU]
489 case tok::kw___PRETTY_FUNCTION__: // primary-expression: __P..Y_F..N__ [GNU]
Chris Lattner879b9ad2006-08-24 04:53:44 +0000490 Res = Actions.ParseSimplePrimaryExpr(Tok);
Chris Lattner52a99e52006-08-10 20:56:00 +0000491 ConsumeToken();
Chris Lattner20c6a452006-08-12 17:40:43 +0000492 // These can be followed by postfix-expr pieces.
493 return ParsePostfixExpressionSuffix(Res);
Chris Lattner52a99e52006-08-10 20:56:00 +0000494 case tok::string_literal: // primary-expression: string-literal
Chris Lattnerd3e98952006-10-06 05:22:26 +0000495 case tok::wide_string_literal:
Chris Lattner89c50c62006-08-11 06:41:18 +0000496 Res = ParseStringLiteralExpression();
497 if (Res.isInvalid) return Res;
Chris Lattner20c6a452006-08-12 17:40:43 +0000498 // This can be followed by postfix-expr pieces (e.g. "foo"[1]).
499 return ParsePostfixExpressionSuffix(Res);
Chris Lattnerf8339772006-08-10 22:01:51 +0000500 case tok::kw___builtin_va_arg:
501 case tok::kw___builtin_offsetof:
502 case tok::kw___builtin_choose_expr:
503 case tok::kw___builtin_types_compatible_p:
Chris Lattner11124352006-08-12 19:16:08 +0000504 return ParseBuiltinPrimaryExpression();
Chris Lattner81b576e2006-08-11 02:13:20 +0000505 case tok::plusplus: // unary-expression: '++' unary-expression
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000506 case tok::minusminus: { // unary-expression: '--' unary-expression
507 SourceLocation SavedLoc = ConsumeToken();
Chris Lattner1b926492006-08-23 06:42:10 +0000508 Res = ParseCastExpression(true);
509 if (!Res.isInvalid)
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000510 Res = Actions.ParseUnaryOp(SavedLoc, SavedKind, Res.Val);
Chris Lattner1b926492006-08-23 06:42:10 +0000511 return Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000512 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000513 case tok::amp: // unary-expression: '&' cast-expression
514 case tok::star: // unary-expression: '*' cast-expression
515 case tok::plus: // unary-expression: '+' cast-expression
516 case tok::minus: // unary-expression: '-' cast-expression
517 case tok::tilde: // unary-expression: '~' cast-expression
518 case tok::exclaim: // unary-expression: '!' cast-expression
519 case tok::kw___real: // unary-expression: '__real' cast-expression [GNU]
Chris Lattner1b926492006-08-23 06:42:10 +0000520 case tok::kw___imag: // unary-expression: '__imag' cast-expression [GNU]
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000521 case tok::kw___extension__:{//unary-expression:'__extension__' cast-expr [GNU]
Chris Lattner4daa0772006-10-20 05:03:44 +0000522 // FIXME: Extension not handled correctly here!
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000523 SourceLocation SavedLoc = ConsumeToken();
Chris Lattner1b926492006-08-23 06:42:10 +0000524 Res = ParseCastExpression(false);
525 if (!Res.isInvalid)
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000526 Res = Actions.ParseUnaryOp(SavedLoc, SavedKind, Res.Val);
Chris Lattner1b926492006-08-23 06:42:10 +0000527 return Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000528 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000529 case tok::kw_sizeof: // unary-expression: 'sizeof' unary-expression
530 // unary-expression: 'sizeof' '(' type-name ')'
531 case tok::kw___alignof: // unary-expression: '__alignof' unary-expression
532 // unary-expression: '__alignof' '(' type-name ')'
Chris Lattner89c50c62006-08-11 06:41:18 +0000533 return ParseSizeofAlignofExpression();
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000534 case tok::ampamp: { // unary-expression: '&&' identifier
Chris Lattner81b576e2006-08-11 02:13:20 +0000535 Diag(Tok, diag::ext_gnu_address_of_label);
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000536 SourceLocation SavedLoc = ConsumeToken();
Chris Lattner14a1b642006-10-15 22:33:58 +0000537
538 if (Tok.getKind() != tok::identifier) {
Chris Lattner81b576e2006-08-11 02:13:20 +0000539 Diag(Tok, diag::err_expected_ident);
Chris Lattner89c50c62006-08-11 06:41:18 +0000540 return ExprResult(true);
Chris Lattner81b576e2006-08-11 02:13:20 +0000541 }
Chris Lattner14a1b642006-10-15 22:33:58 +0000542 // FIXME: Create a label ref for Tok.Ident.
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000543 Res = Actions.ParseUnaryOp(SavedLoc, SavedKind, 0);
Chris Lattner14a1b642006-10-15 22:33:58 +0000544 ConsumeToken();
545
546 return Res;
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000547 }
Chris Lattner52a99e52006-08-10 20:56:00 +0000548 default:
549 Diag(Tok, diag::err_expected_expression);
Chris Lattner89c50c62006-08-11 06:41:18 +0000550 return ExprResult(true);
Chris Lattnerf8339772006-08-10 22:01:51 +0000551 }
552
Chris Lattner20c6a452006-08-12 17:40:43 +0000553 // unreachable.
554 abort();
555}
556
557/// ParsePostfixExpressionSuffix - Once the leading part of a postfix-expression
558/// is parsed, this method parses any suffixes that apply.
559///
560/// postfix-expression: [C99 6.5.2]
561/// primary-expression
562/// postfix-expression '[' expression ']'
563/// postfix-expression '(' argument-expression-list[opt] ')'
564/// postfix-expression '.' identifier
565/// postfix-expression '->' identifier
566/// postfix-expression '++'
567/// postfix-expression '--'
568/// '(' type-name ')' '{' initializer-list '}'
569/// '(' type-name ')' '{' initializer-list ',' '}'
570///
571/// argument-expression-list: [C99 6.5.2]
572/// argument-expression
573/// argument-expression-list ',' assignment-expression
574///
575Parser::ExprResult Parser::ParsePostfixExpressionSuffix(ExprResult LHS) {
Chris Lattner20c6a452006-08-12 17:40:43 +0000576
Chris Lattnerf8339772006-08-10 22:01:51 +0000577 // Now that the primary-expression piece of the postfix-expression has been
578 // parsed, see if there are any postfix-expression pieces here.
579 SourceLocation Loc;
580 while (1) {
581 switch (Tok.getKind()) {
Chris Lattner20c6a452006-08-12 17:40:43 +0000582 default: // Not a postfix-expression suffix.
583 return LHS;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000584 case tok::l_square: { // postfix-expression: p-e '[' expression ']'
Chris Lattner04132372006-10-16 06:12:55 +0000585 Loc = ConsumeBracket();
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000586 ExprResult Idx = ParseExpression();
587
588 SourceLocation RLoc = Tok.getLocation();
589
590 if (!LHS.isInvalid && !Idx.isInvalid && Tok.getKind() == tok::r_square)
591 LHS = Actions.ParseArraySubscriptExpr(LHS.Val, Loc, Idx.Val, RLoc);
592 else
593 LHS = ExprResult(true);
594
Chris Lattner89c50c62006-08-11 06:41:18 +0000595 // Match the ']'.
Chris Lattner04f80192006-08-15 04:55:54 +0000596 MatchRHSPunctuation(tok::r_square, Loc);
Chris Lattner89c50c62006-08-11 06:41:18 +0000597 break;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000598 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000599
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000600 case tok::l_paren: { // p-e: p-e '(' argument-expression-list[opt] ')'
601 SmallVector<ExprTy*, 8> ArgExprs;
602 SmallVector<SourceLocation, 8> CommaLocs;
603 bool ArgExprsOk = true;
604
Chris Lattner04132372006-10-16 06:12:55 +0000605 Loc = ConsumeParen();
Chris Lattner89c50c62006-08-11 06:41:18 +0000606
Chris Lattner0c6c0342006-08-12 18:12:45 +0000607 if (Tok.getKind() != tok::r_paren) {
608 while (1) {
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000609 ExprResult ArgExpr = ParseAssignmentExpression();
610 if (ArgExpr.isInvalid)
611 ArgExprsOk = false;
612 else
613 ArgExprs.push_back(ArgExpr.Val);
614
Chris Lattner0c6c0342006-08-12 18:12:45 +0000615 if (Tok.getKind() != tok::comma)
616 break;
Chris Lattneraf635312006-10-16 06:06:51 +0000617 // Move to the next argument, remember where the comma was.
618 CommaLocs.push_back(ConsumeToken());
Chris Lattner0c6c0342006-08-12 18:12:45 +0000619 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000620 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000621
Chris Lattner89c50c62006-08-11 06:41:18 +0000622 // Match the ')'.
Chris Lattnere165d942006-08-24 04:40:38 +0000623 if (!LHS.isInvalid && ArgExprsOk && Tok.getKind() == tok::r_paren) {
624 assert((ArgExprs.size() == 0 || ArgExprs.size()-1 == CommaLocs.size())&&
625 "Unexpected number of commas!");
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000626 LHS = Actions.ParseCallExpr(LHS.Val, Loc, &ArgExprs[0], ArgExprs.size(),
Chris Lattnere165d942006-08-24 04:40:38 +0000627 &CommaLocs[0], Tok.getLocation());
628 }
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000629
Chris Lattner04f80192006-08-15 04:55:54 +0000630 MatchRHSPunctuation(tok::r_paren, Loc);
Chris Lattner89c50c62006-08-11 06:41:18 +0000631 break;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000632 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000633 case tok::arrow: // postfix-expression: p-e '->' identifier
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000634 case tok::period: { // postfix-expression: p-e '.' identifier
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000635 tok::TokenKind OpKind = Tok.getKind();
Chris Lattneraf635312006-10-16 06:06:51 +0000636 SourceLocation OpLoc = ConsumeToken(); // Eat the "." or "->" token.
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000637
Chris Lattner89c50c62006-08-11 06:41:18 +0000638 if (Tok.getKind() != tok::identifier) {
639 Diag(Tok, diag::err_expected_ident);
640 return ExprResult(true);
641 }
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000642
643 if (!LHS.isInvalid)
644 LHS = Actions.ParseMemberReferenceExpr(LHS.Val, OpLoc, OpKind,
645 Tok.getLocation(),
646 *Tok.getIdentifierInfo());
Chris Lattner89c50c62006-08-11 06:41:18 +0000647 ConsumeToken();
648 break;
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000649 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000650 case tok::plusplus: // postfix-expression: postfix-expression '++'
651 case tok::minusminus: // postfix-expression: postfix-expression '--'
Chris Lattner1b926492006-08-23 06:42:10 +0000652 if (!LHS.isInvalid)
653 LHS = Actions.ParsePostfixUnaryOp(Tok, LHS.Val);
Chris Lattner89c50c62006-08-11 06:41:18 +0000654 ConsumeToken();
655 break;
Chris Lattnerf8339772006-08-10 22:01:51 +0000656 }
657 }
Chris Lattner52a99e52006-08-10 20:56:00 +0000658}
659
Chris Lattner20c6a452006-08-12 17:40:43 +0000660
Chris Lattner81b576e2006-08-11 02:13:20 +0000661/// ParseSizeofAlignofExpression - Parse a sizeof or alignof expression.
662/// unary-expression: [C99 6.5.3]
663/// 'sizeof' unary-expression
664/// 'sizeof' '(' type-name ')'
665/// [GNU] '__alignof' unary-expression
666/// [GNU] '__alignof' '(' type-name ')'
Chris Lattner89c50c62006-08-11 06:41:18 +0000667Parser::ExprResult Parser::ParseSizeofAlignofExpression() {
Chris Lattner81b576e2006-08-11 02:13:20 +0000668 assert((Tok.getKind() == tok::kw_sizeof ||
669 Tok.getKind() == tok::kw___alignof) &&
670 "Not a sizeof/alignof expression!");
Chris Lattner26115ac2006-08-24 06:10:04 +0000671 LexerToken OpTok = Tok;
Chris Lattner81b576e2006-08-11 02:13:20 +0000672 ConsumeToken();
673
674 // If the operand doesn't start with an '(', it must be an expression.
Chris Lattner26115ac2006-08-24 06:10:04 +0000675 ExprResult Operand;
676 if (Tok.getKind() != tok::l_paren) {
677 Operand = ParseCastExpression(true);
678 } else {
679 // If it starts with a '(', we know that it is either a parenthesized
680 // type-name, or it is a unary-expression that starts with a compound
681 // literal, or starts with a primary-expression that is a parenthesized
682 // expression.
683 ParenParseOption ExprType = CastExpr;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000684 TypeTy *CastTy;
Chris Lattner26da7302006-08-24 06:49:19 +0000685 SourceLocation LParenLoc = Tok.getLocation(), RParenLoc;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000686 Operand = ParseParenExpression(ExprType, CastTy, RParenLoc);
Chris Lattner26115ac2006-08-24 06:10:04 +0000687
688 // If ParseParenExpression parsed a '(typename)' sequence only, the this is
689 // sizeof/alignof a type. Otherwise, it is sizeof/alignof an expression.
690 if (ExprType == CastExpr) {
Chris Lattner26da7302006-08-24 06:49:19 +0000691 return Actions.ParseSizeOfAlignOfTypeExpr(OpTok.getLocation(),
692 OpTok.getKind() == tok::kw_sizeof,
693 LParenLoc, CastTy, RParenLoc);
Chris Lattner26115ac2006-08-24 06:10:04 +0000694 }
695 }
Chris Lattner81b576e2006-08-11 02:13:20 +0000696
Chris Lattner26115ac2006-08-24 06:10:04 +0000697 // If we get here, the operand to the sizeof/alignof was an expresion.
698 if (!Operand.isInvalid)
Chris Lattner0ba3dc42006-10-25 03:38:23 +0000699 Operand = Actions.ParseUnaryOp(OpTok.getLocation(), OpTok.getKind(),
700 Operand.Val);
Chris Lattner26115ac2006-08-24 06:10:04 +0000701 return Operand;
Chris Lattner81b576e2006-08-11 02:13:20 +0000702}
703
Chris Lattner11124352006-08-12 19:16:08 +0000704/// ParseBuiltinPrimaryExpression
705///
706/// primary-expression: [C99 6.5.1]
707/// [GNU] '__builtin_va_arg' '(' assignment-expression ',' type-name ')'
708/// [GNU] '__builtin_offsetof' '(' type-name ',' offsetof-member-designator')'
709/// [GNU] '__builtin_choose_expr' '(' assign-expr ',' assign-expr ','
710/// assign-expr ')'
711/// [GNU] '__builtin_types_compatible_p' '(' type-name ',' type-name ')'
712///
713/// [GNU] offsetof-member-designator:
714/// [GNU] identifier
715/// [GNU] offsetof-member-designator '.' identifier
716/// [GNU] offsetof-member-designator '[' expression ']'
717///
718Parser::ExprResult Parser::ParseBuiltinPrimaryExpression() {
719 ExprResult Res(false);
Chris Lattner11124352006-08-12 19:16:08 +0000720 const IdentifierInfo *BuiltinII = Tok.getIdentifierInfo();
721
722 tok::TokenKind T = Tok.getKind();
Chris Lattneraf635312006-10-16 06:06:51 +0000723 SourceLocation StartLoc = ConsumeToken(); // Eat the builtin identifier.
Chris Lattner11124352006-08-12 19:16:08 +0000724
725 // All of these start with an open paren.
726 if (Tok.getKind() != tok::l_paren) {
727 Diag(Tok, diag::err_expected_lparen_after, BuiltinII->getName());
728 return ExprResult(true);
729 }
730
Chris Lattner04132372006-10-16 06:12:55 +0000731 SourceLocation LParenLoc = ConsumeParen();
Chris Lattner6d28d9b2006-08-24 03:51:22 +0000732 // TODO: Build AST.
733
Chris Lattner11124352006-08-12 19:16:08 +0000734 switch (T) {
735 default: assert(0 && "Not a builtin primary expression!");
736 case tok::kw___builtin_va_arg:
737 Res = ParseAssignmentExpression();
738 if (Res.isInvalid) {
739 SkipUntil(tok::r_paren);
740 return Res;
741 }
Chris Lattner0be454e2006-08-12 19:30:51 +0000742
Chris Lattner6d7e6342006-08-15 03:41:14 +0000743 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000744 return ExprResult(true);
Chris Lattner0be454e2006-08-12 19:30:51 +0000745
Chris Lattner11124352006-08-12 19:16:08 +0000746 ParseTypeName();
747 break;
748
749 case tok::kw___builtin_offsetof:
750 ParseTypeName();
751
Chris Lattner6d7e6342006-08-15 03:41:14 +0000752 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000753 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000754
755 // We must have at least one identifier here.
Chris Lattner6d7e6342006-08-15 03:41:14 +0000756 if (ExpectAndConsume(tok::identifier, diag::err_expected_ident, "",
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000757 tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000758 return ExprResult(true);
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000759
Chris Lattner11124352006-08-12 19:16:08 +0000760 while (1) {
761 if (Tok.getKind() == tok::period) {
762 // offsetof-member-designator: offsetof-member-designator '.' identifier
763 ConsumeToken();
764
Chris Lattner6d7e6342006-08-15 03:41:14 +0000765 if (ExpectAndConsume(tok::identifier, diag::err_expected_ident, "",
Chris Lattnerdbb2a462006-08-12 19:26:13 +0000766 tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000767 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000768 } else if (Tok.getKind() == tok::l_square) {
769 // offsetof-member-designator: offsetof-member-design '[' expression ']'
Chris Lattner04132372006-10-16 06:12:55 +0000770 SourceLocation LSquareLoc = ConsumeBracket();
Chris Lattner11124352006-08-12 19:16:08 +0000771 Res = ParseExpression();
772 if (Res.isInvalid) {
773 SkipUntil(tok::r_paren);
774 return Res;
775 }
776
Chris Lattner04f80192006-08-15 04:55:54 +0000777 MatchRHSPunctuation(tok::r_square, LSquareLoc);
Chris Lattner11124352006-08-12 19:16:08 +0000778 } else {
779 break;
780 }
781 }
782 break;
783 case tok::kw___builtin_choose_expr:
784 Res = ParseAssignmentExpression();
785
Chris Lattner6d7e6342006-08-15 03:41:14 +0000786 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000787 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000788
789 Res = ParseAssignmentExpression();
790
Chris Lattner6d7e6342006-08-15 03:41:14 +0000791 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000792 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000793
794 Res = ParseAssignmentExpression();
795 break;
796 case tok::kw___builtin_types_compatible_p:
797 ParseTypeName();
798
Chris Lattner6d7e6342006-08-15 03:41:14 +0000799 if (ExpectAndConsume(tok::comma, diag::err_expected_comma, "",tok::r_paren))
Chris Lattner11124352006-08-12 19:16:08 +0000800 return ExprResult(true);
Chris Lattner11124352006-08-12 19:16:08 +0000801
802 ParseTypeName();
803 break;
804 }
805
Chris Lattner04f80192006-08-15 04:55:54 +0000806 MatchRHSPunctuation(tok::r_paren, LParenLoc);
Chris Lattner11124352006-08-12 19:16:08 +0000807
808 // These can be followed by postfix-expr pieces because they are
809 // primary-expressions.
810 return ParsePostfixExpressionSuffix(Res);
811}
812
Chris Lattnerc951dae2006-08-10 04:23:57 +0000813
Chris Lattner4add4e62006-08-11 01:33:00 +0000814/// ParseParenExpression - This parses the unit that starts with a '(' token,
815/// based on what is allowed by ExprType. The actual thing parsed is returned
816/// in ExprType.
817///
818/// primary-expression: [C99 6.5.1]
Chris Lattnerc951dae2006-08-10 04:23:57 +0000819/// '(' expression ')'
Chris Lattnerf8339772006-08-10 22:01:51 +0000820/// [GNU] '(' compound-statement ')' (if !ParenExprOnly)
821/// postfix-expression: [C99 6.5.2]
822/// '(' type-name ')' '{' initializer-list '}'
823/// '(' type-name ')' '{' initializer-list ',' '}'
Chris Lattner4add4e62006-08-11 01:33:00 +0000824/// cast-expression: [C99 6.5.4]
825/// '(' type-name ')' cast-expression
Chris Lattnerf8339772006-08-10 22:01:51 +0000826///
Chris Lattnere550a4e2006-08-24 06:37:51 +0000827Parser::ExprResult Parser::ParseParenExpression(ParenParseOption &ExprType,
828 TypeTy *&CastTy,
829 SourceLocation &RParenLoc) {
Chris Lattnerc951dae2006-08-10 04:23:57 +0000830 assert(Tok.getKind() == tok::l_paren && "Not a paren expr!");
Chris Lattner04132372006-10-16 06:12:55 +0000831 SourceLocation OpenLoc = ConsumeParen();
Chris Lattner89c50c62006-08-11 06:41:18 +0000832 ExprResult Result(false);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000833 CastTy = 0;
Chris Lattnerc951dae2006-08-10 04:23:57 +0000834
Chris Lattner4add4e62006-08-11 01:33:00 +0000835 if (ExprType >= CompoundStmt && Tok.getKind() == tok::l_brace &&
Chris Lattnerf8339772006-08-10 22:01:51 +0000836 !getLang().NoExtensions) {
837 Diag(Tok, diag::ext_gnu_statement_expr);
838 ParseCompoundStatement();
Chris Lattner4add4e62006-08-11 01:33:00 +0000839 ExprType = CompoundStmt;
Chris Lattner1b926492006-08-23 06:42:10 +0000840 // TODO: Build AST for GNU compound stmt.
Chris Lattner4add4e62006-08-11 01:33:00 +0000841 } else if (ExprType >= CompoundLiteral && isTypeSpecifierQualifier()) {
Chris Lattner6c3f05d2006-08-12 16:54:25 +0000842 // Otherwise, this is a compound literal expression or cast expression.
Chris Lattnere550a4e2006-08-24 06:37:51 +0000843 TypeTy *Ty = ParseTypeName();
Chris Lattnerf5fbd792006-08-10 23:56:11 +0000844
845 // Match the ')'.
Chris Lattner04132372006-10-16 06:12:55 +0000846 if (Tok.getKind() == tok::r_paren)
847 RParenLoc = ConsumeParen();
848 else
Chris Lattnere550a4e2006-08-24 06:37:51 +0000849 MatchRHSPunctuation(tok::r_paren, OpenLoc);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000850
Chris Lattner4add4e62006-08-11 01:33:00 +0000851 if (Tok.getKind() == tok::l_brace) {
Chris Lattner6c3f05d2006-08-12 16:54:25 +0000852 if (!getLang().C99) // Compound literals don't exist in C90.
853 Diag(OpenLoc, diag::ext_c99_compound_literal);
Chris Lattner89c50c62006-08-11 06:41:18 +0000854 Result = ParseInitializer();
Chris Lattner4add4e62006-08-11 01:33:00 +0000855 ExprType = CompoundLiteral;
Chris Lattner1b926492006-08-23 06:42:10 +0000856 // TODO: Build AST for compound literal.
Chris Lattner4add4e62006-08-11 01:33:00 +0000857 } else if (ExprType == CastExpr) {
Chris Lattnere550a4e2006-08-24 06:37:51 +0000858 // Note that this doesn't parse the subsequence cast-expression, it just
859 // returns the parsed type to the callee.
Chris Lattner4add4e62006-08-11 01:33:00 +0000860 ExprType = CastExpr;
Chris Lattnere550a4e2006-08-24 06:37:51 +0000861 CastTy = Ty;
862 return ExprResult(false);
Chris Lattner4add4e62006-08-11 01:33:00 +0000863 } else {
Chris Lattnerf5fbd792006-08-10 23:56:11 +0000864 Diag(Tok, diag::err_expected_lbrace_in_compound_literal);
Chris Lattner89c50c62006-08-11 06:41:18 +0000865 return ExprResult(true);
Chris Lattnerf5fbd792006-08-10 23:56:11 +0000866 }
Chris Lattner89c50c62006-08-11 06:41:18 +0000867 return Result;
Chris Lattner4add4e62006-08-11 01:33:00 +0000868 } else {
Chris Lattner89c50c62006-08-11 06:41:18 +0000869 Result = ParseExpression();
Chris Lattner4add4e62006-08-11 01:33:00 +0000870 ExprType = SimpleExpr;
Chris Lattner1b926492006-08-23 06:42:10 +0000871 if (!Result.isInvalid && Tok.getKind() == tok::r_paren)
872 Result = Actions.ParseParenExpr(OpenLoc, Tok.getLocation(), Result.Val);
Chris Lattnerf8339772006-08-10 22:01:51 +0000873 }
Chris Lattnerc951dae2006-08-10 04:23:57 +0000874
Chris Lattner4564bc12006-08-10 23:14:52 +0000875 // Match the ')'.
Chris Lattner89c50c62006-08-11 06:41:18 +0000876 if (Result.isInvalid)
877 SkipUntil(tok::r_paren);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000878 else {
Chris Lattner04132372006-10-16 06:12:55 +0000879 if (Tok.getKind() == tok::r_paren)
880 RParenLoc = ConsumeParen();
881 else
Chris Lattnere550a4e2006-08-24 06:37:51 +0000882 MatchRHSPunctuation(tok::r_paren, OpenLoc);
Chris Lattnere550a4e2006-08-24 06:37:51 +0000883 }
Chris Lattner1b926492006-08-23 06:42:10 +0000884
Chris Lattner89c50c62006-08-11 06:41:18 +0000885 return Result;
Chris Lattnerc951dae2006-08-10 04:23:57 +0000886}
Chris Lattnerd3e98952006-10-06 05:22:26 +0000887
/// HexDigitValue - Translate a hexadecimal digit character ('0'-'9', 'a'-'f'
/// or 'A'-'F') into its numeric value in the range 0-15.  Any other character
/// yields -1.
static int HexDigitValue(char C) {
  switch (C) {
  case '0': case '1': case '2': case '3': case '4':
  case '5': case '6': case '7': case '8': case '9':
    return C - '0';
  case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
    return 10 + (C - 'a');
  case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
    return 10 + (C - 'A');
  default:
    return -1;
  }
}
896
897/// ParseStringLiteralExpression - This handles the various token types that
898/// form string literals, and also handles string concatenation [C99 5.1.1.2,
899/// translation phase #6].
900///
901/// primary-expression: [C99 6.5.1]
902/// string-literal
903Parser::ExprResult Parser::ParseStringLiteralExpression() {
904 assert(isTokenStringLiteral() && "Not a string literal!");
905
906 // String concat. Note that keywords like __func__ and __FUNCTION__ are not
907 // considered to be strings for concatenation purposes.
908 SmallVector<LexerToken, 4> StringToks;
909
910 // While we're looking at all of the string portions, remember the max
911 // individual token length, computing a bound on the concatenated string
912 // length, and see whether any piece is a wide-string. If any of the string
913 // portions is a wide-string literal, the result is also a wide-string literal
914 // [C99 6.4.5p4].
915 unsigned SizeBound = 0, MaxTokenLength = 0;
916 bool AnyWide = false;
917 do {
918 // The string could be shorter than this if it needs cleaning, but this is a
919 // reasonable bound, which is all we need.
920 SizeBound += Tok.getLength()-2; // -2 for "".
921
922 // Find maximum string piece length.
923 if (Tok.getLength() > MaxTokenLength)
924 MaxTokenLength = Tok.getLength();
925
926 // Remember if we see any wide strings.
927 AnyWide |= Tok.getKind() == tok::wide_string_literal;
928
929 // Remember the string token.
930 StringToks.push_back(Tok);
931 ConsumeStringToken();
932 } while (isTokenStringLiteral());
933
934 // Include space for the null terminator.
935 ++SizeBound;
936
937 // TODO: K&R warning: "traditional C rejects string constant concatenation"
938
Chris Lattner02dffbd2006-10-14 07:50:21 +0000939 // Get the width in bytes of wchar_t. If no wchar_t strings are used, do not
940 // query the target. As such, wchar_tByteWidth is only valid if AnyWide=true.
941 unsigned wchar_tByteWidth = ~0U;
942 if (AnyWide)
943 wchar_tByteWidth=getTargetInfo().getWCharWidth(StringToks[0].getLocation());
Chris Lattnerd3e98952006-10-06 05:22:26 +0000944
945 // The output buffer size needs to be large enough to hold wide characters.
946 // This is a worst-case assumption which basically corresponds to L"" "long".
947 if (AnyWide)
948 SizeBound *= wchar_tByteWidth;
949
950 // Create a temporary buffer to hold the result string data. If it is "big",
951 // use malloc, otherwise use alloca.
952 char *ResultBuf;
953 if (SizeBound > 512)
954 ResultBuf = (char*)malloc(SizeBound);
955 else
956 ResultBuf = (char*)alloca(SizeBound);
957
958 // Likewise, but for each string piece.
959 char *TokenBuf;
960 if (MaxTokenLength > 512)
961 TokenBuf = (char*)malloc(MaxTokenLength);
962 else
963 TokenBuf = (char*)alloca(MaxTokenLength);
964
965 // Loop over all the strings, getting their spelling, and expanding them to
966 // wide strings as appropriate.
967 char *ResultPtr = ResultBuf; // Next byte to fill in.
968
969 for (unsigned i = 0, e = StringToks.size(); i != e; ++i) {
970 const char *ThisTokBuf = TokenBuf;
971 // Get the spelling of the token, which eliminates trigraphs, etc. We know
972 // that ThisTokBuf points to a buffer that is big enough for the whole token
973 // and 'spelled' tokens can only shrink.
974 unsigned ThisTokLen = PP.getSpelling(StringToks[i], ThisTokBuf);
975 const char *ThisTokEnd = ThisTokBuf+ThisTokLen-1; // Skip end quote.
976
977 // TODO: Input character set mapping support.
978
979 // Skip L marker for wide strings.
980 if (ThisTokBuf[0] == 'L') ++ThisTokBuf;
981
982 assert(ThisTokBuf[0] == '"' && "Expected quote, lexer broken?");
983 ++ThisTokBuf;
984
985 while (ThisTokBuf != ThisTokEnd) {
986 // Is this a span of non-escape characters?
987 if (ThisTokBuf[0] != '\\') {
988 const char *InStart = ThisTokBuf;
989 do {
990 ++ThisTokBuf;
991 } while (ThisTokBuf != ThisTokEnd && ThisTokBuf[0] != '\\');
992
993 // Copy the character span over.
994 unsigned Len = ThisTokBuf-InStart;
995 if (!AnyWide) {
996 memcpy(ResultPtr, InStart, Len);
997 ResultPtr += Len;
998 } else {
999 // Note: our internal rep of wide char tokens is always little-endian.
1000 for (; Len; --Len, ++InStart) {
1001 *ResultPtr++ = InStart[0];
1002 // Add zeros at the end.
1003 for (unsigned i = 1, e = wchar_tByteWidth; i != e; ++i)
1004 *ResultPtr++ = 0;
1005 }
1006 }
1007 continue;
1008 }
1009
1010 // Otherwise, this is an escape character. Skip the '\' char.
1011 ++ThisTokBuf;
1012
1013 // We know that this character can't be off the end of the buffer, because
1014 // that would have been \", which would not have been the end of string.
1015 unsigned ResultChar = *ThisTokBuf++;
1016 switch (ResultChar) {
1017 // These map to themselves.
1018 case '\\': case '\'': case '"': case '?': break;
1019
1020 // These have fixed mappings.
1021 case 'a':
1022 // TODO: K&R: the meaning of '\\a' is different in traditional C
1023 ResultChar = 7;
1024 break;
1025 case 'b':
1026 ResultChar = 8;
1027 break;
1028 case 'e':
1029 PP.Diag(StringToks[i], diag::ext_nonstandard_escape, "e");
1030 ResultChar = 27;
1031 break;
1032 case 'f':
1033 ResultChar = 12;
1034 break;
1035 case 'n':
1036 ResultChar = 10;
1037 break;
1038 case 'r':
1039 ResultChar = 13;
1040 break;
1041 case 't':
1042 ResultChar = 9;
1043 break;
1044 case 'v':
1045 ResultChar = 11;
1046 break;
1047
1048 //case 'u': case 'U': // FIXME: UCNs.
1049 case 'x': // Hex escape.
1050 if (ThisTokBuf == ThisTokEnd ||
1051 (ResultChar = HexDigitValue(*ThisTokBuf)) == ~0U) {
1052 PP.Diag(StringToks[i], diag::err_hex_escape_no_digits);
1053 ResultChar = 0;
1054 break;
1055 }
1056 ++ThisTokBuf; // Consumed one hex digit.
1057
1058 assert(0 && "hex escape: unimp!");
1059 break;
1060 case '0': case '1': case '2': case '3':
1061 case '4': case '5': case '6': case '7':
1062 // Octal escapes.
1063 assert(0 && "octal escape: unimp!");
1064 break;
1065
1066 // Otherwise, these are not valid escapes.
1067 case '(': case '{': case '[': case '%':
1068 // GCC accepts these as extensions. We warn about them as such though.
1069 if (!PP.getLangOptions().NoExtensions) {
1070 PP.Diag(StringToks[i], diag::ext_nonstandard_escape,
1071 std::string()+(char)ResultChar);
1072 break;
1073 }
1074 // FALL THROUGH.
1075 default:
1076 if (isgraph(ThisTokBuf[0])) {
1077 PP.Diag(StringToks[i], diag::ext_unknown_escape,
1078 std::string()+(char)ResultChar);
1079 } else {
1080 PP.Diag(StringToks[i], diag::ext_unknown_escape,
1081 "x"+utohexstr(ResultChar));
1082 }
1083 }
1084
1085 // Note: our internal rep of wide char tokens is always little-endian.
Chris Lattner02dffbd2006-10-14 07:50:21 +00001086 *ResultPtr++ = ResultChar & 0xFF;
1087
1088 if (AnyWide) {
1089 for (unsigned i = 1, e = wchar_tByteWidth; i != e; ++i)
1090 *ResultPtr++ = ResultChar >> i*8;
1091 }
Chris Lattnerd3e98952006-10-06 05:22:26 +00001092 }
1093 }
1094
1095 // Add zero terminator.
1096 *ResultPtr = 0;
1097 if (AnyWide) {
1098 for (unsigned i = 1, e = wchar_tByteWidth; i != e; ++i)
1099 *ResultPtr++ = 0;
1100 }
1101
1102 // Hand this off to the Actions.
1103 ExprResult Res = Actions.ParseStringExpr(ResultBuf, ResultPtr-ResultBuf,
1104 AnyWide,
1105 &StringToks[0], StringToks.size());
1106
1107 // If either buffer was heap allocated, release it now.
1108 if (MaxTokenLength > 512) free(TokenBuf);
1109 if (SizeBound > 512) free(ResultBuf);
1110
1111 return Res;
1112}
1113