blob: 1a3543aac77f21d670872af2410b4c5a375b177a [file] [log] [blame]
//===- AsmParser.cpp - Parser for Assembly Files --------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This class implements the parser for assembly files.
//
//===----------------------------------------------------------------------===//
13
14#include "AsmParser.h"
Daniel Dunbar475839e2009-06-29 20:37:27 +000015
16#include "AsmExpr.h"
Daniel Dunbarecc63f82009-06-23 22:01:43 +000017#include "llvm/MC/MCContext.h"
Chris Lattner29dfe7c2009-06-23 18:41:30 +000018#include "llvm/MC/MCInst.h"
Daniel Dunbarecc63f82009-06-23 22:01:43 +000019#include "llvm/MC/MCStreamer.h"
Daniel Dunbardce0f3c2009-06-29 23:43:14 +000020#include "llvm/MC/MCSymbol.h"
Chris Lattnerb0789ed2009-06-21 20:54:55 +000021#include "llvm/Support/SourceMgr.h"
22#include "llvm/Support/raw_ostream.h"
Chris Lattner27aa7d22009-06-21 20:16:42 +000023using namespace llvm;
24
Daniel Dunbar3fb76832009-06-30 00:49:23 +000025void AsmParser::Warning(SMLoc L, const char *Msg) {
26 Lexer.PrintMessage(L, Msg, "warning");
27}
28
Chris Lattner14ee48a2009-06-21 21:22:11 +000029bool AsmParser::Error(SMLoc L, const char *Msg) {
Daniel Dunbar3fb76832009-06-30 00:49:23 +000030 Lexer.PrintMessage(L, Msg, "error");
Chris Lattner14ee48a2009-06-21 21:22:11 +000031 return true;
32}
33
34bool AsmParser::TokError(const char *Msg) {
Daniel Dunbar3fb76832009-06-30 00:49:23 +000035 Lexer.PrintMessage(Lexer.getLoc(), Msg, "error");
Chris Lattner14ee48a2009-06-21 21:22:11 +000036 return true;
37}
38
Chris Lattner27aa7d22009-06-21 20:16:42 +000039bool AsmParser::Run() {
Chris Lattnerb0789ed2009-06-21 20:54:55 +000040 // Prime the lexer.
41 Lexer.Lex();
42
Chris Lattnerb717fb02009-07-02 21:53:43 +000043 bool HadError = false;
Chris Lattnerb0789ed2009-06-21 20:54:55 +000044
Chris Lattnerb717fb02009-07-02 21:53:43 +000045 // While we have input, parse each statement.
46 while (Lexer.isNot(asmtok::Eof)) {
47 if (!ParseStatement()) continue;
48
49 // If we had an error, remember it and recover by skipping to the next line.
50 HadError = true;
51 EatToEndOfStatement();
52 }
53
54 return HadError;
Chris Lattnerb0789ed2009-06-21 20:54:55 +000055}
56
Chris Lattner2cf5f142009-06-22 01:29:09 +000057/// EatToEndOfStatement - Throw away the rest of the line for testing purposes.
58void AsmParser::EatToEndOfStatement() {
59 while (Lexer.isNot(asmtok::EndOfStatement) &&
60 Lexer.isNot(asmtok::Eof))
61 Lexer.Lex();
62
63 // Eat EOL.
64 if (Lexer.is(asmtok::EndOfStatement))
65 Lexer.Lex();
66}
67
Chris Lattnerc4193832009-06-22 05:51:26 +000068
Chris Lattner74ec1a32009-06-22 06:32:03 +000069/// ParseParenExpr - Parse a paren expression and return it.
70/// NOTE: This assumes the leading '(' has already been consumed.
71///
72/// parenexpr ::= expr)
73///
Daniel Dunbar475839e2009-06-29 20:37:27 +000074bool AsmParser::ParseParenExpr(AsmExpr *&Res) {
Chris Lattner74ec1a32009-06-22 06:32:03 +000075 if (ParseExpression(Res)) return true;
76 if (Lexer.isNot(asmtok::RParen))
77 return TokError("expected ')' in parentheses expression");
78 Lexer.Lex();
79 return false;
80}
Chris Lattnerc4193832009-06-22 05:51:26 +000081
Chris Lattner74ec1a32009-06-22 06:32:03 +000082/// ParsePrimaryExpr - Parse a primary expression and return it.
83/// primaryexpr ::= (parenexpr
84/// primaryexpr ::= symbol
85/// primaryexpr ::= number
86/// primaryexpr ::= ~,+,- primaryexpr
Daniel Dunbar475839e2009-06-29 20:37:27 +000087bool AsmParser::ParsePrimaryExpr(AsmExpr *&Res) {
Chris Lattnerc4193832009-06-22 05:51:26 +000088 switch (Lexer.getKind()) {
89 default:
90 return TokError("unknown token in expression");
Daniel Dunbar475839e2009-06-29 20:37:27 +000091 case asmtok::Exclaim:
92 Lexer.Lex(); // Eat the operator.
93 if (ParsePrimaryExpr(Res))
94 return true;
95 Res = new AsmUnaryExpr(AsmUnaryExpr::LNot, Res);
96 return false;
Daniel Dunbardce0f3c2009-06-29 23:43:14 +000097 case asmtok::Identifier: {
Chris Lattnerc4193832009-06-22 05:51:26 +000098 // This is a label, this should be parsed as part of an expression, to
Daniel Dunbar475839e2009-06-29 20:37:27 +000099 // handle things like LFOO+4.
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000100 MCSymbol *Sym = Ctx.GetOrCreateSymbol(Lexer.getCurStrVal());
101
102 // If this is use of an undefined symbol then mark it external.
103 if (!Sym->getSection() && !Ctx.GetSymbolValue(Sym))
104 Sym->setExternal(true);
105
106 Res = new AsmSymbolRefExpr(Sym);
Chris Lattnerc4193832009-06-22 05:51:26 +0000107 Lexer.Lex(); // Eat identifier.
108 return false;
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000109 }
Chris Lattnerc4193832009-06-22 05:51:26 +0000110 case asmtok::IntVal:
Daniel Dunbar475839e2009-06-29 20:37:27 +0000111 Res = new AsmConstantExpr(Lexer.getCurIntVal());
Chris Lattnerc4193832009-06-22 05:51:26 +0000112 Lexer.Lex(); // Eat identifier.
113 return false;
Chris Lattner74ec1a32009-06-22 06:32:03 +0000114 case asmtok::LParen:
115 Lexer.Lex(); // Eat the '('.
116 return ParseParenExpr(Res);
Chris Lattner74ec1a32009-06-22 06:32:03 +0000117 case asmtok::Minus:
118 Lexer.Lex(); // Eat the operator.
Daniel Dunbar475839e2009-06-29 20:37:27 +0000119 if (ParsePrimaryExpr(Res))
120 return true;
121 Res = new AsmUnaryExpr(AsmUnaryExpr::Minus, Res);
122 return false;
123 case asmtok::Plus:
124 Lexer.Lex(); // Eat the operator.
125 if (ParsePrimaryExpr(Res))
126 return true;
127 Res = new AsmUnaryExpr(AsmUnaryExpr::Plus, Res);
128 return false;
129 case asmtok::Tilde:
130 Lexer.Lex(); // Eat the operator.
131 if (ParsePrimaryExpr(Res))
132 return true;
133 Res = new AsmUnaryExpr(AsmUnaryExpr::Not, Res);
134 return false;
Chris Lattnerc4193832009-06-22 05:51:26 +0000135 }
136}
Chris Lattner74ec1a32009-06-22 06:32:03 +0000137
138/// ParseExpression - Parse an expression and return it.
139///
140/// expr ::= expr +,- expr -> lowest.
141/// expr ::= expr |,^,&,! expr -> middle.
142/// expr ::= expr *,/,%,<<,>> expr -> highest.
143/// expr ::= primaryexpr
144///
Daniel Dunbar475839e2009-06-29 20:37:27 +0000145bool AsmParser::ParseExpression(AsmExpr *&Res) {
146 Res = 0;
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000147 return ParsePrimaryExpr(Res) ||
148 ParseBinOpRHS(1, Res);
Chris Lattner74ec1a32009-06-22 06:32:03 +0000149}
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000150
Daniel Dunbar475839e2009-06-29 20:37:27 +0000151bool AsmParser::ParseAbsoluteExpression(int64_t &Res) {
152 AsmExpr *Expr;
153
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000154 SMLoc StartLoc = Lexer.getLoc();
Daniel Dunbar475839e2009-06-29 20:37:27 +0000155 if (ParseExpression(Expr))
156 return true;
157
158 if (!Expr->EvaluateAsAbsolute(Ctx, Res))
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000159 return Error(StartLoc, "expected absolute expression");
Daniel Dunbar475839e2009-06-29 20:37:27 +0000160
161 return false;
162}
163
Daniel Dunbar15d17072009-06-30 01:49:52 +0000164bool AsmParser::ParseRelocatableExpression(MCValue &Res) {
165 AsmExpr *Expr;
166
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000167 SMLoc StartLoc = Lexer.getLoc();
Daniel Dunbar15d17072009-06-30 01:49:52 +0000168 if (ParseExpression(Expr))
169 return true;
170
171 if (!Expr->EvaluateAsRelocatable(Ctx, Res))
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000172 return Error(StartLoc, "expected relocatable expression");
Daniel Dunbar15d17072009-06-30 01:49:52 +0000173
174 return false;
175}
176
Daniel Dunbar2c3f00c2009-07-02 02:09:07 +0000177bool AsmParser::ParseParenRelocatableExpression(MCValue &Res) {
178 AsmExpr *Expr;
179
180 SMLoc StartLoc = Lexer.getLoc();
181 if (ParseParenExpr(Expr))
182 return true;
183
184 if (!Expr->EvaluateAsRelocatable(Ctx, Res))
185 return Error(StartLoc, "expected relocatable expression");
186
187 return false;
188}
189
Daniel Dunbar475839e2009-06-29 20:37:27 +0000190static unsigned getBinOpPrecedence(asmtok::TokKind K,
191 AsmBinaryExpr::Opcode &Kind) {
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000192 switch (K) {
193 default: return 0; // not a binop.
Daniel Dunbar475839e2009-06-29 20:37:27 +0000194
195 // Lowest Precedence: &&, ||
196 case asmtok::AmpAmp:
197 Kind = AsmBinaryExpr::LAnd;
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000198 return 1;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000199 case asmtok::PipePipe:
200 Kind = AsmBinaryExpr::LOr;
201 return 1;
202
203 // Low Precedence: +, -, ==, !=, <>, <, <=, >, >=
204 case asmtok::Plus:
205 Kind = AsmBinaryExpr::Add;
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000206 return 2;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000207 case asmtok::Minus:
208 Kind = AsmBinaryExpr::Sub;
209 return 2;
210 case asmtok::EqualEqual:
211 Kind = AsmBinaryExpr::EQ;
212 return 2;
213 case asmtok::ExclaimEqual:
214 case asmtok::LessGreater:
215 Kind = AsmBinaryExpr::NE;
216 return 2;
217 case asmtok::Less:
218 Kind = AsmBinaryExpr::LT;
219 return 2;
220 case asmtok::LessEqual:
221 Kind = AsmBinaryExpr::LTE;
222 return 2;
223 case asmtok::Greater:
224 Kind = AsmBinaryExpr::GT;
225 return 2;
226 case asmtok::GreaterEqual:
227 Kind = AsmBinaryExpr::GTE;
228 return 2;
229
230 // Intermediate Precedence: |, &, ^
231 //
232 // FIXME: gas seems to support '!' as an infix operator?
233 case asmtok::Pipe:
234 Kind = AsmBinaryExpr::Or;
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000235 return 3;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000236 case asmtok::Caret:
237 Kind = AsmBinaryExpr::Xor;
238 return 3;
239 case asmtok::Amp:
240 Kind = AsmBinaryExpr::And;
241 return 3;
242
243 // Highest Precedence: *, /, %, <<, >>
244 case asmtok::Star:
245 Kind = AsmBinaryExpr::Mul;
246 return 4;
247 case asmtok::Slash:
248 Kind = AsmBinaryExpr::Div;
249 return 4;
250 case asmtok::Percent:
251 Kind = AsmBinaryExpr::Mod;
252 return 4;
253 case asmtok::LessLess:
254 Kind = AsmBinaryExpr::Shl;
255 return 4;
256 case asmtok::GreaterGreater:
257 Kind = AsmBinaryExpr::Shr;
258 return 4;
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000259 }
260}
261
262
263/// ParseBinOpRHS - Parse all binary operators with precedence >= 'Precedence'.
264/// Res contains the LHS of the expression on input.
Daniel Dunbar475839e2009-06-29 20:37:27 +0000265bool AsmParser::ParseBinOpRHS(unsigned Precedence, AsmExpr *&Res) {
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000266 while (1) {
Daniel Dunbar51330632009-06-29 21:14:21 +0000267 AsmBinaryExpr::Opcode Kind = AsmBinaryExpr::Add;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000268 unsigned TokPrec = getBinOpPrecedence(Lexer.getKind(), Kind);
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000269
270 // If the next token is lower precedence than we are allowed to eat, return
271 // successfully with what we ate already.
272 if (TokPrec < Precedence)
273 return false;
274
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000275 Lexer.Lex();
276
277 // Eat the next primary expression.
Daniel Dunbar475839e2009-06-29 20:37:27 +0000278 AsmExpr *RHS;
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000279 if (ParsePrimaryExpr(RHS)) return true;
280
281 // If BinOp binds less tightly with RHS than the operator after RHS, let
282 // the pending operator take RHS as its LHS.
Daniel Dunbar475839e2009-06-29 20:37:27 +0000283 AsmBinaryExpr::Opcode Dummy;
284 unsigned NextTokPrec = getBinOpPrecedence(Lexer.getKind(), Dummy);
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000285 if (TokPrec < NextTokPrec) {
286 if (ParseBinOpRHS(Precedence+1, RHS)) return true;
287 }
288
Daniel Dunbar475839e2009-06-29 20:37:27 +0000289 // Merge LHS and RHS according to operator.
290 Res = new AsmBinaryExpr(Kind, Res, RHS);
Chris Lattner8dfbe6c2009-06-23 05:57:07 +0000291 }
292}
293
Chris Lattnerc4193832009-06-22 05:51:26 +0000294
295
296
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000297/// ParseStatement:
298/// ::= EndOfStatement
Chris Lattner2cf5f142009-06-22 01:29:09 +0000299/// ::= Label* Directive ...Operands... EndOfStatement
300/// ::= Label* Identifier OperandList* EndOfStatement
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000301bool AsmParser::ParseStatement() {
302 switch (Lexer.getKind()) {
303 default:
Chris Lattner14ee48a2009-06-21 21:22:11 +0000304 return TokError("unexpected token at start of statement");
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000305 case asmtok::EndOfStatement:
306 Lexer.Lex();
307 return false;
308 case asmtok::Identifier:
309 break;
310 // TODO: Recurse on local labels etc.
311 }
312
313 // If we have an identifier, handle it as the key symbol.
Chris Lattner2cf5f142009-06-22 01:29:09 +0000314 SMLoc IDLoc = Lexer.getLoc();
Chris Lattnerfaf32c12009-06-24 00:33:19 +0000315 const char *IDVal = Lexer.getCurStrVal();
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000316
317 // Consume the identifier, see what is after it.
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000318 switch (Lexer.Lex()) {
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000319 case asmtok::Colon: {
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000320 // identifier ':' -> Label.
321 Lexer.Lex();
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000322
323 // Diagnose attempt to use a variable as a label.
324 //
325 // FIXME: Diagnostics. Note the location of the definition as a label.
326 // FIXME: This doesn't diagnose assignment to a symbol which has been
327 // implicitly marked as external.
328 MCSymbol *Sym = Ctx.GetOrCreateSymbol(IDVal);
329 if (Sym->getSection())
330 return Error(IDLoc, "invalid symbol redefinition");
331 if (Ctx.GetSymbolValue(Sym))
332 return Error(IDLoc, "symbol already used as assembler variable");
Chris Lattnerc69485e2009-06-24 04:31:49 +0000333
334 // Since we saw a label, create a symbol and emit it.
335 // FIXME: If the label starts with L it is an assembler temporary label.
336 // Why does the client of this api need to know this?
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000337 Out.EmitLabel(Sym);
338
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000339 return ParseStatement();
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000340 }
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000341
342 case asmtok::Equal:
343 // identifier '=' ... -> assignment statement
344 Lexer.Lex();
345
346 return ParseAssignment(IDVal, false);
347
348 default: // Normal instruction or directive.
349 break;
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000350 }
351
352 // Otherwise, we have a normal instruction or directive.
Chris Lattner2cf5f142009-06-22 01:29:09 +0000353 if (IDVal[0] == '.') {
Chris Lattner529fb542009-06-24 05:13:15 +0000354 // FIXME: This should be driven based on a hash lookup and callback.
Chris Lattner9a023f72009-06-24 04:43:34 +0000355 if (!strcmp(IDVal, ".section"))
Chris Lattner529fb542009-06-24 05:13:15 +0000356 return ParseDirectiveDarwinSection();
357 if (!strcmp(IDVal, ".text"))
358 // FIXME: This changes behavior based on the -static flag to the
359 // assembler.
360 return ParseDirectiveSectionSwitch("__TEXT,__text",
361 "regular,pure_instructions");
362 if (!strcmp(IDVal, ".const"))
363 return ParseDirectiveSectionSwitch("__TEXT,__const");
364 if (!strcmp(IDVal, ".static_const"))
365 return ParseDirectiveSectionSwitch("__TEXT,__static_const");
366 if (!strcmp(IDVal, ".cstring"))
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000367 return ParseDirectiveSectionSwitch("__TEXT,__cstring",
368 "cstring_literals");
Chris Lattner529fb542009-06-24 05:13:15 +0000369 if (!strcmp(IDVal, ".literal4"))
370 return ParseDirectiveSectionSwitch("__TEXT,__literal4", "4byte_literals");
371 if (!strcmp(IDVal, ".literal8"))
372 return ParseDirectiveSectionSwitch("__TEXT,__literal8", "8byte_literals");
373 if (!strcmp(IDVal, ".literal16"))
374 return ParseDirectiveSectionSwitch("__TEXT,__literal16",
375 "16byte_literals");
376 if (!strcmp(IDVal, ".constructor"))
377 return ParseDirectiveSectionSwitch("__TEXT,__constructor");
378 if (!strcmp(IDVal, ".destructor"))
379 return ParseDirectiveSectionSwitch("__TEXT,__destructor");
380 if (!strcmp(IDVal, ".fvmlib_init0"))
381 return ParseDirectiveSectionSwitch("__TEXT,__fvmlib_init0");
382 if (!strcmp(IDVal, ".fvmlib_init1"))
383 return ParseDirectiveSectionSwitch("__TEXT,__fvmlib_init1");
384 if (!strcmp(IDVal, ".symbol_stub")) // FIXME: Different on PPC.
385 return ParseDirectiveSectionSwitch("__IMPORT,__jump_table,symbol_stubs",
386 "self_modifying_code+pure_instructions,5");
387 // FIXME: .picsymbol_stub on PPC.
388 if (!strcmp(IDVal, ".data"))
389 return ParseDirectiveSectionSwitch("__DATA,__data");
390 if (!strcmp(IDVal, ".static_data"))
391 return ParseDirectiveSectionSwitch("__DATA,__static_data");
392 if (!strcmp(IDVal, ".non_lazy_symbol_pointer"))
393 return ParseDirectiveSectionSwitch("__DATA,__nl_symbol_pointer",
394 "non_lazy_symbol_pointers");
395 if (!strcmp(IDVal, ".lazy_symbol_pointer"))
396 return ParseDirectiveSectionSwitch("__DATA,__la_symbol_pointer",
397 "lazy_symbol_pointers");
398 if (!strcmp(IDVal, ".dyld"))
399 return ParseDirectiveSectionSwitch("__DATA,__dyld");
400 if (!strcmp(IDVal, ".mod_init_func"))
401 return ParseDirectiveSectionSwitch("__DATA,__mod_init_func",
402 "mod_init_funcs");
403 if (!strcmp(IDVal, ".mod_term_func"))
404 return ParseDirectiveSectionSwitch("__DATA,__mod_term_func",
405 "mod_term_funcs");
406 if (!strcmp(IDVal, ".const_data"))
407 return ParseDirectiveSectionSwitch("__DATA,__const", "regular");
408
409
410 // FIXME: Verify attributes on sections.
411 if (!strcmp(IDVal, ".objc_class"))
412 return ParseDirectiveSectionSwitch("__OBJC,__class");
413 if (!strcmp(IDVal, ".objc_meta_class"))
414 return ParseDirectiveSectionSwitch("__OBJC,__meta_class");
415 if (!strcmp(IDVal, ".objc_cat_cls_meth"))
416 return ParseDirectiveSectionSwitch("__OBJC,__cat_cls_meth");
417 if (!strcmp(IDVal, ".objc_cat_inst_meth"))
418 return ParseDirectiveSectionSwitch("__OBJC,__cat_inst_meth");
419 if (!strcmp(IDVal, ".objc_protocol"))
420 return ParseDirectiveSectionSwitch("__OBJC,__protocol");
421 if (!strcmp(IDVal, ".objc_string_object"))
422 return ParseDirectiveSectionSwitch("__OBJC,__string_object");
423 if (!strcmp(IDVal, ".objc_cls_meth"))
424 return ParseDirectiveSectionSwitch("__OBJC,__cls_meth");
425 if (!strcmp(IDVal, ".objc_inst_meth"))
426 return ParseDirectiveSectionSwitch("__OBJC,__inst_meth");
427 if (!strcmp(IDVal, ".objc_cls_refs"))
428 return ParseDirectiveSectionSwitch("__OBJC,__cls_refs");
429 if (!strcmp(IDVal, ".objc_message_refs"))
430 return ParseDirectiveSectionSwitch("__OBJC,__message_refs");
431 if (!strcmp(IDVal, ".objc_symbols"))
432 return ParseDirectiveSectionSwitch("__OBJC,__symbols");
433 if (!strcmp(IDVal, ".objc_category"))
434 return ParseDirectiveSectionSwitch("__OBJC,__category");
435 if (!strcmp(IDVal, ".objc_class_vars"))
436 return ParseDirectiveSectionSwitch("__OBJC,__class_vars");
437 if (!strcmp(IDVal, ".objc_instance_vars"))
438 return ParseDirectiveSectionSwitch("__OBJC,__instance_vars");
439 if (!strcmp(IDVal, ".objc_module_info"))
440 return ParseDirectiveSectionSwitch("__OBJC,__module_info");
441 if (!strcmp(IDVal, ".objc_class_names"))
442 return ParseDirectiveSectionSwitch("__TEXT,__cstring","cstring_literals");
443 if (!strcmp(IDVal, ".objc_meth_var_types"))
444 return ParseDirectiveSectionSwitch("__TEXT,__cstring","cstring_literals");
445 if (!strcmp(IDVal, ".objc_meth_var_names"))
446 return ParseDirectiveSectionSwitch("__TEXT,__cstring","cstring_literals");
447 if (!strcmp(IDVal, ".objc_selector_strs"))
448 return ParseDirectiveSectionSwitch("__OBJC,__selector_strs");
Chris Lattner9a023f72009-06-24 04:43:34 +0000449
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000450 // Assembler features
451 if (!strcmp(IDVal, ".set"))
452 return ParseDirectiveSet();
453
Daniel Dunbara0d14262009-06-24 23:30:00 +0000454 // Data directives
455
456 if (!strcmp(IDVal, ".ascii"))
457 return ParseDirectiveAscii(false);
458 if (!strcmp(IDVal, ".asciz"))
459 return ParseDirectiveAscii(true);
460
461 // FIXME: Target hooks for size? Also for "word", "hword".
462 if (!strcmp(IDVal, ".byte"))
463 return ParseDirectiveValue(1);
464 if (!strcmp(IDVal, ".short"))
465 return ParseDirectiveValue(2);
466 if (!strcmp(IDVal, ".long"))
467 return ParseDirectiveValue(4);
468 if (!strcmp(IDVal, ".quad"))
469 return ParseDirectiveValue(8);
Daniel Dunbarc29dfa72009-06-29 23:46:59 +0000470
471 // FIXME: Target hooks for IsPow2.
472 if (!strcmp(IDVal, ".align"))
473 return ParseDirectiveAlign(/*IsPow2=*/true, /*ExprSize=*/1);
474 if (!strcmp(IDVal, ".align32"))
475 return ParseDirectiveAlign(/*IsPow2=*/true, /*ExprSize=*/4);
476 if (!strcmp(IDVal, ".balign"))
477 return ParseDirectiveAlign(/*IsPow2=*/false, /*ExprSize=*/1);
478 if (!strcmp(IDVal, ".balignw"))
479 return ParseDirectiveAlign(/*IsPow2=*/false, /*ExprSize=*/2);
480 if (!strcmp(IDVal, ".balignl"))
481 return ParseDirectiveAlign(/*IsPow2=*/false, /*ExprSize=*/4);
482 if (!strcmp(IDVal, ".p2align"))
483 return ParseDirectiveAlign(/*IsPow2=*/true, /*ExprSize=*/1);
484 if (!strcmp(IDVal, ".p2alignw"))
485 return ParseDirectiveAlign(/*IsPow2=*/true, /*ExprSize=*/2);
486 if (!strcmp(IDVal, ".p2alignl"))
487 return ParseDirectiveAlign(/*IsPow2=*/true, /*ExprSize=*/4);
488
Daniel Dunbarc238b582009-06-25 22:44:51 +0000489 if (!strcmp(IDVal, ".org"))
490 return ParseDirectiveOrg();
Daniel Dunbarc29dfa72009-06-29 23:46:59 +0000491
492 if (!strcmp(IDVal, ".fill"))
493 return ParseDirectiveFill();
Daniel Dunbara0d14262009-06-24 23:30:00 +0000494 if (!strcmp(IDVal, ".space"))
495 return ParseDirectiveSpace();
496
Daniel Dunbard7b267b2009-06-30 00:33:19 +0000497 // Symbol attribute directives
498 if (!strcmp(IDVal, ".globl") || !strcmp(IDVal, ".global"))
499 return ParseDirectiveSymbolAttribute(MCStreamer::Global);
500 if (!strcmp(IDVal, ".hidden"))
501 return ParseDirectiveSymbolAttribute(MCStreamer::Hidden);
502 if (!strcmp(IDVal, ".indirect_symbol"))
503 return ParseDirectiveSymbolAttribute(MCStreamer::IndirectSymbol);
504 if (!strcmp(IDVal, ".internal"))
505 return ParseDirectiveSymbolAttribute(MCStreamer::Internal);
506 if (!strcmp(IDVal, ".lazy_reference"))
507 return ParseDirectiveSymbolAttribute(MCStreamer::LazyReference);
508 if (!strcmp(IDVal, ".no_dead_strip"))
509 return ParseDirectiveSymbolAttribute(MCStreamer::NoDeadStrip);
510 if (!strcmp(IDVal, ".private_extern"))
511 return ParseDirectiveSymbolAttribute(MCStreamer::PrivateExtern);
512 if (!strcmp(IDVal, ".protected"))
513 return ParseDirectiveSymbolAttribute(MCStreamer::Protected);
514 if (!strcmp(IDVal, ".reference"))
515 return ParseDirectiveSymbolAttribute(MCStreamer::Reference);
516 if (!strcmp(IDVal, ".weak"))
517 return ParseDirectiveSymbolAttribute(MCStreamer::Weak);
518 if (!strcmp(IDVal, ".weak_definition"))
519 return ParseDirectiveSymbolAttribute(MCStreamer::WeakDefinition);
520 if (!strcmp(IDVal, ".weak_reference"))
521 return ParseDirectiveSymbolAttribute(MCStreamer::WeakReference);
522
Chris Lattner4e4db7a2009-07-07 20:30:46 +0000523 if (!strcmp(IDVal, ".comm"))
524 return ParseDirectiveComm();
525
Daniel Dunbar3fb76832009-06-30 00:49:23 +0000526 Warning(IDLoc, "ignoring directive for now");
Chris Lattner2cf5f142009-06-22 01:29:09 +0000527 EatToEndOfStatement();
528 return false;
529 }
Chris Lattnerb0789ed2009-06-21 20:54:55 +0000530
Chris Lattner29dfe7c2009-06-23 18:41:30 +0000531 MCInst Inst;
Daniel Dunbard9627e12009-06-30 23:38:38 +0000532 if (ParseX86InstOperands(IDVal, Inst))
Chris Lattner29dfe7c2009-06-23 18:41:30 +0000533 return true;
Chris Lattner2cf5f142009-06-22 01:29:09 +0000534
535 if (Lexer.isNot(asmtok::EndOfStatement))
Chris Lattner9a023f72009-06-24 04:43:34 +0000536 return TokError("unexpected token in argument list");
Chris Lattner2cf5f142009-06-22 01:29:09 +0000537
538 // Eat the end of statement marker.
539 Lexer.Lex();
540
541 // Instruction is good, process it.
Daniel Dunbar0eebb052009-07-01 06:35:48 +0000542 Out.EmitInstruction(Inst);
Chris Lattner2cf5f142009-06-22 01:29:09 +0000543
544 // Skip to end of line for now.
Chris Lattner27aa7d22009-06-21 20:16:42 +0000545 return false;
546}
Chris Lattner9a023f72009-06-24 04:43:34 +0000547
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000548bool AsmParser::ParseAssignment(const char *Name, bool IsDotSet) {
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000549 // FIXME: Use better location, we should use proper tokens.
550 SMLoc EqualLoc = Lexer.getLoc();
551
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000552 MCValue Value;
553 if (ParseRelocatableExpression(Value))
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000554 return true;
555
556 if (Lexer.isNot(asmtok::EndOfStatement))
557 return TokError("unexpected token in assignment");
558
559 // Eat the end of statement marker.
560 Lexer.Lex();
561
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000562 // Diagnose assignment to a label.
563 //
564 // FIXME: Diagnostics. Note the location of the definition as a label.
565 // FIXME: This doesn't diagnose assignment to a symbol which has been
566 // implicitly marked as external.
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000567 // FIXME: Handle '.'.
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000568 // FIXME: Diagnose assignment to protected identifier (e.g., register name).
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000569 MCSymbol *Sym = Ctx.GetOrCreateSymbol(Name);
Daniel Dunbardce0f3c2009-06-29 23:43:14 +0000570 if (Sym->getSection())
571 return Error(EqualLoc, "invalid assignment to symbol emitted as a label");
572 if (Sym->isExternal())
573 return Error(EqualLoc, "invalid assignment to external symbol");
574
575 // Do the assignment.
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000576 Out.EmitAssignment(Sym, Value, IsDotSet);
Daniel Dunbar8f780cd2009-06-25 21:56:11 +0000577
578 return false;
579}
580
581/// ParseDirectiveSet:
582/// ::= .set identifier ',' expression
583bool AsmParser::ParseDirectiveSet() {
584 if (Lexer.isNot(asmtok::Identifier))
585 return TokError("expected identifier after '.set' directive");
586
587 const char *Name = Lexer.getCurStrVal();
588
589 if (Lexer.Lex() != asmtok::Comma)
590 return TokError("unexpected token in '.set'");
591 Lexer.Lex();
592
593 return ParseAssignment(Name, true);
594}
595
Chris Lattner9a023f72009-06-24 04:43:34 +0000596/// ParseDirectiveSection:
Chris Lattner529fb542009-06-24 05:13:15 +0000597/// ::= .section identifier (',' identifier)*
598/// FIXME: This should actually parse out the segment, section, attributes and
599/// sizeof_stub fields.
600bool AsmParser::ParseDirectiveDarwinSection() {
Chris Lattner9a023f72009-06-24 04:43:34 +0000601 if (Lexer.isNot(asmtok::Identifier))
602 return TokError("expected identifier after '.section' directive");
603
604 std::string Section = Lexer.getCurStrVal();
605 Lexer.Lex();
606
607 // Accept a comma separated list of modifiers.
608 while (Lexer.is(asmtok::Comma)) {
609 Lexer.Lex();
610
611 if (Lexer.isNot(asmtok::Identifier))
612 return TokError("expected identifier in '.section' directive");
613 Section += ',';
614 Section += Lexer.getCurStrVal();
615 Lexer.Lex();
616 }
617
618 if (Lexer.isNot(asmtok::EndOfStatement))
619 return TokError("unexpected token in '.section' directive");
620 Lexer.Lex();
621
622 Out.SwitchSection(Ctx.GetSection(Section.c_str()));
623 return false;
624}
625
Chris Lattner529fb542009-06-24 05:13:15 +0000626bool AsmParser::ParseDirectiveSectionSwitch(const char *Section,
627 const char *Directives) {
628 if (Lexer.isNot(asmtok::EndOfStatement))
629 return TokError("unexpected token in section switching directive");
630 Lexer.Lex();
631
632 std::string SectionStr = Section;
633 if (Directives && Directives[0]) {
634 SectionStr += ",";
635 SectionStr += Directives;
636 }
637
638 Out.SwitchSection(Ctx.GetSection(Section));
639 return false;
640}
Daniel Dunbara0d14262009-06-24 23:30:00 +0000641
642/// ParseDirectiveAscii:
Daniel Dunbar475839e2009-06-29 20:37:27 +0000643/// ::= ( .ascii | .asciz ) [ "string" ( , "string" )* ]
Daniel Dunbara0d14262009-06-24 23:30:00 +0000644bool AsmParser::ParseDirectiveAscii(bool ZeroTerminated) {
645 if (Lexer.isNot(asmtok::EndOfStatement)) {
646 for (;;) {
647 if (Lexer.isNot(asmtok::String))
648 return TokError("expected string in '.ascii' or '.asciz' directive");
649
650 // FIXME: This shouldn't use a const char* + strlen, the string could have
651 // embedded nulls.
652 // FIXME: Should have accessor for getting string contents.
653 const char *Str = Lexer.getCurStrVal();
654 Out.EmitBytes(Str + 1, strlen(Str) - 2);
655 if (ZeroTerminated)
656 Out.EmitBytes("\0", 1);
657
658 Lexer.Lex();
659
660 if (Lexer.is(asmtok::EndOfStatement))
661 break;
662
663 if (Lexer.isNot(asmtok::Comma))
664 return TokError("unexpected token in '.ascii' or '.asciz' directive");
665 Lexer.Lex();
666 }
667 }
668
669 Lexer.Lex();
670 return false;
671}
672
673/// ParseDirectiveValue
674/// ::= (.byte | .short | ... ) [ expression (, expression)* ]
675bool AsmParser::ParseDirectiveValue(unsigned Size) {
676 if (Lexer.isNot(asmtok::EndOfStatement)) {
677 for (;;) {
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000678 MCValue Expr;
679 if (ParseRelocatableExpression(Expr))
Daniel Dunbara0d14262009-06-24 23:30:00 +0000680 return true;
681
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000682 Out.EmitValue(Expr, Size);
Daniel Dunbara0d14262009-06-24 23:30:00 +0000683
684 if (Lexer.is(asmtok::EndOfStatement))
685 break;
686
687 // FIXME: Improve diagnostic.
688 if (Lexer.isNot(asmtok::Comma))
689 return TokError("unexpected token in directive");
690 Lexer.Lex();
691 }
692 }
693
694 Lexer.Lex();
695 return false;
696}
697
698/// ParseDirectiveSpace
699/// ::= .space expression [ , expression ]
700bool AsmParser::ParseDirectiveSpace() {
701 int64_t NumBytes;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000702 if (ParseAbsoluteExpression(NumBytes))
Daniel Dunbara0d14262009-06-24 23:30:00 +0000703 return true;
704
705 int64_t FillExpr = 0;
706 bool HasFillExpr = false;
707 if (Lexer.isNot(asmtok::EndOfStatement)) {
708 if (Lexer.isNot(asmtok::Comma))
709 return TokError("unexpected token in '.space' directive");
710 Lexer.Lex();
711
Daniel Dunbar475839e2009-06-29 20:37:27 +0000712 if (ParseAbsoluteExpression(FillExpr))
Daniel Dunbara0d14262009-06-24 23:30:00 +0000713 return true;
714
715 HasFillExpr = true;
716
717 if (Lexer.isNot(asmtok::EndOfStatement))
718 return TokError("unexpected token in '.space' directive");
719 }
720
721 Lexer.Lex();
722
723 if (NumBytes <= 0)
724 return TokError("invalid number of bytes in '.space' directive");
725
726 // FIXME: Sometimes the fill expr is 'nop' if it isn't supplied, instead of 0.
727 for (uint64_t i = 0, e = NumBytes; i != e; ++i)
728 Out.EmitValue(MCValue::get(FillExpr), 1);
729
730 return false;
731}
732
733/// ParseDirectiveFill
734/// ::= .fill expression , expression , expression
735bool AsmParser::ParseDirectiveFill() {
736 int64_t NumValues;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000737 if (ParseAbsoluteExpression(NumValues))
Daniel Dunbara0d14262009-06-24 23:30:00 +0000738 return true;
739
740 if (Lexer.isNot(asmtok::Comma))
741 return TokError("unexpected token in '.fill' directive");
742 Lexer.Lex();
743
744 int64_t FillSize;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000745 if (ParseAbsoluteExpression(FillSize))
Daniel Dunbara0d14262009-06-24 23:30:00 +0000746 return true;
747
748 if (Lexer.isNot(asmtok::Comma))
749 return TokError("unexpected token in '.fill' directive");
750 Lexer.Lex();
751
752 int64_t FillExpr;
Daniel Dunbar475839e2009-06-29 20:37:27 +0000753 if (ParseAbsoluteExpression(FillExpr))
Daniel Dunbara0d14262009-06-24 23:30:00 +0000754 return true;
755
756 if (Lexer.isNot(asmtok::EndOfStatement))
757 return TokError("unexpected token in '.fill' directive");
758
759 Lexer.Lex();
760
761 if (FillSize != 1 && FillSize != 2 && FillSize != 4)
762 return TokError("invalid '.fill' size, expected 1, 2, or 4");
763
764 for (uint64_t i = 0, e = NumValues; i != e; ++i)
765 Out.EmitValue(MCValue::get(FillExpr), FillSize);
766
767 return false;
768}
Daniel Dunbarc238b582009-06-25 22:44:51 +0000769
770/// ParseDirectiveOrg
771/// ::= .org expression [ , expression ]
772bool AsmParser::ParseDirectiveOrg() {
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000773 MCValue Offset;
774 if (ParseRelocatableExpression(Offset))
Daniel Dunbarc238b582009-06-25 22:44:51 +0000775 return true;
776
777 // Parse optional fill expression.
778 int64_t FillExpr = 0;
779 if (Lexer.isNot(asmtok::EndOfStatement)) {
780 if (Lexer.isNot(asmtok::Comma))
781 return TokError("unexpected token in '.org' directive");
782 Lexer.Lex();
783
Daniel Dunbar475839e2009-06-29 20:37:27 +0000784 if (ParseAbsoluteExpression(FillExpr))
Daniel Dunbarc238b582009-06-25 22:44:51 +0000785 return true;
786
787 if (Lexer.isNot(asmtok::EndOfStatement))
788 return TokError("unexpected token in '.org' directive");
789 }
790
791 Lexer.Lex();
Daniel Dunbarf4b830f2009-06-30 02:10:03 +0000792
793 // FIXME: Only limited forms of relocatable expressions are accepted here, it
794 // has to be relative to the current section.
795 Out.EmitValueToOffset(Offset, FillExpr);
Daniel Dunbarc238b582009-06-25 22:44:51 +0000796
797 return false;
798}
Daniel Dunbarc29dfa72009-06-29 23:46:59 +0000799
800/// ParseDirectiveAlign
801/// ::= {.align, ...} expression [ , expression [ , expression ]]
802bool AsmParser::ParseDirectiveAlign(bool IsPow2, unsigned ValueSize) {
803 int64_t Alignment;
804 if (ParseAbsoluteExpression(Alignment))
805 return true;
806
807 SMLoc MaxBytesLoc;
808 bool HasFillExpr = false;
809 int64_t FillExpr = 0;
810 int64_t MaxBytesToFill = 0;
811 if (Lexer.isNot(asmtok::EndOfStatement)) {
812 if (Lexer.isNot(asmtok::Comma))
813 return TokError("unexpected token in directive");
814 Lexer.Lex();
815
816 // The fill expression can be omitted while specifying a maximum number of
817 // alignment bytes, e.g:
818 // .align 3,,4
819 if (Lexer.isNot(asmtok::Comma)) {
820 HasFillExpr = true;
821 if (ParseAbsoluteExpression(FillExpr))
822 return true;
823 }
824
825 if (Lexer.isNot(asmtok::EndOfStatement)) {
826 if (Lexer.isNot(asmtok::Comma))
827 return TokError("unexpected token in directive");
828 Lexer.Lex();
829
830 MaxBytesLoc = Lexer.getLoc();
831 if (ParseAbsoluteExpression(MaxBytesToFill))
832 return true;
833
834 if (Lexer.isNot(asmtok::EndOfStatement))
835 return TokError("unexpected token in directive");
836 }
837 }
838
839 Lexer.Lex();
840
841 if (!HasFillExpr) {
842 // FIXME: Sometimes fill with nop.
843 FillExpr = 0;
844 }
845
846 // Compute alignment in bytes.
847 if (IsPow2) {
848 // FIXME: Diagnose overflow.
849 Alignment = 1 << Alignment;
850 }
851
852 // Diagnose non-sensical max bytes to fill.
853 if (MaxBytesLoc.isValid()) {
854 if (MaxBytesToFill < 1) {
Daniel Dunbar3fb76832009-06-30 00:49:23 +0000855 Warning(MaxBytesLoc, "alignment directive can never be satisfied in this "
856 "many bytes, ignoring");
Daniel Dunbarc29dfa72009-06-29 23:46:59 +0000857 return false;
858 }
859
860 if (MaxBytesToFill >= Alignment) {
Daniel Dunbar3fb76832009-06-30 00:49:23 +0000861 Warning(MaxBytesLoc, "maximum bytes expression exceeds alignment and "
862 "has no effect");
Daniel Dunbarc29dfa72009-06-29 23:46:59 +0000863 MaxBytesToFill = 0;
864 }
865 }
866
867 // FIXME: Target specific behavior about how the "extra" bytes are filled.
868 Out.EmitValueToAlignment(Alignment, FillExpr, ValueSize, MaxBytesToFill);
869
870 return false;
871}
872
Daniel Dunbard7b267b2009-06-30 00:33:19 +0000873/// ParseDirectiveSymbolAttribute
874/// ::= { ".globl", ".weak", ... } [ identifier ( , identifier )* ]
875bool AsmParser::ParseDirectiveSymbolAttribute(MCStreamer::SymbolAttr Attr) {
876 if (Lexer.isNot(asmtok::EndOfStatement)) {
877 for (;;) {
878 if (Lexer.isNot(asmtok::Identifier))
879 return TokError("expected identifier in directive");
880
881 MCSymbol *Sym = Ctx.GetOrCreateSymbol(Lexer.getCurStrVal());
882 Lexer.Lex();
883
884 // If this is use of an undefined symbol then mark it external.
885 if (!Sym->getSection() && !Ctx.GetSymbolValue(Sym))
886 Sym->setExternal(true);
887
888 Out.EmitSymbolAttribute(Sym, Attr);
889
890 if (Lexer.is(asmtok::EndOfStatement))
891 break;
892
893 if (Lexer.isNot(asmtok::Comma))
894 return TokError("unexpected token in directive");
895 Lexer.Lex();
896 }
897 }
898
899 Lexer.Lex();
900 return false;
901}
Chris Lattner4e4db7a2009-07-07 20:30:46 +0000902
903/// ParseDirectiveComm
904/// ::= .comm identifier , size_expression [ , align_expression ]
905bool AsmParser::ParseDirectiveComm() {
906 if (Lexer.isNot(asmtok::Identifier))
907 return TokError("expected identifier in directive");
908
909 // handle the identifier as the key symbol.
910 SMLoc IDLoc = Lexer.getLoc();
911 MCSymbol *Sym = Ctx.GetOrCreateSymbol(Lexer.getCurStrVal());
912 Lexer.Lex();
913
914 if (Lexer.isNot(asmtok::Comma))
915 return TokError("unexpected token in directive");
916 Lexer.Lex();
917
918 int64_t Size;
919 SMLoc SizeLoc = Lexer.getLoc();
920 if (ParseAbsoluteExpression(Size))
921 return true;
922
923 int64_t Pow2Alignment = 0;
924 SMLoc Pow2AlignmentLoc;
925 if (Lexer.is(asmtok::Comma)) {
926 Lexer.Lex();
927 Pow2AlignmentLoc = Lexer.getLoc();
928 if (ParseAbsoluteExpression(Pow2Alignment))
929 return true;
930 }
931
932 if (Lexer.isNot(asmtok::EndOfStatement))
933 return TokError("unexpected token in '.comm' directive");
934
935 Lexer.Lex();
936
937 // NOTE: a size of zero should create a undefined symbol
938 if (Size < 0)
939 return Error(SizeLoc, "invalid '.comm' size, can't be less than zero");
940
941 // NOTE: The alignment in the directive is a power of 2 value, the assember
942 // may internally end up wanting an alignment in bytes.
943 // FIXME: Diagnose overflow.
944 if (Pow2Alignment < 0)
945 return Error(Pow2AlignmentLoc, "invalid '.comm' alignment, can't be less "
946 "than zero");
947
948 // TODO: Symbol must be undefined or it is a error to re-defined the symbol
949 if (Sym->getSection() || Ctx.GetSymbolValue(Sym))
950 return Error(IDLoc, "invalid symbol redefinition");
951
952 // TODO: Symbol to be made into a common with this Size and Pow2Alignment
953
954 Out.EmitCommonSymbol(Sym, Size, Pow2Alignment);
955
956 return false;
957}