blob: 1950c1da195ee39b0d33ffff06cbdccadc1eca99 [file] [log] [blame]
Daniel Dunbar71475772009-07-17 20:42:00 +00001//===-- X86AsmParser.cpp - Parse X86 assembly to MCInst instructions ------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Chris Lattnerf29c0b62010-01-14 22:21:20 +000010#include "llvm/Target/TargetAsmParser.h"
Daniel Dunbar67038c12009-07-18 23:03:22 +000011#include "X86.h"
Daniel Dunbareefe8612010-07-19 05:44:09 +000012#include "X86Subtarget.h"
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +000013#include "llvm/ADT/SmallString.h"
Daniel Dunbar2b11c7d2009-07-20 20:01:54 +000014#include "llvm/ADT/SmallVector.h"
Daniel Dunbar3e0c9792010-02-10 21:19:28 +000015#include "llvm/ADT/StringSwitch.h"
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000016#include "llvm/ADT/Twine.h"
Kevin Enderbyce4bec82009-09-10 20:51:44 +000017#include "llvm/MC/MCStreamer.h"
Daniel Dunbar73da11e2009-08-31 08:08:38 +000018#include "llvm/MC/MCExpr.h"
Daniel Dunbarb6d6aa22009-07-31 02:32:59 +000019#include "llvm/MC/MCInst.h"
Chris Lattner00646cf2010-01-22 01:44:57 +000020#include "llvm/MC/MCParser/MCAsmLexer.h"
21#include "llvm/MC/MCParser/MCAsmParser.h"
22#include "llvm/MC/MCParser/MCParsedAsmOperand.h"
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000023#include "llvm/Support/SourceMgr.h"
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +000024#include "llvm/Support/raw_ostream.h"
Daniel Dunbar71475772009-07-17 20:42:00 +000025#include "llvm/Target/TargetRegistry.h"
26#include "llvm/Target/TargetAsmParser.h"
27using namespace llvm;
28
29namespace {
Benjamin Kramerb60210e2009-07-31 11:35:26 +000030struct X86Operand;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000031
32class X86ATTAsmParser : public TargetAsmParser {
33 MCAsmParser &Parser;
Daniel Dunbar419197c2010-07-19 00:33:49 +000034 TargetMachine &TM;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000035
Daniel Dunbar63ec0932010-03-18 20:06:02 +000036protected:
37 unsigned Is64Bit : 1;
38
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000039private:
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000040 MCAsmParser &getParser() const { return Parser; }
41
42 MCAsmLexer &getLexer() const { return Parser.getLexer(); }
43
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000044 bool Error(SMLoc L, const Twine &Msg) { return Parser.Error(L, Msg); }
45
Chris Lattner0c2538f2010-01-15 18:51:29 +000046 bool ParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc);
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000047
Chris Lattnera2bbb7c2010-01-15 18:44:13 +000048 X86Operand *ParseOperand();
Chris Lattnerb9270732010-04-17 18:56:34 +000049 X86Operand *ParseMemOperand(unsigned SegReg, SMLoc StartLoc);
Kevin Enderbyce4bec82009-09-10 20:51:44 +000050
51 bool ParseDirectiveWord(unsigned Size, SMLoc L);
52
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +000053 bool MatchInstruction(SMLoc IDLoc,
54 const SmallVectorImpl<MCParsedAsmOperand*> &Operands,
Daniel Dunbare10787e2009-08-07 08:26:05 +000055 MCInst &Inst);
56
Daniel Dunbareefe8612010-07-19 05:44:09 +000057 /// @name Auto-generated Matcher Functions
58 /// {
Chris Lattner3e4582a2010-09-06 19:11:01 +000059
60#define GET_ASSEMBLER_HEADER
61#include "X86GenAsmMatcher.inc"
62
Daniel Dunbar00331992009-07-29 00:02:19 +000063 /// }
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000064
65public:
Daniel Dunbar419197c2010-07-19 00:33:49 +000066 X86ATTAsmParser(const Target &T, MCAsmParser &_Parser, TargetMachine &TM)
Daniel Dunbareefe8612010-07-19 05:44:09 +000067 : TargetAsmParser(T), Parser(_Parser), TM(TM) {
68
69 // Initialize the set of available features.
70 setAvailableFeatures(ComputeAvailableFeatures(
71 &TM.getSubtarget<X86Subtarget>()));
72 }
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000073
Benjamin Kramer92d89982010-07-14 22:38:02 +000074 virtual bool ParseInstruction(StringRef Name, SMLoc NameLoc,
Chris Lattnerf29c0b62010-01-14 22:21:20 +000075 SmallVectorImpl<MCParsedAsmOperand*> &Operands);
Kevin Enderbyce4bec82009-09-10 20:51:44 +000076
77 virtual bool ParseDirective(AsmToken DirectiveID);
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +000078};
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +000079
Daniel Dunbar63ec0932010-03-18 20:06:02 +000080class X86_32ATTAsmParser : public X86ATTAsmParser {
81public:
Daniel Dunbar419197c2010-07-19 00:33:49 +000082 X86_32ATTAsmParser(const Target &T, MCAsmParser &_Parser, TargetMachine &TM)
83 : X86ATTAsmParser(T, _Parser, TM) {
Daniel Dunbar63ec0932010-03-18 20:06:02 +000084 Is64Bit = false;
85 }
86};
87
88class X86_64ATTAsmParser : public X86ATTAsmParser {
89public:
Daniel Dunbar419197c2010-07-19 00:33:49 +000090 X86_64ATTAsmParser(const Target &T, MCAsmParser &_Parser, TargetMachine &TM)
91 : X86ATTAsmParser(T, _Parser, TM) {
Daniel Dunbar63ec0932010-03-18 20:06:02 +000092 Is64Bit = true;
93 }
94};
95
Chris Lattner4eb9df02009-07-29 06:33:53 +000096} // end anonymous namespace
97
Sean Callanan86c11812010-01-23 00:40:33 +000098/// @name Auto-generated Match Functions
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +000099/// {
Sean Callanan86c11812010-01-23 00:40:33 +0000100
Chris Lattner60db0a62010-02-09 00:34:28 +0000101static unsigned MatchRegisterName(StringRef Name);
Sean Callanan86c11812010-01-23 00:40:33 +0000102
103/// }
Chris Lattner4eb9df02009-07-29 06:33:53 +0000104
105namespace {
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000106
107/// X86Operand - Instances of this class represent a parsed X86 machine
108/// instruction.
Chris Lattner872501b2010-01-14 21:20:55 +0000109struct X86Operand : public MCParsedAsmOperand {
Chris Lattner86e61532010-01-15 19:06:59 +0000110 enum KindTy {
Daniel Dunbare10787e2009-08-07 08:26:05 +0000111 Token,
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000112 Register,
113 Immediate,
114 Memory
115 } Kind;
116
Chris Lattner0c2538f2010-01-15 18:51:29 +0000117 SMLoc StartLoc, EndLoc;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000118
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000119 union {
120 struct {
Daniel Dunbare10787e2009-08-07 08:26:05 +0000121 const char *Data;
122 unsigned Length;
123 } Tok;
124
125 struct {
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000126 unsigned RegNo;
127 } Reg;
128
129 struct {
Daniel Dunbar73da11e2009-08-31 08:08:38 +0000130 const MCExpr *Val;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000131 } Imm;
132
133 struct {
134 unsigned SegReg;
Daniel Dunbar73da11e2009-08-31 08:08:38 +0000135 const MCExpr *Disp;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000136 unsigned BaseReg;
137 unsigned IndexReg;
138 unsigned Scale;
139 } Mem;
Daniel Dunbar2b11c7d2009-07-20 20:01:54 +0000140 };
Daniel Dunbar71475772009-07-17 20:42:00 +0000141
Chris Lattner015cfb12010-01-15 19:33:43 +0000142 X86Operand(KindTy K, SMLoc Start, SMLoc End)
Chris Lattner86e61532010-01-15 19:06:59 +0000143 : Kind(K), StartLoc(Start), EndLoc(End) {}
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000144
Chris Lattner86e61532010-01-15 19:06:59 +0000145 /// getStartLoc - Get the location of the first token of this operand.
146 SMLoc getStartLoc() const { return StartLoc; }
147 /// getEndLoc - Get the location of the last token of this operand.
148 SMLoc getEndLoc() const { return EndLoc; }
149
Daniel Dunbarebace222010-08-11 06:37:04 +0000150 virtual void dump(raw_ostream &OS) const {}
151
Daniel Dunbare10787e2009-08-07 08:26:05 +0000152 StringRef getToken() const {
153 assert(Kind == Token && "Invalid access!");
154 return StringRef(Tok.Data, Tok.Length);
155 }
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000156 void setTokenValue(StringRef Value) {
157 assert(Kind == Token && "Invalid access!");
158 Tok.Data = Value.data();
159 Tok.Length = Value.size();
160 }
Daniel Dunbare10787e2009-08-07 08:26:05 +0000161
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000162 unsigned getReg() const {
163 assert(Kind == Register && "Invalid access!");
164 return Reg.RegNo;
165 }
Daniel Dunbarf59ee962009-07-28 20:47:52 +0000166
Daniel Dunbar73da11e2009-08-31 08:08:38 +0000167 const MCExpr *getImm() const {
Daniel Dunbar3ebf8482009-07-31 20:53:16 +0000168 assert(Kind == Immediate && "Invalid access!");
169 return Imm.Val;
170 }
171
Daniel Dunbar73da11e2009-08-31 08:08:38 +0000172 const MCExpr *getMemDisp() const {
Daniel Dunbar3ebf8482009-07-31 20:53:16 +0000173 assert(Kind == Memory && "Invalid access!");
174 return Mem.Disp;
175 }
176 unsigned getMemSegReg() const {
177 assert(Kind == Memory && "Invalid access!");
178 return Mem.SegReg;
179 }
180 unsigned getMemBaseReg() const {
181 assert(Kind == Memory && "Invalid access!");
182 return Mem.BaseReg;
183 }
184 unsigned getMemIndexReg() const {
185 assert(Kind == Memory && "Invalid access!");
186 return Mem.IndexReg;
187 }
188 unsigned getMemScale() const {
189 assert(Kind == Memory && "Invalid access!");
190 return Mem.Scale;
191 }
192
Daniel Dunbar541efcc2009-08-08 07:50:56 +0000193 bool isToken() const {return Kind == Token; }
Daniel Dunbare10787e2009-08-07 08:26:05 +0000194
195 bool isImm() const { return Kind == Immediate; }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000196
Daniel Dunbarb52fcd62010-05-22 21:02:33 +0000197 bool isImmSExti16i8() const {
Daniel Dunbar8e33cb22009-08-09 07:20:21 +0000198 if (!isImm())
199 return false;
200
Daniel Dunbarb52fcd62010-05-22 21:02:33 +0000201 // If this isn't a constant expr, just assume it fits and let relaxation
202 // handle it.
203 const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
204 if (!CE)
205 return true;
Daniel Dunbar8e33cb22009-08-09 07:20:21 +0000206
Daniel Dunbarb52fcd62010-05-22 21:02:33 +0000207 // Otherwise, check the value is in a range that makes sense for this
208 // extension.
209 uint64_t Value = CE->getValue();
210 return (( Value <= 0x000000000000007FULL)||
211 (0x000000000000FF80ULL <= Value && Value <= 0x000000000000FFFFULL)||
212 (0xFFFFFFFFFFFFFF80ULL <= Value && Value <= 0xFFFFFFFFFFFFFFFFULL));
Daniel Dunbar8e33cb22009-08-09 07:20:21 +0000213 }
Daniel Dunbarb52fcd62010-05-22 21:02:33 +0000214 bool isImmSExti32i8() const {
Daniel Dunbar61655aa2010-05-20 20:20:39 +0000215 if (!isImm())
216 return false;
217
Daniel Dunbarb52fcd62010-05-22 21:02:33 +0000218 // If this isn't a constant expr, just assume it fits and let relaxation
219 // handle it.
220 const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
221 if (!CE)
222 return true;
Daniel Dunbar61655aa2010-05-20 20:20:39 +0000223
Daniel Dunbarb52fcd62010-05-22 21:02:33 +0000224 // Otherwise, check the value is in a range that makes sense for this
225 // extension.
226 uint64_t Value = CE->getValue();
227 return (( Value <= 0x000000000000007FULL)||
228 (0x00000000FFFFFF80ULL <= Value && Value <= 0x00000000FFFFFFFFULL)||
229 (0xFFFFFFFFFFFFFF80ULL <= Value && Value <= 0xFFFFFFFFFFFFFFFFULL));
230 }
231 bool isImmSExti64i8() const {
232 if (!isImm())
233 return false;
234
235 // If this isn't a constant expr, just assume it fits and let relaxation
236 // handle it.
237 const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
238 if (!CE)
239 return true;
240
241 // Otherwise, check the value is in a range that makes sense for this
242 // extension.
243 uint64_t Value = CE->getValue();
244 return (( Value <= 0x000000000000007FULL)||
245 (0xFFFFFFFFFFFFFF80ULL <= Value && Value <= 0xFFFFFFFFFFFFFFFFULL));
246 }
247 bool isImmSExti64i32() const {
248 if (!isImm())
249 return false;
250
251 // If this isn't a constant expr, just assume it fits and let relaxation
252 // handle it.
253 const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
254 if (!CE)
255 return true;
256
257 // Otherwise, check the value is in a range that makes sense for this
258 // extension.
259 uint64_t Value = CE->getValue();
260 return (( Value <= 0x000000007FFFFFFFULL)||
261 (0xFFFFFFFF80000000ULL <= Value && Value <= 0xFFFFFFFFFFFFFFFFULL));
Daniel Dunbar61655aa2010-05-20 20:20:39 +0000262 }
263
Daniel Dunbare10787e2009-08-07 08:26:05 +0000264 bool isMem() const { return Kind == Memory; }
265
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000266 bool isAbsMem() const {
267 return Kind == Memory && !getMemSegReg() && !getMemBaseReg() &&
Daniel Dunbar3184f222010-02-02 21:44:16 +0000268 !getMemIndexReg() && getMemScale() == 1;
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000269 }
270
Daniel Dunbare10787e2009-08-07 08:26:05 +0000271 bool isReg() const { return Kind == Register; }
272
Daniel Dunbar224340ca2010-02-13 00:17:21 +0000273 void addExpr(MCInst &Inst, const MCExpr *Expr) const {
274 // Add as immediates when possible.
275 if (const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(Expr))
276 Inst.addOperand(MCOperand::CreateImm(CE->getValue()));
277 else
278 Inst.addOperand(MCOperand::CreateExpr(Expr));
279 }
280
Daniel Dunbaraeb1feb2009-08-10 21:00:45 +0000281 void addRegOperands(MCInst &Inst, unsigned N) const {
Daniel Dunbare10787e2009-08-07 08:26:05 +0000282 assert(N == 1 && "Invalid number of operands!");
283 Inst.addOperand(MCOperand::CreateReg(getReg()));
284 }
285
Daniel Dunbaraeb1feb2009-08-10 21:00:45 +0000286 void addImmOperands(MCInst &Inst, unsigned N) const {
Daniel Dunbare10787e2009-08-07 08:26:05 +0000287 assert(N == 1 && "Invalid number of operands!");
Daniel Dunbar224340ca2010-02-13 00:17:21 +0000288 addExpr(Inst, getImm());
Daniel Dunbare10787e2009-08-07 08:26:05 +0000289 }
290
Daniel Dunbaraeb1feb2009-08-10 21:00:45 +0000291 void addMemOperands(MCInst &Inst, unsigned N) const {
Daniel Dunbara97adee2010-01-30 00:24:00 +0000292 assert((N == 5) && "Invalid number of operands!");
Daniel Dunbare10787e2009-08-07 08:26:05 +0000293 Inst.addOperand(MCOperand::CreateReg(getMemBaseReg()));
294 Inst.addOperand(MCOperand::CreateImm(getMemScale()));
295 Inst.addOperand(MCOperand::CreateReg(getMemIndexReg()));
Daniel Dunbar224340ca2010-02-13 00:17:21 +0000296 addExpr(Inst, getMemDisp());
Daniel Dunbara97adee2010-01-30 00:24:00 +0000297 Inst.addOperand(MCOperand::CreateReg(getMemSegReg()));
298 }
Daniel Dunbare10787e2009-08-07 08:26:05 +0000299
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000300 void addAbsMemOperands(MCInst &Inst, unsigned N) const {
301 assert((N == 1) && "Invalid number of operands!");
302 Inst.addOperand(MCOperand::CreateExpr(getMemDisp()));
303 }
304
Chris Lattner528d00b2010-01-15 19:28:38 +0000305 static X86Operand *CreateToken(StringRef Str, SMLoc Loc) {
306 X86Operand *Res = new X86Operand(Token, Loc, Loc);
Chris Lattner0c2538f2010-01-15 18:51:29 +0000307 Res->Tok.Data = Str.data();
308 Res->Tok.Length = Str.size();
Daniel Dunbare10787e2009-08-07 08:26:05 +0000309 return Res;
310 }
311
Chris Lattner0c2538f2010-01-15 18:51:29 +0000312 static X86Operand *CreateReg(unsigned RegNo, SMLoc StartLoc, SMLoc EndLoc) {
Chris Lattner86e61532010-01-15 19:06:59 +0000313 X86Operand *Res = new X86Operand(Register, StartLoc, EndLoc);
Chris Lattner0c2538f2010-01-15 18:51:29 +0000314 Res->Reg.RegNo = RegNo;
Chris Lattner0c2538f2010-01-15 18:51:29 +0000315 return Res;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000316 }
Daniel Dunbare10787e2009-08-07 08:26:05 +0000317
Chris Lattner528d00b2010-01-15 19:28:38 +0000318 static X86Operand *CreateImm(const MCExpr *Val, SMLoc StartLoc, SMLoc EndLoc){
319 X86Operand *Res = new X86Operand(Immediate, StartLoc, EndLoc);
Chris Lattner0c2538f2010-01-15 18:51:29 +0000320 Res->Imm.Val = Val;
321 return Res;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000322 }
Daniel Dunbare10787e2009-08-07 08:26:05 +0000323
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000324 /// Create an absolute memory operand.
325 static X86Operand *CreateMem(const MCExpr *Disp, SMLoc StartLoc,
326 SMLoc EndLoc) {
327 X86Operand *Res = new X86Operand(Memory, StartLoc, EndLoc);
328 Res->Mem.SegReg = 0;
329 Res->Mem.Disp = Disp;
330 Res->Mem.BaseReg = 0;
331 Res->Mem.IndexReg = 0;
Daniel Dunbar3184f222010-02-02 21:44:16 +0000332 Res->Mem.Scale = 1;
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000333 return Res;
334 }
335
336 /// Create a generalized memory operand.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000337 static X86Operand *CreateMem(unsigned SegReg, const MCExpr *Disp,
338 unsigned BaseReg, unsigned IndexReg,
Chris Lattner015cfb12010-01-15 19:33:43 +0000339 unsigned Scale, SMLoc StartLoc, SMLoc EndLoc) {
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000340 // We should never just have a displacement, that should be parsed as an
341 // absolute memory operand.
Daniel Dunbara4fc8d92009-07-31 22:22:54 +0000342 assert((SegReg || BaseReg || IndexReg) && "Invalid memory operand!");
343
Daniel Dunbar3ebf8482009-07-31 20:53:16 +0000344 // The scale should always be one of {1,2,4,8}.
345 assert(((Scale == 1 || Scale == 2 || Scale == 4 || Scale == 8)) &&
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000346 "Invalid scale!");
Chris Lattner015cfb12010-01-15 19:33:43 +0000347 X86Operand *Res = new X86Operand(Memory, StartLoc, EndLoc);
Chris Lattner0c2538f2010-01-15 18:51:29 +0000348 Res->Mem.SegReg = SegReg;
349 Res->Mem.Disp = Disp;
350 Res->Mem.BaseReg = BaseReg;
351 Res->Mem.IndexReg = IndexReg;
352 Res->Mem.Scale = Scale;
353 return Res;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000354 }
355};
Daniel Dunbar3c2a8932009-07-20 18:55:04 +0000356
Chris Lattner4eb9df02009-07-29 06:33:53 +0000357} // end anonymous namespace.
Daniel Dunbarf59ee962009-07-28 20:47:52 +0000358
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000359
Chris Lattner0c2538f2010-01-15 18:51:29 +0000360bool X86ATTAsmParser::ParseRegister(unsigned &RegNo,
361 SMLoc &StartLoc, SMLoc &EndLoc) {
Chris Lattnercc2ad082010-01-15 18:27:19 +0000362 RegNo = 0;
Sean Callanan936b0d32010-01-19 21:44:56 +0000363 const AsmToken &TokPercent = Parser.getTok();
Kevin Enderby7d912182009-09-03 17:15:07 +0000364 assert(TokPercent.is(AsmToken::Percent) && "Invalid token kind!");
Chris Lattner0c2538f2010-01-15 18:51:29 +0000365 StartLoc = TokPercent.getLoc();
Sean Callanana83fd7d2010-01-19 20:27:46 +0000366 Parser.Lex(); // Eat percent token.
Kevin Enderby7d912182009-09-03 17:15:07 +0000367
Sean Callanan936b0d32010-01-19 21:44:56 +0000368 const AsmToken &Tok = Parser.getTok();
Kevin Enderbyc0edda32009-09-16 17:18:29 +0000369 if (Tok.isNot(AsmToken::Identifier))
370 return Error(Tok.getLoc(), "invalid register name");
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000371
Daniel Dunbar00331992009-07-29 00:02:19 +0000372 // FIXME: Validate register for the current architecture; we have to do
373 // validation later, so maybe there is no need for this here.
Kevin Enderby7d912182009-09-03 17:15:07 +0000374 RegNo = MatchRegisterName(Tok.getString());
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000375
Bruno Cardoso Lopes306a1f92010-07-24 00:06:39 +0000376 // FIXME: This should be done using Requires<In32BitMode> and
377 // Requires<In64BitMode> so "eiz" usage in 64-bit instructions
378 // can be also checked.
379 if (RegNo == X86::RIZ && !Is64Bit)
380 return Error(Tok.getLoc(), "riz register in 64-bit mode only");
381
Chris Lattnerd00faaa2010-02-09 00:49:22 +0000382 // Parse %st(1) and "%st" as "%st(0)"
383 if (RegNo == 0 && Tok.getString() == "st") {
384 RegNo = X86::ST0;
385 EndLoc = Tok.getLoc();
386 Parser.Lex(); // Eat 'st'
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000387
Chris Lattnerd00faaa2010-02-09 00:49:22 +0000388 // Check to see if we have '(4)' after %st.
389 if (getLexer().isNot(AsmToken::LParen))
390 return false;
391 // Lex the paren.
392 getParser().Lex();
393
394 const AsmToken &IntTok = Parser.getTok();
395 if (IntTok.isNot(AsmToken::Integer))
396 return Error(IntTok.getLoc(), "expected stack index");
397 switch (IntTok.getIntVal()) {
398 case 0: RegNo = X86::ST0; break;
399 case 1: RegNo = X86::ST1; break;
400 case 2: RegNo = X86::ST2; break;
401 case 3: RegNo = X86::ST3; break;
402 case 4: RegNo = X86::ST4; break;
403 case 5: RegNo = X86::ST5; break;
404 case 6: RegNo = X86::ST6; break;
405 case 7: RegNo = X86::ST7; break;
406 default: return Error(IntTok.getLoc(), "invalid stack index");
407 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000408
Chris Lattnerd00faaa2010-02-09 00:49:22 +0000409 if (getParser().Lex().isNot(AsmToken::RParen))
410 return Error(Parser.getTok().getLoc(), "expected ')'");
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000411
Chris Lattnerd00faaa2010-02-09 00:49:22 +0000412 EndLoc = Tok.getLoc();
413 Parser.Lex(); // Eat ')'
414 return false;
415 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000416
Chris Lattner80486622010-06-24 07:29:18 +0000417 // If this is "db[0-7]", match it as an alias
418 // for dr[0-7].
419 if (RegNo == 0 && Tok.getString().size() == 3 &&
420 Tok.getString().startswith("db")) {
421 switch (Tok.getString()[2]) {
422 case '0': RegNo = X86::DR0; break;
423 case '1': RegNo = X86::DR1; break;
424 case '2': RegNo = X86::DR2; break;
425 case '3': RegNo = X86::DR3; break;
426 case '4': RegNo = X86::DR4; break;
427 case '5': RegNo = X86::DR5; break;
428 case '6': RegNo = X86::DR6; break;
429 case '7': RegNo = X86::DR7; break;
430 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000431
Chris Lattner80486622010-06-24 07:29:18 +0000432 if (RegNo != 0) {
433 EndLoc = Tok.getLoc();
434 Parser.Lex(); // Eat it.
435 return false;
436 }
437 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000438
Daniel Dunbar66f4f542009-08-08 21:22:41 +0000439 if (RegNo == 0)
Daniel Dunbar00331992009-07-29 00:02:19 +0000440 return Error(Tok.getLoc(), "invalid register name");
441
Chris Lattner0c2538f2010-01-15 18:51:29 +0000442 EndLoc = Tok.getLoc();
Sean Callanana83fd7d2010-01-19 20:27:46 +0000443 Parser.Lex(); // Eat identifier token.
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000444 return false;
Daniel Dunbar71475772009-07-17 20:42:00 +0000445}
446
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000447X86Operand *X86ATTAsmParser::ParseOperand() {
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000448 switch (getLexer().getKind()) {
449 default:
Chris Lattnerb9270732010-04-17 18:56:34 +0000450 // Parse a memory operand with no segment register.
451 return ParseMemOperand(0, Parser.getTok().getLoc());
Chris Lattnercc2ad082010-01-15 18:27:19 +0000452 case AsmToken::Percent: {
Chris Lattnerb9270732010-04-17 18:56:34 +0000453 // Read the register.
Chris Lattnercc2ad082010-01-15 18:27:19 +0000454 unsigned RegNo;
Chris Lattner0c2538f2010-01-15 18:51:29 +0000455 SMLoc Start, End;
456 if (ParseRegister(RegNo, Start, End)) return 0;
Bruno Cardoso Lopes306a1f92010-07-24 00:06:39 +0000457 if (RegNo == X86::EIZ || RegNo == X86::RIZ) {
458 Error(Start, "eiz and riz can only be used as index registers");
459 return 0;
460 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000461
Chris Lattnerb9270732010-04-17 18:56:34 +0000462 // If this is a segment register followed by a ':', then this is the start
463 // of a memory reference, otherwise this is a normal register reference.
464 if (getLexer().isNot(AsmToken::Colon))
465 return X86Operand::CreateReg(RegNo, Start, End);
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000466
467
Chris Lattnerb9270732010-04-17 18:56:34 +0000468 getParser().Lex(); // Eat the colon.
469 return ParseMemOperand(RegNo, Start);
Chris Lattnercc2ad082010-01-15 18:27:19 +0000470 }
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000471 case AsmToken::Dollar: {
472 // $42 -> immediate.
Sean Callanan936b0d32010-01-19 21:44:56 +0000473 SMLoc Start = Parser.getTok().getLoc(), End;
Sean Callanana83fd7d2010-01-19 20:27:46 +0000474 Parser.Lex();
Daniel Dunbar73da11e2009-08-31 08:08:38 +0000475 const MCExpr *Val;
Chris Lattnere17df0b2010-01-15 19:39:23 +0000476 if (getParser().ParseExpression(Val, End))
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000477 return 0;
Chris Lattner528d00b2010-01-15 19:28:38 +0000478 return X86Operand::CreateImm(Val, Start, End);
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000479 }
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000480 }
Daniel Dunbar2b11c7d2009-07-20 20:01:54 +0000481}
482
Chris Lattnerb9270732010-04-17 18:56:34 +0000483/// ParseMemOperand: segment: disp(basereg, indexreg, scale). The '%ds:' prefix
484/// has already been parsed if present.
485X86Operand *X86ATTAsmParser::ParseMemOperand(unsigned SegReg, SMLoc MemStart) {
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000486
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000487 // We have to disambiguate a parenthesized expression "(4+5)" from the start
488 // of a memory operand with a missing displacement "(%ebx)" or "(,%eax)". The
Chris Lattner807a3bc2010-01-24 01:07:33 +0000489 // only way to do this without lookahead is to eat the '(' and see what is
490 // after it.
Daniel Dunbar73da11e2009-08-31 08:08:38 +0000491 const MCExpr *Disp = MCConstantExpr::Create(0, getParser().getContext());
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000492 if (getLexer().isNot(AsmToken::LParen)) {
Chris Lattnere17df0b2010-01-15 19:39:23 +0000493 SMLoc ExprEnd;
494 if (getParser().ParseExpression(Disp, ExprEnd)) return 0;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000495
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000496 // After parsing the base expression we could either have a parenthesized
497 // memory address or not. If not, return now. If so, eat the (.
498 if (getLexer().isNot(AsmToken::LParen)) {
Daniel Dunbara4fc8d92009-07-31 22:22:54 +0000499 // Unless we have a segment register, treat this as an immediate.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000500 if (SegReg == 0)
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000501 return X86Operand::CreateMem(Disp, MemStart, ExprEnd);
Chris Lattner015cfb12010-01-15 19:33:43 +0000502 return X86Operand::CreateMem(SegReg, Disp, 0, 0, 1, MemStart, ExprEnd);
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000503 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000504
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000505 // Eat the '('.
Sean Callanana83fd7d2010-01-19 20:27:46 +0000506 Parser.Lex();
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000507 } else {
508 // Okay, we have a '('. We don't know if this is an expression or not, but
509 // so we have to eat the ( to see beyond it.
Sean Callanan936b0d32010-01-19 21:44:56 +0000510 SMLoc LParenLoc = Parser.getTok().getLoc();
Sean Callanana83fd7d2010-01-19 20:27:46 +0000511 Parser.Lex(); // Eat the '('.
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000512
Kevin Enderby7d912182009-09-03 17:15:07 +0000513 if (getLexer().is(AsmToken::Percent) || getLexer().is(AsmToken::Comma)) {
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000514 // Nothing to do here, fall into the code below with the '(' part of the
515 // memory operand consumed.
516 } else {
Chris Lattner528d00b2010-01-15 19:28:38 +0000517 SMLoc ExprEnd;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000518
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000519 // It must be an parenthesized expression, parse it now.
Chris Lattner528d00b2010-01-15 19:28:38 +0000520 if (getParser().ParseParenExpression(Disp, ExprEnd))
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000521 return 0;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000522
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000523 // After parsing the base expression we could either have a parenthesized
524 // memory address or not. If not, return now. If so, eat the (.
525 if (getLexer().isNot(AsmToken::LParen)) {
Daniel Dunbara4fc8d92009-07-31 22:22:54 +0000526 // Unless we have a segment register, treat this as an immediate.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000527 if (SegReg == 0)
Daniel Dunbar76e5d702010-01-30 01:02:48 +0000528 return X86Operand::CreateMem(Disp, LParenLoc, ExprEnd);
Chris Lattner015cfb12010-01-15 19:33:43 +0000529 return X86Operand::CreateMem(SegReg, Disp, 0, 0, 1, MemStart, ExprEnd);
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000530 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000531
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000532 // Eat the '('.
Sean Callanana83fd7d2010-01-19 20:27:46 +0000533 Parser.Lex();
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000534 }
535 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000536
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000537 // If we reached here, then we just ate the ( of the memory operand. Process
538 // the rest of the memory operand.
Daniel Dunbar3ebf8482009-07-31 20:53:16 +0000539 unsigned BaseReg = 0, IndexReg = 0, Scale = 1;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000540
Chris Lattner0c2538f2010-01-15 18:51:29 +0000541 if (getLexer().is(AsmToken::Percent)) {
542 SMLoc L;
543 if (ParseRegister(BaseReg, L, L)) return 0;
Bruno Cardoso Lopes306a1f92010-07-24 00:06:39 +0000544 if (BaseReg == X86::EIZ || BaseReg == X86::RIZ) {
545 Error(L, "eiz and riz can only be used as index registers");
546 return 0;
547 }
Chris Lattner0c2538f2010-01-15 18:51:29 +0000548 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000549
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000550 if (getLexer().is(AsmToken::Comma)) {
Sean Callanana83fd7d2010-01-19 20:27:46 +0000551 Parser.Lex(); // Eat the comma.
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000552
553 // Following the comma we should have either an index register, or a scale
554 // value. We don't support the later form, but we want to parse it
555 // correctly.
556 //
557 // Not that even though it would be completely consistent to support syntax
Bruno Cardoso Lopes306a1f92010-07-24 00:06:39 +0000558 // like "1(%eax,,1)", the assembler doesn't. Use "eiz" or "riz" for this.
Kevin Enderby7d912182009-09-03 17:15:07 +0000559 if (getLexer().is(AsmToken::Percent)) {
Chris Lattner0c2538f2010-01-15 18:51:29 +0000560 SMLoc L;
561 if (ParseRegister(IndexReg, L, L)) return 0;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000562
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000563 if (getLexer().isNot(AsmToken::RParen)) {
564 // Parse the scale amount:
565 // ::= ',' [scale-expression]
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000566 if (getLexer().isNot(AsmToken::Comma)) {
Sean Callanan936b0d32010-01-19 21:44:56 +0000567 Error(Parser.getTok().getLoc(),
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000568 "expected comma in scale expression");
569 return 0;
570 }
Sean Callanana83fd7d2010-01-19 20:27:46 +0000571 Parser.Lex(); // Eat the comma.
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000572
573 if (getLexer().isNot(AsmToken::RParen)) {
Sean Callanan936b0d32010-01-19 21:44:56 +0000574 SMLoc Loc = Parser.getTok().getLoc();
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000575
576 int64_t ScaleVal;
577 if (getParser().ParseAbsoluteExpression(ScaleVal))
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000578 return 0;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000579
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000580 // Validate the scale amount.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000581 if (ScaleVal != 1 && ScaleVal != 2 && ScaleVal != 4 && ScaleVal != 8){
582 Error(Loc, "scale factor in address must be 1, 2, 4 or 8");
583 return 0;
584 }
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000585 Scale = (unsigned)ScaleVal;
586 }
587 }
588 } else if (getLexer().isNot(AsmToken::RParen)) {
Daniel Dunbar94b84a12010-08-24 19:13:38 +0000589 // A scale amount without an index is ignored.
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000590 // index.
Sean Callanan936b0d32010-01-19 21:44:56 +0000591 SMLoc Loc = Parser.getTok().getLoc();
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000592
593 int64_t Value;
594 if (getParser().ParseAbsoluteExpression(Value))
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000595 return 0;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000596
Daniel Dunbar94b84a12010-08-24 19:13:38 +0000597 if (Value != 1)
598 Warning(Loc, "scale factor without index register is ignored");
599 Scale = 1;
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000600 }
601 }
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000602
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000603 // Ok, we've eaten the memory operand, verify we have a ')' and eat it too.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000604 if (getLexer().isNot(AsmToken::RParen)) {
Sean Callanan936b0d32010-01-19 21:44:56 +0000605 Error(Parser.getTok().getLoc(), "unexpected token in memory operand");
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000606 return 0;
607 }
Sean Callanan936b0d32010-01-19 21:44:56 +0000608 SMLoc MemEnd = Parser.getTok().getLoc();
Sean Callanana83fd7d2010-01-19 20:27:46 +0000609 Parser.Lex(); // Eat the ')'.
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000610
Chris Lattner015cfb12010-01-15 19:33:43 +0000611 return X86Operand::CreateMem(SegReg, Disp, BaseReg, IndexReg, Scale,
612 MemStart, MemEnd);
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000613}
614
Chris Lattnerf29c0b62010-01-14 22:21:20 +0000615bool X86ATTAsmParser::
Benjamin Kramer92d89982010-07-14 22:38:02 +0000616ParseInstruction(StringRef Name, SMLoc NameLoc,
Chris Lattnerf29c0b62010-01-14 22:21:20 +0000617 SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
Dan Gohman29790ed2010-05-20 16:16:00 +0000618
Kevin Enderby0de0f3f2010-06-08 23:48:44 +0000619 // The "Jump if rCX Zero" form jcxz is not allowed in 64-bit mode and
620 // the form jrcxz is not allowed in 32-bit mode.
621 if (Is64Bit) {
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000622 // FIXME: We can do jcxz/jecxz, we just don't have the encoding right yet.
623 if (Name == "jcxz" || Name == "jecxz")
624 return Error(NameLoc, Name + " cannot be encoded in 64-bit mode");
Kevin Enderby0de0f3f2010-06-08 23:48:44 +0000625 }
626
Daniel Dunbar3e0c9792010-02-10 21:19:28 +0000627 // FIXME: Hack to recognize "sal..." and "rep..." for now. We need a way to
628 // represent alternative syntaxes in the .td file, without requiring
629 // instruction duplication.
630 StringRef PatchedName = StringSwitch<StringRef>(Name)
631 .Case("sal", "shl")
632 .Case("salb", "shlb")
633 .Case("sall", "shll")
634 .Case("salq", "shlq")
635 .Case("salw", "shlw")
636 .Case("repe", "rep")
637 .Case("repz", "rep")
638 .Case("repnz", "repne")
Chris Lattner415e04f2010-09-06 23:40:56 +0000639 .Case("push", Is64Bit ? "pushq" : "pushl")
Dan Gohman29790ed2010-05-20 16:16:00 +0000640 .Case("pushf", Is64Bit ? "pushfq" : "pushfl")
641 .Case("popf", Is64Bit ? "popfq" : "popfl")
Kevin Enderby7e7482c2010-05-21 23:01:38 +0000642 .Case("retl", Is64Bit ? "retl" : "ret")
643 .Case("retq", Is64Bit ? "ret" : "retq")
Daniel Dunbard459e292010-05-22 06:37:33 +0000644 .Case("setz", "sete")
645 .Case("setnz", "setne")
646 .Case("jz", "je")
647 .Case("jnz", "jne")
Kevin Enderby9738f642010-05-27 21:33:19 +0000648 .Case("jc", "jb")
Kevin Enderby0de0f3f2010-06-08 23:48:44 +0000649 // FIXME: in 32-bit mode jcxz requires an AdSize prefix. In 64-bit mode
650 // jecxz requires an AdSize prefix but jecxz does not have a prefix in
651 // 32-bit mode.
Kevin Enderby9738f642010-05-27 21:33:19 +0000652 .Case("jecxz", "jcxz")
Chris Lattner31c63fb2010-09-06 20:10:12 +0000653 .Case("jrcxz", Is64Bit ? "jcxz" : "jrcxz")
Kevin Enderby9738f642010-05-27 21:33:19 +0000654 .Case("jna", "jbe")
655 .Case("jnae", "jb")
656 .Case("jnb", "jae")
657 .Case("jnbe", "ja")
658 .Case("jnc", "jae")
659 .Case("jng", "jle")
660 .Case("jnge", "jl")
661 .Case("jnl", "jge")
662 .Case("jnle", "jg")
663 .Case("jpe", "jp")
664 .Case("jpo", "jnp")
Chris Lattner30bb3842010-09-07 00:05:45 +0000665 // Condition code aliases for 16-bit, 32-bit, 64-bit and unspec operands.
666 .Case("cmovcw", "cmovbw") .Case("cmovcl", "cmovbl")
667 .Case("cmovcq", "cmovbq") .Case("cmovc", "cmovb")
668 .Case("cmovnaw", "cmovbew").Case("cmovnal", "cmovbel")
669 .Case("cmovnaq", "cmovbeq").Case("cmovna", "cmovbe")
670 .Case("cmovnbw", "cmovaew").Case("cmovnbl", "cmovael")
671 .Case("cmovnbq", "cmovaeq").Case("cmovnb", "cmovae")
672 .Case("cmovnbew","cmovaw") .Case("cmovnbel","cmoval")
673 .Case("cmovnbeq","cmovaq") .Case("cmovnbe", "cmova")
674 .Case("cmovncw", "cmovaew").Case("cmovncl", "cmovael")
675 .Case("cmovncq", "cmovaeq").Case("cmovnc", "cmovae")
676 .Case("cmovngw", "cmovlew").Case("cmovngl", "cmovlel")
677 .Case("cmovngq", "cmovleq").Case("cmovng", "cmovle")
678 .Case("cmovnw", "cmovgew").Case("cmovnl", "cmovgel")
679 .Case("cmovnq", "cmovgeq").Case("cmovn", "cmovge")
680 .Case("cmovngw", "cmovlew").Case("cmovngl", "cmovlel")
681 .Case("cmovngq", "cmovleq").Case("cmovng", "cmovle")
682 .Case("cmovngew","cmovlw") .Case("cmovngel","cmovll")
683 .Case("cmovngeq","cmovlq") .Case("cmovnge", "cmovl")
684 .Case("cmovnlw", "cmovgew").Case("cmovnll", "cmovgel")
685 .Case("cmovnlq", "cmovgeq").Case("cmovnl", "cmovge")
686 .Case("cmovnlew","cmovgw") .Case("cmovnlel","cmovgl")
687 .Case("cmovnleq","cmovgq") .Case("cmovnle", "cmovg")
688 .Case("cmovnzw", "cmovnew").Case("cmovnzl", "cmovnel")
689 .Case("cmovnzq", "cmovneq").Case("cmovnz", "cmovne")
690 .Case("cmovzw", "cmovew") .Case("cmovzl", "cmovel")
691 .Case("cmovzq", "cmoveq") .Case("cmovz", "cmove")
Kevin Enderbyb2922892010-05-28 20:59:10 +0000692 .Case("fwait", "wait")
Kevin Enderby4c71e082010-05-28 21:20:21 +0000693 .Case("movzx", "movzb")
Daniel Dunbar3e0c9792010-02-10 21:19:28 +0000694 .Default(Name);
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000695
696 // FIXME: Hack to recognize cmp<comparison code>{ss,sd,ps,pd}.
697 const MCExpr *ExtraImmOp = 0;
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000698 if ((PatchedName.startswith("cmp") || PatchedName.startswith("vcmp")) &&
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000699 (PatchedName.endswith("ss") || PatchedName.endswith("sd") ||
700 PatchedName.endswith("ps") || PatchedName.endswith("pd"))) {
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000701 bool IsVCMP = PatchedName.startswith("vcmp");
702 unsigned SSECCIdx = IsVCMP ? 4 : 3;
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000703 unsigned SSEComparisonCode = StringSwitch<unsigned>(
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000704 PatchedName.slice(SSECCIdx, PatchedName.size() - 2))
Bruno Cardoso Lopes6c614512010-07-07 22:24:03 +0000705 .Case("eq", 0)
706 .Case("lt", 1)
707 .Case("le", 2)
708 .Case("unord", 3)
709 .Case("neq", 4)
710 .Case("nlt", 5)
711 .Case("nle", 6)
712 .Case("ord", 7)
713 .Case("eq_uq", 8)
714 .Case("nge", 9)
715 .Case("ngt", 0x0A)
716 .Case("false", 0x0B)
717 .Case("neq_oq", 0x0C)
718 .Case("ge", 0x0D)
719 .Case("gt", 0x0E)
720 .Case("true", 0x0F)
721 .Case("eq_os", 0x10)
722 .Case("lt_oq", 0x11)
723 .Case("le_oq", 0x12)
724 .Case("unord_s", 0x13)
725 .Case("neq_us", 0x14)
726 .Case("nlt_uq", 0x15)
727 .Case("nle_uq", 0x16)
728 .Case("ord_s", 0x17)
729 .Case("eq_us", 0x18)
730 .Case("nge_uq", 0x19)
731 .Case("ngt_uq", 0x1A)
732 .Case("false_os", 0x1B)
733 .Case("neq_os", 0x1C)
734 .Case("ge_oq", 0x1D)
735 .Case("gt_oq", 0x1E)
736 .Case("true_us", 0x1F)
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000737 .Default(~0U);
738 if (SSEComparisonCode != ~0U) {
739 ExtraImmOp = MCConstantExpr::Create(SSEComparisonCode,
740 getParser().getContext());
741 if (PatchedName.endswith("ss")) {
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000742 PatchedName = IsVCMP ? "vcmpss" : "cmpss";
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000743 } else if (PatchedName.endswith("sd")) {
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000744 PatchedName = IsVCMP ? "vcmpsd" : "cmpsd";
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000745 } else if (PatchedName.endswith("ps")) {
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000746 PatchedName = IsVCMP ? "vcmpps" : "cmpps";
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000747 } else {
748 assert(PatchedName.endswith("pd") && "Unexpected mnemonic!");
Bruno Cardoso Lopes3183dd52010-06-23 21:10:57 +0000749 PatchedName = IsVCMP ? "vcmppd" : "cmppd";
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000750 }
751 }
752 }
Bruno Cardoso Lopesea0e05a2010-07-23 18:41:12 +0000753
754 // FIXME: Hack to recognize vpclmul<src1_quadword, src2_quadword>dq
755 if (PatchedName.startswith("vpclmul")) {
756 unsigned CLMULQuadWordSelect = StringSwitch<unsigned>(
757 PatchedName.slice(7, PatchedName.size() - 2))
758 .Case("lqlq", 0x00) // src1[63:0], src2[63:0]
759 .Case("hqlq", 0x01) // src1[127:64], src2[63:0]
760 .Case("lqhq", 0x10) // src1[63:0], src2[127:64]
761 .Case("hqhq", 0x11) // src1[127:64], src2[127:64]
762 .Default(~0U);
763 if (CLMULQuadWordSelect != ~0U) {
764 ExtraImmOp = MCConstantExpr::Create(CLMULQuadWordSelect,
765 getParser().getContext());
766 assert(PatchedName.endswith("dq") && "Unexpected mnemonic!");
767 PatchedName = "vpclmulqdq";
768 }
769 }
Daniel Dunbar3e0c9792010-02-10 21:19:28 +0000770 Operands.push_back(X86Operand::CreateToken(PatchedName, NameLoc));
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000771
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000772 if (ExtraImmOp)
773 Operands.push_back(X86Operand::CreateImm(ExtraImmOp, NameLoc, NameLoc));
774
Chris Lattner4cfbcdc2010-09-06 18:32:06 +0000775
776 // This does the actual operand parsing.
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000777 if (getLexer().isNot(AsmToken::EndOfStatement)) {
Daniel Dunbar71527c12009-08-11 05:00:25 +0000778
779 // Parse '*' modifier.
780 if (getLexer().is(AsmToken::Star)) {
Sean Callanan936b0d32010-01-19 21:44:56 +0000781 SMLoc Loc = Parser.getTok().getLoc();
Chris Lattner528d00b2010-01-15 19:28:38 +0000782 Operands.push_back(X86Operand::CreateToken("*", Loc));
Sean Callanana83fd7d2010-01-19 20:27:46 +0000783 Parser.Lex(); // Eat the star.
Daniel Dunbar71527c12009-08-11 05:00:25 +0000784 }
785
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000786 // Read the first operand.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000787 if (X86Operand *Op = ParseOperand())
788 Operands.push_back(Op);
789 else
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000790 return true;
Daniel Dunbar0e767d72010-05-25 19:49:32 +0000791
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000792 while (getLexer().is(AsmToken::Comma)) {
Sean Callanana83fd7d2010-01-19 20:27:46 +0000793 Parser.Lex(); // Eat the comma.
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000794
795 // Parse and remember the operand.
Chris Lattnera2bbb7c2010-01-15 18:44:13 +0000796 if (X86Operand *Op = ParseOperand())
797 Operands.push_back(Op);
798 else
Daniel Dunbare1fdb0e2009-07-28 22:40:46 +0000799 return true;
800 }
801 }
802
Daniel Dunbar18fc3442010-03-13 00:47:29 +0000803 // FIXME: Hack to handle recognizing s{hr,ar,hl}? $1.
804 if ((Name.startswith("shr") || Name.startswith("sar") ||
805 Name.startswith("shl")) &&
Chris Lattner4cfbcdc2010-09-06 18:32:06 +0000806 Operands.size() == 3) {
807 X86Operand *Op1 = static_cast<X86Operand*>(Operands[1]);
808 if (Op1->isImm() && isa<MCConstantExpr>(Op1->getImm()) &&
809 cast<MCConstantExpr>(Op1->getImm())->getValue() == 1) {
810 delete Operands[1];
811 Operands.erase(Operands.begin() + 1);
812 }
Daniel Dunbarfbd12cc2010-03-20 22:36:38 +0000813 }
Daniel Dunbar18fc3442010-03-13 00:47:29 +0000814
Kevin Enderby492d4f42010-05-25 20:52:34 +0000815 // FIXME: Hack to handle "f{mul*,add*,sub*,div*} $op, st(0)" the same as
816 // "f{mul*,add*,sub*,div*} $op"
817 if ((Name.startswith("fmul") || Name.startswith("fadd") ||
818 Name.startswith("fsub") || Name.startswith("fdiv")) &&
819 Operands.size() == 3 &&
820 static_cast<X86Operand*>(Operands[2])->isReg() &&
821 static_cast<X86Operand*>(Operands[2])->getReg() == X86::ST0) {
822 delete Operands[2];
823 Operands.erase(Operands.begin() + 2);
824 }
825
Daniel Dunbar1c8d7772010-08-24 19:37:56 +0000826 // FIXME: Hack to handle "imul <imm>, B" which is an alias for "imul <imm>, B,
827 // B".
Daniel Dunbar09392782010-08-24 19:24:18 +0000828 if (Name.startswith("imul") && Operands.size() == 3 &&
Daniel Dunbar1c8d7772010-08-24 19:37:56 +0000829 static_cast<X86Operand*>(Operands[1])->isImm() &&
Daniel Dunbar09392782010-08-24 19:24:18 +0000830 static_cast<X86Operand*>(Operands.back())->isReg()) {
831 X86Operand *Op = static_cast<X86Operand*>(Operands.back());
832 Operands.push_back(X86Operand::CreateReg(Op->getReg(), Op->getStartLoc(),
833 Op->getEndLoc()));
834 }
Chris Lattner7ece7162010-09-06 23:51:44 +0000835
836 // 'sldt <mem>' can be encoded with either sldtw or sldtq with the same
837 // effect (both store to a 16-bit mem). Force to sldtw to avoid ambiguity
838 // errors, since its encoding is the most compact.
839 if (Name == "sldt" && Operands.size() == 2 &&
Benjamin Kramer1ecb9782010-09-07 14:40:58 +0000840 static_cast<X86Operand*>(Operands[1])->isMem()) {
841 delete Operands[0];
Chris Lattner7ece7162010-09-06 23:51:44 +0000842 Operands[0] = X86Operand::CreateToken("sldtw", NameLoc);
Benjamin Kramer1ecb9782010-09-07 14:40:58 +0000843 }
Daniel Dunbar09392782010-08-24 19:24:18 +0000844
Chris Lattnerf29c0b62010-01-14 22:21:20 +0000845 return false;
Daniel Dunbar3c2a8932009-07-20 18:55:04 +0000846}
847
Kevin Enderbyce4bec82009-09-10 20:51:44 +0000848bool X86ATTAsmParser::ParseDirective(AsmToken DirectiveID) {
849 StringRef IDVal = DirectiveID.getIdentifier();
850 if (IDVal == ".word")
851 return ParseDirectiveWord(2, DirectiveID.getLoc());
852 return true;
853}
854
855/// ParseDirectiveWord
856/// ::= .word [ expression (, expression)* ]
857bool X86ATTAsmParser::ParseDirectiveWord(unsigned Size, SMLoc L) {
858 if (getLexer().isNot(AsmToken::EndOfStatement)) {
859 for (;;) {
860 const MCExpr *Value;
861 if (getParser().ParseExpression(Value))
862 return true;
863
Chris Lattnerc35681b2010-01-19 19:46:13 +0000864 getParser().getStreamer().EmitValue(Value, Size, 0 /*addrspace*/);
Kevin Enderbyce4bec82009-09-10 20:51:44 +0000865
866 if (getLexer().is(AsmToken::EndOfStatement))
867 break;
Bruno Cardoso Lopesd65cd1d2010-07-23 22:15:26 +0000868
Kevin Enderbyce4bec82009-09-10 20:51:44 +0000869 // FIXME: Improve diagnostic.
870 if (getLexer().isNot(AsmToken::Comma))
871 return Error(L, "unexpected token in directive");
Sean Callanana83fd7d2010-01-19 20:27:46 +0000872 Parser.Lex();
Kevin Enderbyce4bec82009-09-10 20:51:44 +0000873 }
874 }
875
Sean Callanana83fd7d2010-01-19 20:27:46 +0000876 Parser.Lex();
Kevin Enderbyce4bec82009-09-10 20:51:44 +0000877 return false;
878}
879
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +0000880
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000881bool
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +0000882X86ATTAsmParser::MatchInstruction(SMLoc IDLoc,
883 const SmallVectorImpl<MCParsedAsmOperand*>
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000884 &Operands,
885 MCInst &Inst) {
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +0000886 assert(!Operands.empty() && "Unexpect empty operand list!");
887
Chris Lattner628fbec2010-09-06 21:54:15 +0000888 bool WasOriginallyInvalidOperand = false;
Chris Lattner339cc7b2010-09-06 22:11:18 +0000889 unsigned OrigErrorInfo;
Chris Lattner628fbec2010-09-06 21:54:15 +0000890
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000891 // First, try a direct match.
Chris Lattner339cc7b2010-09-06 22:11:18 +0000892 switch (MatchInstructionImpl(Operands, Inst, OrigErrorInfo)) {
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000893 case Match_Success:
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000894 return false;
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000895 case Match_MissingFeature:
896 Error(IDLoc, "instruction requires a CPU feature not currently enabled");
897 return true;
Chris Lattner628fbec2010-09-06 21:54:15 +0000898 case Match_InvalidOperand:
899 WasOriginallyInvalidOperand = true;
900 break;
901 case Match_MnemonicFail:
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000902 break;
903 }
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000904
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000905 // FIXME: Ideally, we would only attempt suffix matches for things which are
906 // valid prefixes, and we could just infer the right unambiguous
907 // type. However, that requires substantially more matcher support than the
908 // following hack.
909
Chris Lattner3e4582a2010-09-06 19:11:01 +0000910 X86Operand *Op = static_cast<X86Operand*>(Operands[0]);
911 assert(Op->isToken() && "Leading operand should always be a mnemonic!");
912
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000913 // Change the operand to point to a temporary token.
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000914 StringRef Base = Op->getToken();
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +0000915 SmallString<16> Tmp;
916 Tmp += Base;
917 Tmp += ' ';
918 Op->setTokenValue(Tmp.str());
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000919
920 // Check for the various suffix matches.
921 Tmp[Base.size()] = 'b';
Chris Lattner339cc7b2010-09-06 22:11:18 +0000922 unsigned BErrorInfo, WErrorInfo, LErrorInfo, QErrorInfo;
923 MatchResultTy MatchB = MatchInstructionImpl(Operands, Inst, BErrorInfo);
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000924 Tmp[Base.size()] = 'w';
Chris Lattner339cc7b2010-09-06 22:11:18 +0000925 MatchResultTy MatchW = MatchInstructionImpl(Operands, Inst, WErrorInfo);
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000926 Tmp[Base.size()] = 'l';
Chris Lattner339cc7b2010-09-06 22:11:18 +0000927 MatchResultTy MatchL = MatchInstructionImpl(Operands, Inst, LErrorInfo);
Daniel Dunbar059379a2010-05-12 00:54:20 +0000928 Tmp[Base.size()] = 'q';
Chris Lattner339cc7b2010-09-06 22:11:18 +0000929 MatchResultTy MatchQ = MatchInstructionImpl(Operands, Inst, QErrorInfo);
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000930
931 // Restore the old token.
932 Op->setTokenValue(Base);
933
934 // If exactly one matched, then we treat that as a successful match (and the
935 // instruction will already have been filled in correctly, since the failing
936 // matches won't have modified it).
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000937 unsigned NumSuccessfulMatches =
938 (MatchB == Match_Success) + (MatchW == Match_Success) +
939 (MatchL == Match_Success) + (MatchQ == Match_Success);
940 if (NumSuccessfulMatches == 1)
Daniel Dunbar9b816a12010-05-04 16:12:42 +0000941 return false;
942
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000943 // Otherwise, the match failed, try to produce a decent error message.
Daniel Dunbar2ecc3bb2010-08-12 00:55:38 +0000944
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000945 // If we had multiple suffix matches, then identify this as an ambiguous
946 // match.
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000947 if (NumSuccessfulMatches > 1) {
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000948 char MatchChars[4];
949 unsigned NumMatches = 0;
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000950 if (MatchB == Match_Success)
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000951 MatchChars[NumMatches++] = 'b';
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000952 if (MatchW == Match_Success)
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000953 MatchChars[NumMatches++] = 'w';
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000954 if (MatchL == Match_Success)
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000955 MatchChars[NumMatches++] = 'l';
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000956 if (MatchQ == Match_Success)
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000957 MatchChars[NumMatches++] = 'q';
958
959 SmallString<126> Msg;
960 raw_svector_ostream OS(Msg);
961 OS << "ambiguous instructions require an explicit suffix (could be ";
962 for (unsigned i = 0; i != NumMatches; ++i) {
963 if (i != 0)
964 OS << ", ";
965 if (i + 1 == NumMatches)
966 OS << "or ";
967 OS << "'" << Base << MatchChars[i] << "'";
968 }
969 OS << ")";
970 Error(IDLoc, OS.str());
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000971 return true;
Daniel Dunbar7d7b4d12010-08-12 00:55:42 +0000972 }
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000973
Chris Lattner628fbec2010-09-06 21:54:15 +0000974 // Okay, we know that none of the variants matched successfully.
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000975
Chris Lattner628fbec2010-09-06 21:54:15 +0000976 // If all of the instructions reported an invalid mnemonic, then the original
977 // mnemonic was invalid.
978 if ((MatchB == Match_MnemonicFail) && (MatchW == Match_MnemonicFail) &&
979 (MatchL == Match_MnemonicFail) && (MatchQ == Match_MnemonicFail)) {
Chris Lattner339cc7b2010-09-06 22:11:18 +0000980 if (!WasOriginallyInvalidOperand) {
Chris Lattner628fbec2010-09-06 21:54:15 +0000981 Error(IDLoc, "invalid instruction mnemonic '" + Base + "'");
Chris Lattner339cc7b2010-09-06 22:11:18 +0000982 return true;
983 }
984
985 // Recover location info for the operand if we know which was the problem.
986 SMLoc ErrorLoc = IDLoc;
987 if (OrigErrorInfo != ~0U) {
988 ErrorLoc = ((X86Operand*)Operands[OrigErrorInfo])->getStartLoc();
989 if (ErrorLoc == SMLoc()) ErrorLoc = IDLoc;
990 }
991
992 Error(ErrorLoc, "invalid operand for instruction");
Chris Lattner628fbec2010-09-06 21:54:15 +0000993 return true;
994 }
Chris Lattnerb4be28f2010-09-06 20:08:02 +0000995
996 // If one instruction matched with a missing feature, report this as a
997 // missing feature.
998 if ((MatchB == Match_MissingFeature) + (MatchW == Match_MissingFeature) +
Chris Lattner628fbec2010-09-06 21:54:15 +0000999 (MatchL == Match_MissingFeature) + (MatchQ == Match_MissingFeature) == 1){
Chris Lattnerb4be28f2010-09-06 20:08:02 +00001000 Error(IDLoc, "instruction requires a CPU feature not currently enabled");
1001 return true;
1002 }
1003
Chris Lattner628fbec2010-09-06 21:54:15 +00001004 // If one instruction matched with an invalid operand, report this as an
1005 // operand failure.
1006 if ((MatchB == Match_InvalidOperand) + (MatchW == Match_InvalidOperand) +
1007 (MatchL == Match_InvalidOperand) + (MatchQ == Match_InvalidOperand) == 1){
1008 Error(IDLoc, "invalid operand for instruction");
1009 return true;
1010 }
1011
Chris Lattnerb4be28f2010-09-06 20:08:02 +00001012 // If all of these were an outright failure, report it in a useless way.
1013 // FIXME: We should give nicer diagnostics about the exact failure.
Chris Lattner628fbec2010-09-06 21:54:15 +00001014 Error(IDLoc, "unknown use of instruction mnemonic without a size suffix");
Daniel Dunbar9b816a12010-05-04 16:12:42 +00001015 return true;
1016}
1017
1018
Sean Callanan5051cb82010-01-23 02:43:15 +00001019extern "C" void LLVMInitializeX86AsmLexer();
1020
Daniel Dunbar71475772009-07-17 20:42:00 +00001021// Force static initialization.
1022extern "C" void LLVMInitializeX86AsmParser() {
Daniel Dunbar63ec0932010-03-18 20:06:02 +00001023 RegisterAsmParser<X86_32ATTAsmParser> X(TheX86_32Target);
1024 RegisterAsmParser<X86_64ATTAsmParser> Y(TheX86_64Target);
Sean Callanan5051cb82010-01-23 02:43:15 +00001025 LLVMInitializeX86AsmLexer();
Daniel Dunbar71475772009-07-17 20:42:00 +00001026}
Daniel Dunbar00331992009-07-29 00:02:19 +00001027
Chris Lattner3e4582a2010-09-06 19:11:01 +00001028#define GET_REGISTER_MATCHER
1029#define GET_MATCHER_IMPLEMENTATION
Daniel Dunbar00331992009-07-29 00:02:19 +00001030#include "X86GenAsmMatcher.inc"