//===-- X86AsmLexer.cpp - Tokenize X86 assembly to AsmTokens --------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//

#include "MCTargetDesc/X86BaseInfo.h"
#include "llvm/MC/MCAsmInfo.h"
#include "llvm/MC/MCParser/MCAsmLexer.h"
#include "llvm/MC/MCParser/MCParsedAsmOperand.h"
#include "llvm/MC/MCTargetAsmLexer.h"
#include "llvm/Target/TargetRegistry.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/StringExtras.h"
#include <cassert>

using namespace llvm;

21namespace {
22
Evan Cheng11424442011-07-26 00:24:13 +000023class X86AsmLexer : public MCTargetAsmLexer {
Sean Callanan5051cb82010-01-23 02:43:15 +000024 const MCAsmInfo &AsmInfo;
Sean Callananad857fc2010-01-26 00:08:25 +000025
26 bool tentativeIsValid;
27 AsmToken tentativeToken;
28
29 const AsmToken &lexTentative() {
Sean Callanan9aeccad2010-01-31 02:28:18 +000030 tentativeToken = getLexer()->Lex();
Sean Callananad857fc2010-01-26 00:08:25 +000031 tentativeIsValid = true;
32 return tentativeToken;
33 }
34
35 const AsmToken &lexDefinite() {
Chris Lattnerc4e84302010-06-24 07:18:14 +000036 if (tentativeIsValid) {
Sean Callananad857fc2010-01-26 00:08:25 +000037 tentativeIsValid = false;
38 return tentativeToken;
39 }
Chris Lattnerc4e84302010-06-24 07:18:14 +000040 return getLexer()->Lex();
Sean Callananad857fc2010-01-26 00:08:25 +000041 }
Sean Callanan66549312010-01-25 21:59:20 +000042
43 AsmToken LexTokenATT();
44 AsmToken LexTokenIntel();
Sean Callanan5051cb82010-01-23 02:43:15 +000045protected:
Sean Callanan66549312010-01-25 21:59:20 +000046 AsmToken LexToken() {
Sean Callananad857fc2010-01-26 00:08:25 +000047 if (!Lexer) {
48 SetError(SMLoc(), "No MCAsmLexer installed");
49 return AsmToken(AsmToken::Error, "", 0);
50 }
51
Sean Callanan66549312010-01-25 21:59:20 +000052 switch (AsmInfo.getAssemblerDialect()) {
53 default:
54 SetError(SMLoc(), "Unhandled dialect");
55 return AsmToken(AsmToken::Error, "", 0);
56 case 0:
57 return LexTokenATT();
58 case 1:
59 return LexTokenIntel();
60 }
61 }
Sean Callanan5051cb82010-01-23 02:43:15 +000062public:
Evan Chengf60768a2011-07-25 20:53:02 +000063 X86AsmLexer(const Target &T, const MCRegisterInfo &MRI, const MCAsmInfo &MAI)
Evan Cheng11424442011-07-26 00:24:13 +000064 : MCTargetAsmLexer(T), AsmInfo(MAI), tentativeIsValid(false) {
Sean Callanan5051cb82010-01-23 02:43:15 +000065 }
66};
67
Chris Lattner3e4582a2010-09-06 19:11:01 +000068} // end anonymous namespace
Sean Callanan5051cb82010-01-23 02:43:15 +000069
Chris Lattner3e4582a2010-09-06 19:11:01 +000070#define GET_REGISTER_MATCHER
71#include "X86GenAsmMatcher.inc"
Sean Callananad857fc2010-01-26 00:08:25 +000072
Sean Callanan66549312010-01-25 21:59:20 +000073AsmToken X86AsmLexer::LexTokenATT() {
Chris Lattnerc4e84302010-06-24 07:18:14 +000074 AsmToken lexedToken = lexDefinite();
Sean Callananad857fc2010-01-26 00:08:25 +000075
76 switch (lexedToken.getKind()) {
77 default:
Chris Lattnerc4e84302010-06-24 07:18:14 +000078 return lexedToken;
Sean Callananad857fc2010-01-26 00:08:25 +000079 case AsmToken::Error:
80 SetError(Lexer->getErrLoc(), Lexer->getErr());
Chris Lattnerc4e84302010-06-24 07:18:14 +000081 return lexedToken;
82
83 case AsmToken::Percent: {
Sean Callananad857fc2010-01-26 00:08:25 +000084 const AsmToken &nextToken = lexTentative();
Chris Lattner056fd062010-06-24 07:16:25 +000085 if (nextToken.getKind() != AsmToken::Identifier)
Chris Lattnerc4e84302010-06-24 07:18:14 +000086 return lexedToken;
Chris Lattner056fd062010-06-24 07:16:25 +000087
88
89 if (unsigned regID = MatchRegisterName(nextToken.getString())) {
90 lexDefinite();
91
Chris Lattner80486622010-06-24 07:29:18 +000092 // FIXME: This is completely wrong when there is a space or other
93 // punctuation between the % and the register name.
Chris Lattner056fd062010-06-24 07:16:25 +000094 StringRef regStr(lexedToken.getString().data(),
95 lexedToken.getString().size() +
96 nextToken.getString().size());
97
Chris Lattnerc4e84302010-06-24 07:18:14 +000098 return AsmToken(AsmToken::Register, regStr,
Chris Lattner056fd062010-06-24 07:16:25 +000099 static_cast<int64_t>(regID));
Sean Callananad857fc2010-01-26 00:08:25 +0000100 }
Chris Lattner056fd062010-06-24 07:16:25 +0000101
Chris Lattner80486622010-06-24 07:29:18 +0000102 // Match register name failed. If this is "db[0-7]", match it as an alias
103 // for dr[0-7].
104 if (nextToken.getString().size() == 3 &&
105 nextToken.getString().startswith("db")) {
106 int RegNo = -1;
107 switch (nextToken.getString()[2]) {
108 case '0': RegNo = X86::DR0; break;
109 case '1': RegNo = X86::DR1; break;
110 case '2': RegNo = X86::DR2; break;
111 case '3': RegNo = X86::DR3; break;
112 case '4': RegNo = X86::DR4; break;
113 case '5': RegNo = X86::DR5; break;
114 case '6': RegNo = X86::DR6; break;
115 case '7': RegNo = X86::DR7; break;
116 }
117
118 if (RegNo != -1) {
119 lexDefinite();
120
121 // FIXME: This is completely wrong when there is a space or other
122 // punctuation between the % and the register name.
123 StringRef regStr(lexedToken.getString().data(),
124 lexedToken.getString().size() +
125 nextToken.getString().size());
126 return AsmToken(AsmToken::Register, regStr,
127 static_cast<int64_t>(RegNo));
128 }
129 }
130
131
Chris Lattnerc4e84302010-06-24 07:18:14 +0000132 return lexedToken;
Sean Callananad857fc2010-01-26 00:08:25 +0000133 }
134 }
Sean Callanan66549312010-01-25 21:59:20 +0000135}
136
137AsmToken X86AsmLexer::LexTokenIntel() {
Sean Callananeb182e92010-01-26 01:00:10 +0000138 const AsmToken &lexedToken = lexDefinite();
139
140 switch(lexedToken.getKind()) {
141 default:
Chris Lattnerc4e84302010-06-24 07:18:14 +0000142 return lexedToken;
Sean Callananeb182e92010-01-26 01:00:10 +0000143 case AsmToken::Error:
144 SetError(Lexer->getErrLoc(), Lexer->getErr());
Chris Lattnerc4e84302010-06-24 07:18:14 +0000145 return lexedToken;
146 case AsmToken::Identifier: {
Sean Callananeb182e92010-01-26 01:00:10 +0000147 std::string upperCase = lexedToken.getString().str();
148 std::string lowerCase = LowercaseString(upperCase);
149 StringRef lowerRef(lowerCase);
150
151 unsigned regID = MatchRegisterName(lowerRef);
152
Chris Lattnerc4e84302010-06-24 07:18:14 +0000153 if (regID)
Sean Callananeb182e92010-01-26 01:00:10 +0000154 return AsmToken(AsmToken::Register,
155 lexedToken.getString(),
156 static_cast<int64_t>(regID));
Chris Lattnerc4e84302010-06-24 07:18:14 +0000157 return lexedToken;
Sean Callananeb182e92010-01-26 01:00:10 +0000158 }
159 }
Sean Callanan5051cb82010-01-23 02:43:15 +0000160}
161
162extern "C" void LLVMInitializeX86AsmLexer() {
Evan Cheng11424442011-07-26 00:24:13 +0000163 RegisterMCAsmLexer<X86AsmLexer> X(TheX86_32Target);
164 RegisterMCAsmLexer<X86AsmLexer> Y(TheX86_64Target);
Sean Callanan5051cb82010-01-23 02:43:15 +0000165}