blob: ec73087a3305f67ecf4ddf30f5da3905bacc8f59 [file] [log] [blame]
//===-- X86AsmLexer.cpp - Tokenize X86 assembly to AsmTokens --------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
9
Sean Callanancf2e3d12010-01-26 00:08:25 +000010#include "llvm/ADT/SmallVector.h"
Sean Callanan7dcef4c2010-01-26 01:00:10 +000011#include "llvm/ADT/StringExtras.h"
Sean Callanane88f5522010-01-23 02:43:15 +000012#include "llvm/Target/TargetAsmLexer.h"
13#include "llvm/Target/TargetRegistry.h"
Sean Callanan436c4842010-01-25 21:59:20 +000014#include "llvm/MC/MCAsmInfo.h"
Sean Callanane88f5522010-01-23 02:43:15 +000015#include "llvm/MC/MCParser/MCAsmLexer.h"
16#include "llvm/MC/MCParser/MCParsedAsmOperand.h"
17#include "X86.h"
18
19using namespace llvm;
20
21namespace {
22
23class X86AsmLexer : public TargetAsmLexer {
24 const MCAsmInfo &AsmInfo;
Sean Callanancf2e3d12010-01-26 00:08:25 +000025
26 bool tentativeIsValid;
27 AsmToken tentativeToken;
28
29 const AsmToken &lexTentative() {
Sean Callanan894c1af2010-01-31 02:28:18 +000030 tentativeToken = getLexer()->Lex();
Sean Callanancf2e3d12010-01-26 00:08:25 +000031 tentativeIsValid = true;
32 return tentativeToken;
33 }
34
35 const AsmToken &lexDefinite() {
Chris Lattneradabe1a2010-06-24 07:18:14 +000036 if (tentativeIsValid) {
Sean Callanancf2e3d12010-01-26 00:08:25 +000037 tentativeIsValid = false;
38 return tentativeToken;
39 }
Chris Lattneradabe1a2010-06-24 07:18:14 +000040 return getLexer()->Lex();
Sean Callanancf2e3d12010-01-26 00:08:25 +000041 }
Sean Callanan436c4842010-01-25 21:59:20 +000042
43 AsmToken LexTokenATT();
44 AsmToken LexTokenIntel();
Sean Callanane88f5522010-01-23 02:43:15 +000045protected:
Sean Callanan436c4842010-01-25 21:59:20 +000046 AsmToken LexToken() {
Sean Callanancf2e3d12010-01-26 00:08:25 +000047 if (!Lexer) {
48 SetError(SMLoc(), "No MCAsmLexer installed");
49 return AsmToken(AsmToken::Error, "", 0);
50 }
51
Sean Callanan436c4842010-01-25 21:59:20 +000052 switch (AsmInfo.getAssemblerDialect()) {
53 default:
54 SetError(SMLoc(), "Unhandled dialect");
55 return AsmToken(AsmToken::Error, "", 0);
56 case 0:
57 return LexTokenATT();
58 case 1:
59 return LexTokenIntel();
60 }
61 }
Sean Callanane88f5522010-01-23 02:43:15 +000062public:
63 X86AsmLexer(const Target &T, const MCAsmInfo &MAI)
Sean Callanan894c1af2010-01-31 02:28:18 +000064 : TargetAsmLexer(T), AsmInfo(MAI), tentativeIsValid(false) {
Sean Callanane88f5522010-01-23 02:43:15 +000065 }
66};
67
Chris Lattner0692ee62010-09-06 19:11:01 +000068} // end anonymous namespace
Sean Callanane88f5522010-01-23 02:43:15 +000069
Chris Lattner0692ee62010-09-06 19:11:01 +000070#define GET_REGISTER_MATCHER
71#include "X86GenAsmMatcher.inc"
Sean Callanancf2e3d12010-01-26 00:08:25 +000072
Sean Callanan436c4842010-01-25 21:59:20 +000073AsmToken X86AsmLexer::LexTokenATT() {
Chris Lattneradabe1a2010-06-24 07:18:14 +000074 AsmToken lexedToken = lexDefinite();
Sean Callanancf2e3d12010-01-26 00:08:25 +000075
76 switch (lexedToken.getKind()) {
77 default:
Chris Lattneradabe1a2010-06-24 07:18:14 +000078 return lexedToken;
Sean Callanancf2e3d12010-01-26 00:08:25 +000079 case AsmToken::Error:
80 SetError(Lexer->getErrLoc(), Lexer->getErr());
Chris Lattneradabe1a2010-06-24 07:18:14 +000081 return lexedToken;
82
83 case AsmToken::Percent: {
Sean Callanancf2e3d12010-01-26 00:08:25 +000084 const AsmToken &nextToken = lexTentative();
Chris Lattner02758a42010-06-24 07:16:25 +000085 if (nextToken.getKind() != AsmToken::Identifier)
Chris Lattneradabe1a2010-06-24 07:18:14 +000086 return lexedToken;
Chris Lattner02758a42010-06-24 07:16:25 +000087
88
89 if (unsigned regID = MatchRegisterName(nextToken.getString())) {
90 lexDefinite();
91
Chris Lattner645b2092010-06-24 07:29:18 +000092 // FIXME: This is completely wrong when there is a space or other
93 // punctuation between the % and the register name.
Chris Lattner02758a42010-06-24 07:16:25 +000094 StringRef regStr(lexedToken.getString().data(),
95 lexedToken.getString().size() +
96 nextToken.getString().size());
97
Chris Lattneradabe1a2010-06-24 07:18:14 +000098 return AsmToken(AsmToken::Register, regStr,
Chris Lattner02758a42010-06-24 07:16:25 +000099 static_cast<int64_t>(regID));
Sean Callanancf2e3d12010-01-26 00:08:25 +0000100 }
Chris Lattner02758a42010-06-24 07:16:25 +0000101
Chris Lattner645b2092010-06-24 07:29:18 +0000102 // Match register name failed. If this is "db[0-7]", match it as an alias
103 // for dr[0-7].
104 if (nextToken.getString().size() == 3 &&
105 nextToken.getString().startswith("db")) {
106 int RegNo = -1;
107 switch (nextToken.getString()[2]) {
108 case '0': RegNo = X86::DR0; break;
109 case '1': RegNo = X86::DR1; break;
110 case '2': RegNo = X86::DR2; break;
111 case '3': RegNo = X86::DR3; break;
112 case '4': RegNo = X86::DR4; break;
113 case '5': RegNo = X86::DR5; break;
114 case '6': RegNo = X86::DR6; break;
115 case '7': RegNo = X86::DR7; break;
116 }
117
118 if (RegNo != -1) {
119 lexDefinite();
120
121 // FIXME: This is completely wrong when there is a space or other
122 // punctuation between the % and the register name.
123 StringRef regStr(lexedToken.getString().data(),
124 lexedToken.getString().size() +
125 nextToken.getString().size());
126 return AsmToken(AsmToken::Register, regStr,
127 static_cast<int64_t>(RegNo));
128 }
129 }
130
131
Chris Lattneradabe1a2010-06-24 07:18:14 +0000132 return lexedToken;
Sean Callanancf2e3d12010-01-26 00:08:25 +0000133 }
134 }
Sean Callanan436c4842010-01-25 21:59:20 +0000135}
136
137AsmToken X86AsmLexer::LexTokenIntel() {
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000138 const AsmToken &lexedToken = lexDefinite();
139
140 switch(lexedToken.getKind()) {
141 default:
Chris Lattneradabe1a2010-06-24 07:18:14 +0000142 return lexedToken;
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000143 case AsmToken::Error:
144 SetError(Lexer->getErrLoc(), Lexer->getErr());
Chris Lattneradabe1a2010-06-24 07:18:14 +0000145 return lexedToken;
146 case AsmToken::Identifier: {
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000147 std::string upperCase = lexedToken.getString().str();
148 std::string lowerCase = LowercaseString(upperCase);
149 StringRef lowerRef(lowerCase);
150
151 unsigned regID = MatchRegisterName(lowerRef);
152
Chris Lattneradabe1a2010-06-24 07:18:14 +0000153 if (regID)
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000154 return AsmToken(AsmToken::Register,
155 lexedToken.getString(),
156 static_cast<int64_t>(regID));
Chris Lattneradabe1a2010-06-24 07:18:14 +0000157 return lexedToken;
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000158 }
159 }
Sean Callanane88f5522010-01-23 02:43:15 +0000160}
161
162extern "C" void LLVMInitializeX86AsmLexer() {
163 RegisterAsmLexer<X86AsmLexer> X(TheX86_32Target);
164 RegisterAsmLexer<X86AsmLexer> Y(TheX86_64Target);
165}