blob: 26797ab353b62b9de61adabc38bd4b05376587ef [file] [log] [blame]
Sean Callanane88f5522010-01-23 02:43:15 +00001//===-- X86AsmLexer.cpp - Tokenize X86 assembly to AsmTokens --------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Sean Callanancf2e3d12010-01-26 00:08:25 +000010#include "llvm/ADT/SmallVector.h"
Sean Callanan7dcef4c2010-01-26 01:00:10 +000011#include "llvm/ADT/StringExtras.h"
Sean Callanane88f5522010-01-23 02:43:15 +000012#include "llvm/Target/TargetAsmLexer.h"
13#include "llvm/Target/TargetRegistry.h"
Sean Callanan436c4842010-01-25 21:59:20 +000014#include "llvm/MC/MCAsmInfo.h"
Sean Callanane88f5522010-01-23 02:43:15 +000015#include "llvm/MC/MCParser/MCAsmLexer.h"
16#include "llvm/MC/MCParser/MCParsedAsmOperand.h"
17#include "X86.h"
18
19using namespace llvm;
20
21namespace {
22
23class X86AsmLexer : public TargetAsmLexer {
24 const MCAsmInfo &AsmInfo;
Sean Callanancf2e3d12010-01-26 00:08:25 +000025
26 bool tentativeIsValid;
27 AsmToken tentativeToken;
28
29 const AsmToken &lexTentative() {
Sean Callanan894c1af2010-01-31 02:28:18 +000030 tentativeToken = getLexer()->Lex();
Sean Callanancf2e3d12010-01-26 00:08:25 +000031 tentativeIsValid = true;
32 return tentativeToken;
33 }
34
35 const AsmToken &lexDefinite() {
Chris Lattneradabe1a2010-06-24 07:18:14 +000036 if (tentativeIsValid) {
Sean Callanancf2e3d12010-01-26 00:08:25 +000037 tentativeIsValid = false;
38 return tentativeToken;
39 }
Chris Lattneradabe1a2010-06-24 07:18:14 +000040 return getLexer()->Lex();
Sean Callanancf2e3d12010-01-26 00:08:25 +000041 }
Sean Callanan436c4842010-01-25 21:59:20 +000042
43 AsmToken LexTokenATT();
44 AsmToken LexTokenIntel();
Sean Callanane88f5522010-01-23 02:43:15 +000045protected:
Sean Callanan436c4842010-01-25 21:59:20 +000046 AsmToken LexToken() {
Sean Callanancf2e3d12010-01-26 00:08:25 +000047 if (!Lexer) {
48 SetError(SMLoc(), "No MCAsmLexer installed");
49 return AsmToken(AsmToken::Error, "", 0);
50 }
51
Sean Callanan436c4842010-01-25 21:59:20 +000052 switch (AsmInfo.getAssemblerDialect()) {
53 default:
54 SetError(SMLoc(), "Unhandled dialect");
55 return AsmToken(AsmToken::Error, "", 0);
56 case 0:
57 return LexTokenATT();
58 case 1:
59 return LexTokenIntel();
60 }
61 }
Sean Callanane88f5522010-01-23 02:43:15 +000062public:
63 X86AsmLexer(const Target &T, const MCAsmInfo &MAI)
Sean Callanan894c1af2010-01-31 02:28:18 +000064 : TargetAsmLexer(T), AsmInfo(MAI), tentativeIsValid(false) {
Sean Callanane88f5522010-01-23 02:43:15 +000065 }
66};
67
68}
69
Chris Lattnerb8d6e982010-02-09 00:34:28 +000070static unsigned MatchRegisterName(StringRef Name);
Sean Callanancf2e3d12010-01-26 00:08:25 +000071
Sean Callanan436c4842010-01-25 21:59:20 +000072AsmToken X86AsmLexer::LexTokenATT() {
Chris Lattneradabe1a2010-06-24 07:18:14 +000073 AsmToken lexedToken = lexDefinite();
Sean Callanancf2e3d12010-01-26 00:08:25 +000074
75 switch (lexedToken.getKind()) {
76 default:
Chris Lattneradabe1a2010-06-24 07:18:14 +000077 return lexedToken;
Sean Callanancf2e3d12010-01-26 00:08:25 +000078 case AsmToken::Error:
79 SetError(Lexer->getErrLoc(), Lexer->getErr());
Chris Lattneradabe1a2010-06-24 07:18:14 +000080 return lexedToken;
81
82 case AsmToken::Percent: {
Sean Callanancf2e3d12010-01-26 00:08:25 +000083 const AsmToken &nextToken = lexTentative();
Chris Lattner02758a42010-06-24 07:16:25 +000084 if (nextToken.getKind() != AsmToken::Identifier)
Chris Lattneradabe1a2010-06-24 07:18:14 +000085 return lexedToken;
Chris Lattner02758a42010-06-24 07:16:25 +000086
87
88 if (unsigned regID = MatchRegisterName(nextToken.getString())) {
89 lexDefinite();
90
Chris Lattner645b2092010-06-24 07:29:18 +000091 // FIXME: This is completely wrong when there is a space or other
92 // punctuation between the % and the register name.
Chris Lattner02758a42010-06-24 07:16:25 +000093 StringRef regStr(lexedToken.getString().data(),
94 lexedToken.getString().size() +
95 nextToken.getString().size());
96
Chris Lattneradabe1a2010-06-24 07:18:14 +000097 return AsmToken(AsmToken::Register, regStr,
Chris Lattner02758a42010-06-24 07:16:25 +000098 static_cast<int64_t>(regID));
Sean Callanancf2e3d12010-01-26 00:08:25 +000099 }
Chris Lattner02758a42010-06-24 07:16:25 +0000100
Chris Lattner645b2092010-06-24 07:29:18 +0000101 // Match register name failed. If this is "db[0-7]", match it as an alias
102 // for dr[0-7].
103 if (nextToken.getString().size() == 3 &&
104 nextToken.getString().startswith("db")) {
105 int RegNo = -1;
106 switch (nextToken.getString()[2]) {
107 case '0': RegNo = X86::DR0; break;
108 case '1': RegNo = X86::DR1; break;
109 case '2': RegNo = X86::DR2; break;
110 case '3': RegNo = X86::DR3; break;
111 case '4': RegNo = X86::DR4; break;
112 case '5': RegNo = X86::DR5; break;
113 case '6': RegNo = X86::DR6; break;
114 case '7': RegNo = X86::DR7; break;
115 }
116
117 if (RegNo != -1) {
118 lexDefinite();
119
120 // FIXME: This is completely wrong when there is a space or other
121 // punctuation between the % and the register name.
122 StringRef regStr(lexedToken.getString().data(),
123 lexedToken.getString().size() +
124 nextToken.getString().size());
125 return AsmToken(AsmToken::Register, regStr,
126 static_cast<int64_t>(RegNo));
127 }
128 }
129
130
Chris Lattneradabe1a2010-06-24 07:18:14 +0000131 return lexedToken;
Sean Callanancf2e3d12010-01-26 00:08:25 +0000132 }
133 }
Sean Callanan436c4842010-01-25 21:59:20 +0000134}
135
136AsmToken X86AsmLexer::LexTokenIntel() {
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000137 const AsmToken &lexedToken = lexDefinite();
138
139 switch(lexedToken.getKind()) {
140 default:
Chris Lattneradabe1a2010-06-24 07:18:14 +0000141 return lexedToken;
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000142 case AsmToken::Error:
143 SetError(Lexer->getErrLoc(), Lexer->getErr());
Chris Lattneradabe1a2010-06-24 07:18:14 +0000144 return lexedToken;
145 case AsmToken::Identifier: {
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000146 std::string upperCase = lexedToken.getString().str();
147 std::string lowerCase = LowercaseString(upperCase);
148 StringRef lowerRef(lowerCase);
149
150 unsigned regID = MatchRegisterName(lowerRef);
151
Chris Lattneradabe1a2010-06-24 07:18:14 +0000152 if (regID)
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000153 return AsmToken(AsmToken::Register,
154 lexedToken.getString(),
155 static_cast<int64_t>(regID));
Chris Lattneradabe1a2010-06-24 07:18:14 +0000156 return lexedToken;
Sean Callanan7dcef4c2010-01-26 01:00:10 +0000157 }
158 }
Sean Callanane88f5522010-01-23 02:43:15 +0000159}
160
161extern "C" void LLVMInitializeX86AsmLexer() {
162 RegisterAsmLexer<X86AsmLexer> X(TheX86_32Target);
163 RegisterAsmLexer<X86AsmLexer> Y(TheX86_64Target);
164}
165
Sean Callanancf2e3d12010-01-26 00:08:25 +0000166#define REGISTERS_ONLY
Daniel Dunbarc690aab2010-01-26 03:56:22 +0000167#include "X86GenAsmMatcher.inc"
Sean Callanancf2e3d12010-01-26 00:08:25 +0000168#undef REGISTERS_ONLY