blob: 741c5381fc78a3511fdb130de2fb96e38f5daca5 [file] [log] [blame]
Chris Lattner8e3a8e02007-11-18 08:46:26 +00001//===- LLLexer.cpp - Lexer for .ll Files ----------------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattner8e3a8e02007-11-18 08:46:26 +00007//
8//===----------------------------------------------------------------------===//
9//
10// Implement the Lexer for .ll files.
11//
12//===----------------------------------------------------------------------===//
13
14#include "LLLexer.h"
Chris Lattnerdf986172009-01-02 07:01:27 +000015#include "llvm/DerivedTypes.h"
16#include "llvm/Instruction.h"
Chris Lattner8e3a8e02007-11-18 08:46:26 +000017#include "llvm/Support/MemoryBuffer.h"
Chris Lattnerd185f642007-12-08 19:03:30 +000018#include "llvm/Support/MathExtras.h"
Chris Lattner92bcb422009-07-02 22:46:18 +000019#include "llvm/Support/SourceMgr.h"
Chris Lattnerdf986172009-01-02 07:01:27 +000020#include "llvm/Support/raw_ostream.h"
21#include "llvm/Assembly/Parser.h"
Chris Lattnera8961762009-01-02 07:18:46 +000022#include <cstdlib>
Misha Brukman5679d182009-01-02 22:49:28 +000023#include <cstring>
Chris Lattner8e3a8e02007-11-18 08:46:26 +000024using namespace llvm;
25
Chris Lattnerdf986172009-01-02 07:01:27 +000026bool LLLexer::Error(LocTy ErrorLoc, const std::string &Msg) const {
Chris Lattnereeb4a842009-07-02 23:08:13 +000027 ErrorInfo = SM.GetMessage(ErrorLoc, Msg, "error");
Chris Lattnerdf986172009-01-02 07:01:27 +000028 return true;
29}
30
Chris Lattner8e3a8e02007-11-18 08:46:26 +000031//===----------------------------------------------------------------------===//
32// Helper functions.
33//===----------------------------------------------------------------------===//
34
35// atoull - Convert an ascii string of decimal digits into the unsigned long
36// long representation... this does not have to do input error checking,
37// because we know that the input will be matched by a suitable regex...
38//
Chris Lattnerdf986172009-01-02 07:01:27 +000039uint64_t LLLexer::atoull(const char *Buffer, const char *End) {
Chris Lattner8e3a8e02007-11-18 08:46:26 +000040 uint64_t Result = 0;
41 for (; Buffer != End; Buffer++) {
42 uint64_t OldRes = Result;
43 Result *= 10;
44 Result += *Buffer-'0';
45 if (Result < OldRes) { // Uh, oh, overflow detected!!!
Chris Lattnerdf986172009-01-02 07:01:27 +000046 Error("constant bigger than 64 bits detected!");
Chris Lattner8e3a8e02007-11-18 08:46:26 +000047 return 0;
48 }
49 }
50 return Result;
51}
52
Chris Lattnerdf986172009-01-02 07:01:27 +000053uint64_t LLLexer::HexIntToVal(const char *Buffer, const char *End) {
Chris Lattner8e3a8e02007-11-18 08:46:26 +000054 uint64_t Result = 0;
55 for (; Buffer != End; ++Buffer) {
56 uint64_t OldRes = Result;
57 Result *= 16;
58 char C = *Buffer;
59 if (C >= '0' && C <= '9')
60 Result += C-'0';
61 else if (C >= 'A' && C <= 'F')
62 Result += C-'A'+10;
63 else if (C >= 'a' && C <= 'f')
64 Result += C-'a'+10;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +000065
Chris Lattner8e3a8e02007-11-18 08:46:26 +000066 if (Result < OldRes) { // Uh, oh, overflow detected!!!
Chris Lattnerdf986172009-01-02 07:01:27 +000067 Error("constant bigger than 64 bits detected!");
Chris Lattner8e3a8e02007-11-18 08:46:26 +000068 return 0;
69 }
70 }
71 return Result;
72}
73
Chris Lattnerdf986172009-01-02 07:01:27 +000074void LLLexer::HexToIntPair(const char *Buffer, const char *End,
75 uint64_t Pair[2]) {
Chris Lattner8e3a8e02007-11-18 08:46:26 +000076 Pair[0] = 0;
77 for (int i=0; i<16; i++, Buffer++) {
78 assert(Buffer != End);
79 Pair[0] *= 16;
80 char C = *Buffer;
81 if (C >= '0' && C <= '9')
82 Pair[0] += C-'0';
83 else if (C >= 'A' && C <= 'F')
84 Pair[0] += C-'A'+10;
85 else if (C >= 'a' && C <= 'f')
86 Pair[0] += C-'a'+10;
87 }
88 Pair[1] = 0;
89 for (int i=0; i<16 && Buffer != End; i++, Buffer++) {
90 Pair[1] *= 16;
91 char C = *Buffer;
92 if (C >= '0' && C <= '9')
93 Pair[1] += C-'0';
94 else if (C >= 'A' && C <= 'F')
95 Pair[1] += C-'A'+10;
96 else if (C >= 'a' && C <= 'f')
97 Pair[1] += C-'a'+10;
98 }
Chris Lattnerd343c6b2007-11-18 18:25:18 +000099 if (Buffer != End)
Chris Lattnerdf986172009-01-02 07:01:27 +0000100 Error("constant bigger than 128 bits detected!");
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000101}
102
Dale Johannesen1b25cb22009-03-23 21:16:53 +0000103/// FP80HexToIntPair - translate an 80 bit FP80 number (20 hexits) into
104/// { low64, high16 } as usual for an APInt.
105void LLLexer::FP80HexToIntPair(const char *Buffer, const char *End,
106 uint64_t Pair[2]) {
107 Pair[1] = 0;
108 for (int i=0; i<4 && Buffer != End; i++, Buffer++) {
109 assert(Buffer != End);
110 Pair[1] *= 16;
111 char C = *Buffer;
112 if (C >= '0' && C <= '9')
113 Pair[1] += C-'0';
114 else if (C >= 'A' && C <= 'F')
115 Pair[1] += C-'A'+10;
116 else if (C >= 'a' && C <= 'f')
117 Pair[1] += C-'a'+10;
118 }
119 Pair[0] = 0;
120 for (int i=0; i<16; i++, Buffer++) {
121 Pair[0] *= 16;
122 char C = *Buffer;
123 if (C >= '0' && C <= '9')
124 Pair[0] += C-'0';
125 else if (C >= 'A' && C <= 'F')
126 Pair[0] += C-'A'+10;
127 else if (C >= 'a' && C <= 'f')
128 Pair[0] += C-'a'+10;
129 }
130 if (Buffer != End)
131 Error("constant bigger than 128 bits detected!");
132}
133
// UnEscapeLexed - Rewrite Str in place, turning "\\" into a single backslash
// and "\xx" (two hexadecimal digits) into the character with that code.  A
// backslash followed by anything else is copied through unchanged.  The string
// is shrunk to the unescaped length.
static void UnEscapeLexed(std::string &Str) {
  if (Str.empty()) return;

  const size_t Size = Str.size();
  size_t Out = 0;
  for (size_t In = 0; In != Size; ) {
    if (Str[In] == '\\') {
      // Number of characters available after the backslash.
      const size_t Left = Size - In - 1;

      if (Left >= 1 && Str[In+1] == '\\') {
        Str[Out++] = '\\';                    // Two \ becomes one
        In += 2;
        continue;
      }

      if (Left >= 2 &&
          isxdigit(static_cast<unsigned char>(Str[In+1])) &&
          isxdigit(static_cast<unsigned char>(Str[In+2]))) {
        // Decode the two hexits directly instead of temporarily patching a
        // terminator into the string, which could touch Str[size()].
        unsigned Val = 0;
        for (size_t i = 1; i <= 2; ++i) {
          const char C = Str[In+i];
          Val *= 16;
          if (C >= '0' && C <= '9')
            Val += C-'0';
          else if (C >= 'a' && C <= 'f')
            Val += C-'a'+10;
          else
            Val += C-'A'+10;
        }
        Str[Out++] = static_cast<char>(Val);
        In += 3;                              // Skip over handled chars
        continue;
      }
    }

    // Ordinary character, or a backslash that does not start an escape.
    Str[Out++] = Str[In++];
  }
  Str.resize(Out);
}
161
/// isLabelChar - Return true for [-a-zA-Z$._0-9].
static bool isLabelChar(char C) {
  // The <cctype> classifiers require a value representable as unsigned char
  // (or EOF); plain char may be negative, so convert first.
  return isalnum(static_cast<unsigned char>(C)) ||
         C == '-' || C == '$' || C == '.' || C == '_';
}
166
167
168/// isLabelTail - Return true if this pointer points to a valid end of a label.
169static const char *isLabelTail(const char *CurPtr) {
170 while (1) {
171 if (CurPtr[0] == ':') return CurPtr+1;
172 if (!isLabelChar(CurPtr[0])) return 0;
173 ++CurPtr;
174 }
175}
176
177
178
179//===----------------------------------------------------------------------===//
180// Lexer definition.
181//===----------------------------------------------------------------------===//
182
Chris Lattnereeb4a842009-07-02 23:08:13 +0000183LLLexer::LLLexer(MemoryBuffer *StartBuf, SourceMgr &sm, SMDiagnostic &Err)
184 : CurBuf(StartBuf), ErrorInfo(Err), SM(sm), APFloatVal(0.0) {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000185 CurPtr = CurBuf->getBufferStart();
186}
187
188std::string LLLexer::getFilename() const {
189 return CurBuf->getBufferIdentifier();
190}
191
192int LLLexer::getNextChar() {
193 char CurChar = *CurPtr++;
194 switch (CurChar) {
195 default: return (unsigned char)CurChar;
196 case 0:
197 // A nul character in the stream is either the end of the current buffer or
198 // a random nul in the file. Disambiguate that here.
199 if (CurPtr-1 != CurBuf->getBufferEnd())
200 return 0; // Just whitespace.
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000201
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000202 // Otherwise, return end of file.
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000203 --CurPtr; // Another call to lex will return EOF again.
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000204 return EOF;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000205 }
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000206}
207
208
Chris Lattnerdf986172009-01-02 07:01:27 +0000209lltok::Kind LLLexer::LexToken() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000210 TokStart = CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000211
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000212 int CurChar = getNextChar();
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000213 switch (CurChar) {
214 default:
215 // Handle letters: [a-zA-Z_]
216 if (isalpha(CurChar) || CurChar == '_')
217 return LexIdentifier();
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000218
Chris Lattnerdf986172009-01-02 07:01:27 +0000219 return lltok::Error;
220 case EOF: return lltok::Eof;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000221 case 0:
222 case ' ':
223 case '\t':
224 case '\n':
225 case '\r':
226 // Ignore whitespace.
227 return LexToken();
228 case '+': return LexPositive();
229 case '@': return LexAt();
230 case '%': return LexPercent();
231 case '"': return LexQuote();
232 case '.':
233 if (const char *Ptr = isLabelTail(CurPtr)) {
234 CurPtr = Ptr;
Chris Lattnerdf986172009-01-02 07:01:27 +0000235 StrVal.assign(TokStart, CurPtr-1);
236 return lltok::LabelStr;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000237 }
238 if (CurPtr[0] == '.' && CurPtr[1] == '.') {
239 CurPtr += 2;
Chris Lattnerdf986172009-01-02 07:01:27 +0000240 return lltok::dotdotdot;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000241 }
Chris Lattnerdf986172009-01-02 07:01:27 +0000242 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000243 case '$':
244 if (const char *Ptr = isLabelTail(CurPtr)) {
245 CurPtr = Ptr;
Chris Lattnerdf986172009-01-02 07:01:27 +0000246 StrVal.assign(TokStart, CurPtr-1);
247 return lltok::LabelStr;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000248 }
Chris Lattnerdf986172009-01-02 07:01:27 +0000249 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000250 case ';':
251 SkipLineComment();
252 return LexToken();
Nick Lewycky21cc4462009-04-04 07:22:01 +0000253 case '!': return lltok::Metadata;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000254 case '0': case '1': case '2': case '3': case '4':
255 case '5': case '6': case '7': case '8': case '9':
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000256 case '-':
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000257 return LexDigitOrNegative();
Chris Lattnerdf986172009-01-02 07:01:27 +0000258 case '=': return lltok::equal;
259 case '[': return lltok::lsquare;
260 case ']': return lltok::rsquare;
261 case '{': return lltok::lbrace;
262 case '}': return lltok::rbrace;
263 case '<': return lltok::less;
264 case '>': return lltok::greater;
265 case '(': return lltok::lparen;
266 case ')': return lltok::rparen;
267 case ',': return lltok::comma;
268 case '*': return lltok::star;
269 case '\\': return lltok::backslash;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000270 }
271}
272
273void LLLexer::SkipLineComment() {
274 while (1) {
275 if (CurPtr[0] == '\n' || CurPtr[0] == '\r' || getNextChar() == EOF)
276 return;
277 }
278}
279
280/// LexAt - Lex all tokens that start with an @ character:
Chris Lattnerdf986172009-01-02 07:01:27 +0000281/// GlobalVar @\"[^\"]*\"
282/// GlobalVar @[-a-zA-Z$._][-a-zA-Z$._0-9]*
283/// GlobalVarID @[0-9]+
284lltok::Kind LLLexer::LexAt() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000285 // Handle AtStringConstant: @\"[^\"]*\"
286 if (CurPtr[0] == '"') {
287 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000288
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000289 while (1) {
290 int CurChar = getNextChar();
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000291
292 if (CurChar == EOF) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000293 Error("end of file in global variable name");
294 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000295 }
296 if (CurChar == '"') {
Chris Lattnerdf986172009-01-02 07:01:27 +0000297 StrVal.assign(TokStart+2, CurPtr-1);
298 UnEscapeLexed(StrVal);
299 return lltok::GlobalVar;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000300 }
301 }
302 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000303
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000304 // Handle GlobalVarName: @[-a-zA-Z$._][-a-zA-Z$._0-9]*
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000305 if (isalpha(CurPtr[0]) || CurPtr[0] == '-' || CurPtr[0] == '$' ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000306 CurPtr[0] == '.' || CurPtr[0] == '_') {
307 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000308 while (isalnum(CurPtr[0]) || CurPtr[0] == '-' || CurPtr[0] == '$' ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000309 CurPtr[0] == '.' || CurPtr[0] == '_')
310 ++CurPtr;
311
Chris Lattnerdf986172009-01-02 07:01:27 +0000312 StrVal.assign(TokStart+1, CurPtr); // Skip @
313 return lltok::GlobalVar;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000314 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000315
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000316 // Handle GlobalVarID: @[0-9]+
317 if (isdigit(CurPtr[0])) {
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000318 for (++CurPtr; isdigit(CurPtr[0]); ++CurPtr)
319 /*empty*/;
320
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000321 uint64_t Val = atoull(TokStart+1, CurPtr);
322 if ((unsigned)Val != Val)
Chris Lattnerdf986172009-01-02 07:01:27 +0000323 Error("invalid value number (too large)!");
324 UIntVal = unsigned(Val);
325 return lltok::GlobalID;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000326 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000327
Chris Lattnerdf986172009-01-02 07:01:27 +0000328 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000329}
330
331
332/// LexPercent - Lex all tokens that start with a % character:
Chris Lattnerdf986172009-01-02 07:01:27 +0000333/// LocalVar ::= %\"[^\"]*\"
334/// LocalVar ::= %[-a-zA-Z$._][-a-zA-Z$._0-9]*
335/// LocalVarID ::= %[0-9]+
336lltok::Kind LLLexer::LexPercent() {
337 // Handle LocalVarName: %\"[^\"]*\"
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000338 if (CurPtr[0] == '"') {
339 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000340
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000341 while (1) {
342 int CurChar = getNextChar();
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000343
344 if (CurChar == EOF) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000345 Error("end of file in string constant");
346 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000347 }
348 if (CurChar == '"') {
Chris Lattnerdf986172009-01-02 07:01:27 +0000349 StrVal.assign(TokStart+2, CurPtr-1);
350 UnEscapeLexed(StrVal);
351 return lltok::LocalVar;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000352 }
353 }
354 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000355
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000356 // Handle LocalVarName: %[-a-zA-Z$._][-a-zA-Z$._0-9]*
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000357 if (isalpha(CurPtr[0]) || CurPtr[0] == '-' || CurPtr[0] == '$' ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000358 CurPtr[0] == '.' || CurPtr[0] == '_') {
359 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000360 while (isalnum(CurPtr[0]) || CurPtr[0] == '-' || CurPtr[0] == '$' ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000361 CurPtr[0] == '.' || CurPtr[0] == '_')
362 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000363
Chris Lattnerdf986172009-01-02 07:01:27 +0000364 StrVal.assign(TokStart+1, CurPtr); // Skip %
365 return lltok::LocalVar;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000366 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000367
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000368 // Handle LocalVarID: %[0-9]+
369 if (isdigit(CurPtr[0])) {
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000370 for (++CurPtr; isdigit(CurPtr[0]); ++CurPtr)
371 /*empty*/;
372
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000373 uint64_t Val = atoull(TokStart+1, CurPtr);
374 if ((unsigned)Val != Val)
Chris Lattnerdf986172009-01-02 07:01:27 +0000375 Error("invalid value number (too large)!");
376 UIntVal = unsigned(Val);
377 return lltok::LocalVarID;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000378 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000379
Chris Lattnerdf986172009-01-02 07:01:27 +0000380 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000381}
382
383/// LexQuote - Lex all tokens that start with a " character:
384/// QuoteLabel "[^"]+":
385/// StringConstant "[^"]*"
Chris Lattnerdf986172009-01-02 07:01:27 +0000386lltok::Kind LLLexer::LexQuote() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000387 while (1) {
388 int CurChar = getNextChar();
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000389
390 if (CurChar == EOF) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000391 Error("end of file in quoted string");
392 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000393 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000394
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000395 if (CurChar != '"') continue;
396
397 if (CurPtr[0] != ':') {
Chris Lattnerdf986172009-01-02 07:01:27 +0000398 StrVal.assign(TokStart+1, CurPtr-1);
399 UnEscapeLexed(StrVal);
400 return lltok::StringConstant;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000401 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000402
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000403 ++CurPtr;
Chris Lattnerdf986172009-01-02 07:01:27 +0000404 StrVal.assign(TokStart+1, CurPtr-2);
405 UnEscapeLexed(StrVal);
406 return lltok::LabelStr;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000407 }
408}
409
/// JustWhitespaceNewLine - Return true if only spaces and tabs separate Ptr
/// from the next '\n' or '\r'.  On success Ptr is advanced to that line
/// terminator; otherwise Ptr is left untouched.
static bool JustWhitespaceNewLine(const char *&Ptr) {
  const char *Scan = Ptr;
  for (; *Scan == ' ' || *Scan == '\t'; ++Scan)
    /*empty*/;

  if (*Scan != '\n' && *Scan != '\r')
    return false;

  Ptr = Scan;
  return true;
}
420
421
422/// LexIdentifier: Handle several related productions:
423/// Label [-a-zA-Z$._0-9]+:
424/// IntegerType i[0-9]+
425/// Keyword sdiv, float, ...
426/// HexIntConstant [us]0x[0-9A-Fa-f]+
Chris Lattnerdf986172009-01-02 07:01:27 +0000427lltok::Kind LLLexer::LexIdentifier() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000428 const char *StartChar = CurPtr;
429 const char *IntEnd = CurPtr[-1] == 'i' ? 0 : StartChar;
430 const char *KeywordEnd = 0;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000431
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000432 for (; isLabelChar(*CurPtr); ++CurPtr) {
433 // If we decide this is an integer, remember the end of the sequence.
434 if (!IntEnd && !isdigit(*CurPtr)) IntEnd = CurPtr;
435 if (!KeywordEnd && !isalnum(*CurPtr) && *CurPtr != '_') KeywordEnd = CurPtr;
436 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000437
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000438 // If we stopped due to a colon, this really is a label.
439 if (*CurPtr == ':') {
Chris Lattnerdf986172009-01-02 07:01:27 +0000440 StrVal.assign(StartChar-1, CurPtr++);
441 return lltok::LabelStr;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000442 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000443
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000444 // Otherwise, this wasn't a label. If this was valid as an integer type,
445 // return it.
446 if (IntEnd == 0) IntEnd = CurPtr;
447 if (IntEnd != StartChar) {
448 CurPtr = IntEnd;
449 uint64_t NumBits = atoull(StartChar, CurPtr);
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000450 if (NumBits < IntegerType::MIN_INT_BITS ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000451 NumBits > IntegerType::MAX_INT_BITS) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000452 Error("bitwidth for integer type out of range!");
453 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000454 }
Chris Lattnerdf986172009-01-02 07:01:27 +0000455 TyVal = IntegerType::get(NumBits);
456 return lltok::Type;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000457 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000458
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000459 // Otherwise, this was a letter sequence. See which keyword this is.
460 if (KeywordEnd == 0) KeywordEnd = CurPtr;
461 CurPtr = KeywordEnd;
462 --StartChar;
463 unsigned Len = CurPtr-StartChar;
Chris Lattnerdf986172009-01-02 07:01:27 +0000464#define KEYWORD(STR) \
465 if (Len == strlen(#STR) && !memcmp(StartChar, #STR, strlen(#STR))) \
466 return lltok::kw_##STR;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000467
Chris Lattnerdf986172009-01-02 07:01:27 +0000468 KEYWORD(begin); KEYWORD(end);
469 KEYWORD(true); KEYWORD(false);
470 KEYWORD(declare); KEYWORD(define);
471 KEYWORD(global); KEYWORD(constant);
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000472
Rafael Espindolabb46f522009-01-15 20:18:42 +0000473 KEYWORD(private);
Chris Lattnerdf986172009-01-02 07:01:27 +0000474 KEYWORD(internal);
Chris Lattner266c7bb2009-04-13 05:44:34 +0000475 KEYWORD(available_externally);
Chris Lattnerdf986172009-01-02 07:01:27 +0000476 KEYWORD(linkonce);
Duncan Sands667d4b82009-03-07 15:45:40 +0000477 KEYWORD(linkonce_odr);
Chris Lattnerdf986172009-01-02 07:01:27 +0000478 KEYWORD(weak);
Duncan Sands667d4b82009-03-07 15:45:40 +0000479 KEYWORD(weak_odr);
Chris Lattnerdf986172009-01-02 07:01:27 +0000480 KEYWORD(appending);
481 KEYWORD(dllimport);
482 KEYWORD(dllexport);
483 KEYWORD(common);
484 KEYWORD(default);
485 KEYWORD(hidden);
486 KEYWORD(protected);
487 KEYWORD(extern_weak);
488 KEYWORD(external);
489 KEYWORD(thread_local);
490 KEYWORD(zeroinitializer);
491 KEYWORD(undef);
492 KEYWORD(null);
493 KEYWORD(to);
494 KEYWORD(tail);
495 KEYWORD(target);
496 KEYWORD(triple);
497 KEYWORD(deplibs);
498 KEYWORD(datalayout);
499 KEYWORD(volatile);
500 KEYWORD(align);
501 KEYWORD(addrspace);
502 KEYWORD(section);
503 KEYWORD(alias);
504 KEYWORD(module);
505 KEYWORD(asm);
506 KEYWORD(sideeffect);
507 KEYWORD(gc);
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000508
Chris Lattnerdf986172009-01-02 07:01:27 +0000509 KEYWORD(ccc);
510 KEYWORD(fastcc);
511 KEYWORD(coldcc);
512 KEYWORD(x86_stdcallcc);
513 KEYWORD(x86_fastcallcc);
Anton Korobeynikov385f5a92009-06-16 18:50:49 +0000514 KEYWORD(arm_apcscc);
515 KEYWORD(arm_aapcscc);
516 KEYWORD(arm_aapcs_vfpcc);
517
Chris Lattnerdf986172009-01-02 07:01:27 +0000518 KEYWORD(cc);
519 KEYWORD(c);
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000520
Chris Lattnerdf986172009-01-02 07:01:27 +0000521 KEYWORD(signext);
522 KEYWORD(zeroext);
523 KEYWORD(inreg);
524 KEYWORD(sret);
525 KEYWORD(nounwind);
526 KEYWORD(noreturn);
527 KEYWORD(noalias);
528 KEYWORD(nocapture);
529 KEYWORD(byval);
530 KEYWORD(nest);
531 KEYWORD(readnone);
532 KEYWORD(readonly);
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000533
Chris Lattnerdf986172009-01-02 07:01:27 +0000534 KEYWORD(noinline);
535 KEYWORD(alwaysinline);
536 KEYWORD(optsize);
537 KEYWORD(ssp);
538 KEYWORD(sspreq);
Devang Pateld18e31a2009-06-04 22:05:33 +0000539 KEYWORD(noredzone);
Devang Patel578efa92009-06-05 21:57:13 +0000540 KEYWORD(noimplicitfloat);
Devang Pateld4980812008-09-02 20:52:40 +0000541
Chris Lattnerdf986172009-01-02 07:01:27 +0000542 KEYWORD(type);
543 KEYWORD(opaque);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000544
Chris Lattnerdf986172009-01-02 07:01:27 +0000545 KEYWORD(eq); KEYWORD(ne); KEYWORD(slt); KEYWORD(sgt); KEYWORD(sle);
546 KEYWORD(sge); KEYWORD(ult); KEYWORD(ugt); KEYWORD(ule); KEYWORD(uge);
547 KEYWORD(oeq); KEYWORD(one); KEYWORD(olt); KEYWORD(ogt); KEYWORD(ole);
548 KEYWORD(oge); KEYWORD(ord); KEYWORD(uno); KEYWORD(ueq); KEYWORD(une);
Misha Brukman9ea40342009-01-02 22:46:48 +0000549
Chris Lattnerdf986172009-01-02 07:01:27 +0000550 KEYWORD(x);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000551#undef KEYWORD
552
553 // Keywords for types.
Chris Lattnerdf986172009-01-02 07:01:27 +0000554#define TYPEKEYWORD(STR, LLVMTY) \
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000555 if (Len == strlen(STR) && !memcmp(StartChar, STR, strlen(STR))) { \
Chris Lattnerdf986172009-01-02 07:01:27 +0000556 TyVal = LLVMTY; return lltok::Type; }
557 TYPEKEYWORD("void", Type::VoidTy);
558 TYPEKEYWORD("float", Type::FloatTy);
559 TYPEKEYWORD("double", Type::DoubleTy);
560 TYPEKEYWORD("x86_fp80", Type::X86_FP80Ty);
561 TYPEKEYWORD("fp128", Type::FP128Ty);
562 TYPEKEYWORD("ppc_fp128", Type::PPC_FP128Ty);
563 TYPEKEYWORD("label", Type::LabelTy);
Nick Lewycky7a0370f2009-05-30 05:06:04 +0000564 TYPEKEYWORD("metadata", Type::MetadataTy);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000565#undef TYPEKEYWORD
566
567 // Handle special forms for autoupgrading. Drop these in LLVM 3.0. This is
568 // to avoid conflicting with the sext/zext instructions, below.
569 if (Len == 4 && !memcmp(StartChar, "sext", 4)) {
570 // Scan CurPtr ahead, seeing if there is just whitespace before the newline.
571 if (JustWhitespaceNewLine(CurPtr))
Chris Lattnerdf986172009-01-02 07:01:27 +0000572 return lltok::kw_signext;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000573 } else if (Len == 4 && !memcmp(StartChar, "zext", 4)) {
574 // Scan CurPtr ahead, seeing if there is just whitespace before the newline.
575 if (JustWhitespaceNewLine(CurPtr))
Chris Lattnerdf986172009-01-02 07:01:27 +0000576 return lltok::kw_zeroext;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000577 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000578
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000579 // Keywords for instructions.
Chris Lattnerdf986172009-01-02 07:01:27 +0000580#define INSTKEYWORD(STR, Enum) \
581 if (Len == strlen(#STR) && !memcmp(StartChar, #STR, strlen(#STR))) { \
582 UIntVal = Instruction::Enum; return lltok::kw_##STR; }
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000583
Dan Gohmanae3a0be2009-06-04 22:49:04 +0000584 INSTKEYWORD(add, Add); INSTKEYWORD(fadd, FAdd);
585 INSTKEYWORD(sub, Sub); INSTKEYWORD(fsub, FSub);
586 INSTKEYWORD(mul, Mul); INSTKEYWORD(fmul, FMul);
Chris Lattnerdf986172009-01-02 07:01:27 +0000587 INSTKEYWORD(udiv, UDiv); INSTKEYWORD(sdiv, SDiv); INSTKEYWORD(fdiv, FDiv);
588 INSTKEYWORD(urem, URem); INSTKEYWORD(srem, SRem); INSTKEYWORD(frem, FRem);
589 INSTKEYWORD(shl, Shl); INSTKEYWORD(lshr, LShr); INSTKEYWORD(ashr, AShr);
590 INSTKEYWORD(and, And); INSTKEYWORD(or, Or); INSTKEYWORD(xor, Xor);
591 INSTKEYWORD(icmp, ICmp); INSTKEYWORD(fcmp, FCmp);
592 INSTKEYWORD(vicmp, VICmp); INSTKEYWORD(vfcmp, VFCmp);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000593
Chris Lattnerdf986172009-01-02 07:01:27 +0000594 INSTKEYWORD(phi, PHI);
595 INSTKEYWORD(call, Call);
596 INSTKEYWORD(trunc, Trunc);
597 INSTKEYWORD(zext, ZExt);
598 INSTKEYWORD(sext, SExt);
599 INSTKEYWORD(fptrunc, FPTrunc);
600 INSTKEYWORD(fpext, FPExt);
601 INSTKEYWORD(uitofp, UIToFP);
602 INSTKEYWORD(sitofp, SIToFP);
603 INSTKEYWORD(fptoui, FPToUI);
604 INSTKEYWORD(fptosi, FPToSI);
605 INSTKEYWORD(inttoptr, IntToPtr);
606 INSTKEYWORD(ptrtoint, PtrToInt);
607 INSTKEYWORD(bitcast, BitCast);
608 INSTKEYWORD(select, Select);
609 INSTKEYWORD(va_arg, VAArg);
610 INSTKEYWORD(ret, Ret);
611 INSTKEYWORD(br, Br);
612 INSTKEYWORD(switch, Switch);
613 INSTKEYWORD(invoke, Invoke);
614 INSTKEYWORD(unwind, Unwind);
615 INSTKEYWORD(unreachable, Unreachable);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000616
Chris Lattnerdf986172009-01-02 07:01:27 +0000617 INSTKEYWORD(malloc, Malloc);
618 INSTKEYWORD(alloca, Alloca);
619 INSTKEYWORD(free, Free);
620 INSTKEYWORD(load, Load);
621 INSTKEYWORD(store, Store);
622 INSTKEYWORD(getelementptr, GetElementPtr);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000623
Chris Lattnerdf986172009-01-02 07:01:27 +0000624 INSTKEYWORD(extractelement, ExtractElement);
625 INSTKEYWORD(insertelement, InsertElement);
626 INSTKEYWORD(shufflevector, ShuffleVector);
627 INSTKEYWORD(getresult, ExtractValue);
628 INSTKEYWORD(extractvalue, ExtractValue);
629 INSTKEYWORD(insertvalue, InsertValue);
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000630#undef INSTKEYWORD
631
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000632 // Check for [us]0x[0-9A-Fa-f]+ which are Hexadecimal constant generated by
633 // the CFE to avoid forcing it to deal with 64-bit numbers.
634 if ((TokStart[0] == 'u' || TokStart[0] == 's') &&
635 TokStart[1] == '0' && TokStart[2] == 'x' && isxdigit(TokStart[3])) {
636 int len = CurPtr-TokStart-3;
637 uint32_t bits = len * 4;
638 APInt Tmp(bits, TokStart+3, len, 16);
639 uint32_t activeBits = Tmp.getActiveBits();
640 if (activeBits > 0 && activeBits < bits)
641 Tmp.trunc(activeBits);
Chris Lattnerdf986172009-01-02 07:01:27 +0000642 APSIntVal = APSInt(Tmp, TokStart[0] == 'u');
643 return lltok::APSInt;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000644 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000645
Chris Lattner4ce0df62007-11-18 18:43:24 +0000646 // If this is "cc1234", return this as just "cc".
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000647 if (TokStart[0] == 'c' && TokStart[1] == 'c') {
648 CurPtr = TokStart+2;
Chris Lattnerdf986172009-01-02 07:01:27 +0000649 return lltok::kw_cc;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000650 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000651
Chris Lattner4ce0df62007-11-18 18:43:24 +0000652 // If this starts with "call", return it as CALL. This is to support old
653 // broken .ll files. FIXME: remove this with LLVM 3.0.
654 if (CurPtr-TokStart > 4 && !memcmp(TokStart, "call", 4)) {
655 CurPtr = TokStart+4;
Chris Lattnerdf986172009-01-02 07:01:27 +0000656 UIntVal = Instruction::Call;
657 return lltok::kw_call;
Chris Lattner4ce0df62007-11-18 18:43:24 +0000658 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000659
Chris Lattnerdf986172009-01-02 07:01:27 +0000660 // Finally, if this isn't known, return an error.
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000661 CurPtr = TokStart+1;
Chris Lattnerdf986172009-01-02 07:01:27 +0000662 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000663}
664
665
666/// Lex0x: Handle productions that start with 0x, knowing that it matches and
667/// that this is not a label:
668/// HexFPConstant 0x[0-9A-Fa-f]+
669/// HexFP80Constant 0xK[0-9A-Fa-f]+
670/// HexFP128Constant 0xL[0-9A-Fa-f]+
671/// HexPPC128Constant 0xM[0-9A-Fa-f]+
Chris Lattnerdf986172009-01-02 07:01:27 +0000672lltok::Kind LLLexer::Lex0x() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000673 CurPtr = TokStart + 2;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000674
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000675 char Kind;
676 if (CurPtr[0] >= 'K' && CurPtr[0] <= 'M') {
677 Kind = *CurPtr++;
678 } else {
679 Kind = 'J';
680 }
681
682 if (!isxdigit(CurPtr[0])) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000683 // Bad token, return it as an error.
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000684 CurPtr = TokStart+1;
Chris Lattnerdf986172009-01-02 07:01:27 +0000685 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000686 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000687
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000688 while (isxdigit(CurPtr[0]))
689 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000690
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000691 if (Kind == 'J') {
692 // HexFPConstant - Floating point constant represented in IEEE format as a
693 // hexadecimal number for when exponential notation is not precise enough.
694 // Float and double only.
Chris Lattnerdf986172009-01-02 07:01:27 +0000695 APFloatVal = APFloat(BitsToDouble(HexIntToVal(TokStart+2, CurPtr)));
696 return lltok::APFloat;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000697 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000698
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000699 uint64_t Pair[2];
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000700 switch (Kind) {
701 default: assert(0 && "Unknown kind!");
702 case 'K':
703 // F80HexFPConstant - x87 long double in hexadecimal format (10 bytes)
Dale Johannesen1b25cb22009-03-23 21:16:53 +0000704 FP80HexToIntPair(TokStart+3, CurPtr, Pair);
Chris Lattnerdf986172009-01-02 07:01:27 +0000705 APFloatVal = APFloat(APInt(80, 2, Pair));
706 return lltok::APFloat;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000707 case 'L':
708 // F128HexFPConstant - IEEE 128-bit in hexadecimal format (16 bytes)
Dale Johannesen1b25cb22009-03-23 21:16:53 +0000709 HexToIntPair(TokStart+3, CurPtr, Pair);
Chris Lattnerdf986172009-01-02 07:01:27 +0000710 APFloatVal = APFloat(APInt(128, 2, Pair), true);
711 return lltok::APFloat;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000712 case 'M':
713 // PPC128HexFPConstant - PowerPC 128-bit in hexadecimal format (16 bytes)
Dale Johannesen1b25cb22009-03-23 21:16:53 +0000714 HexToIntPair(TokStart+3, CurPtr, Pair);
Chris Lattnerdf986172009-01-02 07:01:27 +0000715 APFloatVal = APFloat(APInt(128, 2, Pair));
716 return lltok::APFloat;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000717 }
718}
719
720/// LexIdentifier: Handle several related productions:
721/// Label [-a-zA-Z$._0-9]+:
722/// NInteger -[0-9]+
723/// FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)?
724/// PInteger [0-9]+
725/// HexFPConstant 0x[0-9A-Fa-f]+
726/// HexFP80Constant 0xK[0-9A-Fa-f]+
727/// HexFP128Constant 0xL[0-9A-Fa-f]+
728/// HexPPC128Constant 0xM[0-9A-Fa-f]+
Chris Lattnerdf986172009-01-02 07:01:27 +0000729lltok::Kind LLLexer::LexDigitOrNegative() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000730 // If the letter after the negative is a number, this is probably a label.
731 if (!isdigit(TokStart[0]) && !isdigit(CurPtr[0])) {
732 // Okay, this is not a number after the -, it's probably a label.
733 if (const char *End = isLabelTail(CurPtr)) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000734 StrVal.assign(TokStart, End-1);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000735 CurPtr = End;
Chris Lattnerdf986172009-01-02 07:01:27 +0000736 return lltok::LabelStr;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000737 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000738
Chris Lattnerdf986172009-01-02 07:01:27 +0000739 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000740 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000741
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000742 // At this point, it is either a label, int or fp constant.
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000743
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000744 // Skip digits, we have at least one.
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000745 for (; isdigit(CurPtr[0]); ++CurPtr)
746 /*empty*/;
747
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000748 // Check to see if this really is a label afterall, e.g. "-1:".
749 if (isLabelChar(CurPtr[0]) || CurPtr[0] == ':') {
750 if (const char *End = isLabelTail(CurPtr)) {
Chris Lattnerdf986172009-01-02 07:01:27 +0000751 StrVal.assign(TokStart, End-1);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000752 CurPtr = End;
Chris Lattnerdf986172009-01-02 07:01:27 +0000753 return lltok::LabelStr;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000754 }
755 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000756
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000757 // If the next character is a '.', then it is a fp value, otherwise its
758 // integer.
759 if (CurPtr[0] != '.') {
760 if (TokStart[0] == '0' && TokStart[1] == 'x')
761 return Lex0x();
762 unsigned Len = CurPtr-TokStart;
763 uint32_t numBits = ((Len * 64) / 19) + 2;
764 APInt Tmp(numBits, TokStart, Len, 10);
765 if (TokStart[0] == '-') {
766 uint32_t minBits = Tmp.getMinSignedBits();
767 if (minBits > 0 && minBits < numBits)
768 Tmp.trunc(minBits);
Chris Lattnerdf986172009-01-02 07:01:27 +0000769 APSIntVal = APSInt(Tmp, false);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000770 } else {
771 uint32_t activeBits = Tmp.getActiveBits();
772 if (activeBits > 0 && activeBits < numBits)
773 Tmp.trunc(activeBits);
Chris Lattnerdf986172009-01-02 07:01:27 +0000774 APSIntVal = APSInt(Tmp, true);
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000775 }
Chris Lattnerdf986172009-01-02 07:01:27 +0000776 return lltok::APSInt;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000777 }
778
779 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000780
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000781 // Skip over [0-9]*([eE][-+]?[0-9]+)?
782 while (isdigit(CurPtr[0])) ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000783
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000784 if (CurPtr[0] == 'e' || CurPtr[0] == 'E') {
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000785 if (isdigit(CurPtr[1]) ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000786 ((CurPtr[1] == '-' || CurPtr[1] == '+') && isdigit(CurPtr[2]))) {
787 CurPtr += 2;
788 while (isdigit(CurPtr[0])) ++CurPtr;
789 }
790 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000791
Chris Lattnerdf986172009-01-02 07:01:27 +0000792 APFloatVal = APFloat(atof(TokStart));
793 return lltok::APFloat;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000794}
795
796/// FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)?
Chris Lattnerdf986172009-01-02 07:01:27 +0000797lltok::Kind LLLexer::LexPositive() {
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000798 // If the letter after the negative is a number, this is probably not a
799 // label.
800 if (!isdigit(CurPtr[0]))
Chris Lattnerdf986172009-01-02 07:01:27 +0000801 return lltok::Error;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000802
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000803 // Skip digits.
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000804 for (++CurPtr; isdigit(CurPtr[0]); ++CurPtr)
805 /*empty*/;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000806
807 // At this point, we need a '.'.
808 if (CurPtr[0] != '.') {
809 CurPtr = TokStart+1;
Chris Lattnerdf986172009-01-02 07:01:27 +0000810 return lltok::Error;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000811 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000812
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000813 ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000814
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000815 // Skip over [0-9]*([eE][-+]?[0-9]+)?
816 while (isdigit(CurPtr[0])) ++CurPtr;
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000817
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000818 if (CurPtr[0] == 'e' || CurPtr[0] == 'E') {
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000819 if (isdigit(CurPtr[1]) ||
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000820 ((CurPtr[1] == '-' || CurPtr[1] == '+') && isdigit(CurPtr[2]))) {
821 CurPtr += 2;
822 while (isdigit(CurPtr[0])) ++CurPtr;
823 }
824 }
Bill Wendling2c6fd8c2007-12-16 09:16:12 +0000825
Chris Lattnerdf986172009-01-02 07:01:27 +0000826 APFloatVal = APFloat(atof(TokStart));
827 return lltok::APFloat;
Chris Lattner8e3a8e02007-11-18 08:46:26 +0000828}