Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 1 | /*===-- Lexer.l - Scanner for llvm assembly files --------------*- C++ -*--===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by the LLVM research group and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements the flex scanner for LLVM assembly languages files. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===*/ |
| 13 | |
| 14 | %option prefix="llvmAsm" |
| 15 | %option yylineno |
| 16 | %option nostdinit |
| 17 | %option never-interactive |
| 18 | %option batch |
| 19 | %option noyywrap |
| 20 | %option nodefault |
| 21 | %option 8bit |
| 22 | %option outfile="Lexer.cpp" |
| 23 | %option ecs |
| 24 | %option noreject |
| 25 | %option noyymore |
| 26 | |
| 27 | %{ |
| 28 | #include "ParserInternals.h" |
| 29 | #include "llvm/Module.h" |
Chris Lattner | 8e00832 | 2007-05-22 06:47:55 +0000 | [diff] [blame^] | 30 | #include "llvm/Support/MathExtras.h" |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 31 | #include <list> |
| 32 | #include "llvmAsmParser.h" |
| 33 | #include <cctype> |
| 34 | #include <cstdlib> |
| 35 | |
// set_scan_file - Create a flex input buffer for the stream F (passing
// YY_BUF_SIZE as the size argument) and make it the scanner's current buffer.
| 36 | void set_scan_file(FILE * F){ |
| 37 | yy_switch_to_buffer(yy_create_buffer( F, YY_BUF_SIZE ) ); |
| 38 | } |
// set_scan_string - Hand the NUL-terminated string str to flex's
// yy_scan_string so that subsequent scanning reads from it.
| 39 | void set_scan_string (const char * str) { |
| 40 | yy_scan_string (str); |
| 41 | } |
| 42 | |
// RET_TOK - Store the opcode Instruction::Enum in the llvmAsmlval member named
// by 'type', then return the parser token 'sym' from the scanner.
//
// The expansion is wrapped in do { } while (0) so that it forms exactly one
// statement; without the wrapper only the assignment would be guarded if the
// macro were ever used as the body of an unbraced if/else.
#define RET_TOK(type, Enum, sym)            \
  do {                                      \
    llvmAsmlval.type = Instruction::Enum;   \
    return sym;                             \
  } while (0)
| 47 | |
// RET_TY - Store the type CTYPE in llvmAsmlval.PrimType, then return the parser
// token SYM from the scanner.  Used by the rules that recognize type names.
//
// As with RET_TOK, the do { } while (0) wrapper makes the expansion a single
// statement so it cannot be split by an unbraced if/else.
#define RET_TY(CTYPE, SYM)            \
  do {                                \
    llvmAsmlval.PrimType = (CTYPE);   \
    return SYM;                       \
  } while (0)
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 52 | |
| 53 | namespace llvm { |
| 54 | |
| 55 | // TODO: All of the static identifiers are figured out by the lexer, |
| 56 | // these should be hashed to reduce the lexer size |
| 57 | |
| 58 | |
| 59 | // atoull - Convert an ascii string of decimal digits into the unsigned long |
| 60 | // long representation... this does not have to do input error checking, |
| 61 | // because we know that the input will be matched by a suitable regex... |
| 62 | // |
| 63 | static uint64_t atoull(const char *Buffer) { |
| 64 | uint64_t Result = 0; |
| 65 | for (; *Buffer; Buffer++) { |
| 66 | uint64_t OldRes = Result; |
| 67 | Result *= 10; |
| 68 | Result += *Buffer-'0'; |
| 69 | if (Result < OldRes) // Uh, oh, overflow detected!!! |
Reid Spencer | 61c83e0 | 2006-08-18 08:43:06 +0000 | [diff] [blame] | 70 | GenerateError("constant bigger than 64 bits detected!"); |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 71 | } |
| 72 | return Result; |
| 73 | } |
| 74 | |
| 75 | static uint64_t HexIntToVal(const char *Buffer) { |
| 76 | uint64_t Result = 0; |
| 77 | for (; *Buffer; ++Buffer) { |
| 78 | uint64_t OldRes = Result; |
| 79 | Result *= 16; |
| 80 | char C = *Buffer; |
| 81 | if (C >= '0' && C <= '9') |
| 82 | Result += C-'0'; |
| 83 | else if (C >= 'A' && C <= 'F') |
| 84 | Result += C-'A'+10; |
| 85 | else if (C >= 'a' && C <= 'f') |
| 86 | Result += C-'a'+10; |
| 87 | |
| 88 | if (Result < OldRes) // Uh, oh, overflow detected!!! |
Reid Spencer | 61c83e0 | 2006-08-18 08:43:06 +0000 | [diff] [blame] | 89 | GenerateError("constant bigger than 64 bits detected!"); |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 90 | } |
| 91 | return Result; |
| 92 | } |
| 93 | |
| 94 | |
| 95 | // HexToFP - Convert the ascii string in hexidecimal format to the floating |
| 96 | // point representation of it. |
| 97 | // |
| 98 | static double HexToFP(const char *Buffer) { |
Chris Lattner | 8e00832 | 2007-05-22 06:47:55 +0000 | [diff] [blame^] | 99 | return BitsToDouble(HexIntToVal(Buffer)); // Cast Hex constant to double |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 100 | } |
| 101 | |
| 102 | |
| 103 | // UnEscapeLexed - Run through the specified buffer and change \xx codes to the |
| 104 | // appropriate character. If AllowNull is set to false, a \00 value will cause |
| 105 | // an exception to be thrown. |
| 106 | // |
| 107 | // If AllowNull is set to true, the return value of the function points to the |
| 108 | // last character of the string in memory. |
| 109 | // |
| 110 | char *UnEscapeLexed(char *Buffer, bool AllowNull) { |
| 111 | char *BOut = Buffer; |
| 112 | for (char *BIn = Buffer; *BIn; ) { |
| 113 | if (BIn[0] == '\\' && isxdigit(BIn[1]) && isxdigit(BIn[2])) { |
| 114 | char Tmp = BIn[3]; BIn[3] = 0; // Terminate string |
| 115 | *BOut = (char)strtol(BIn+1, 0, 16); // Convert to number |
| 116 | if (!AllowNull && !*BOut) |
Reid Spencer | 61c83e0 | 2006-08-18 08:43:06 +0000 | [diff] [blame] | 117 | GenerateError("String literal cannot accept \\00 escape!"); |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 118 | |
| 119 | BIn[3] = Tmp; // Restore character |
| 120 | BIn += 3; // Skip over handled chars |
| 121 | ++BOut; |
| 122 | } else { |
| 123 | *BOut++ = *BIn++; |
| 124 | } |
| 125 | } |
| 126 | |
| 127 | return BOut; |
| 128 | } |
| 129 | |
| 130 | } // End llvm namespace |
| 131 | |
| 132 | using namespace llvm; |
| 133 | |
| 134 | #define YY_NEVER_INTERACTIVE 1 |
| 135 | %} |
| 136 | |
| 137 | |
| 138 | |
| 139 | /* Comments start with a ; and go till end of line */ |
| 140 | Comment ;.* |
| 141 | |
Reid Spencer | 41dff5e | 2007-01-26 08:05:27 +0000 | [diff] [blame] | 142 | /* Local Values and Type identifiers start with a % sign */ |
| 143 | LocalVarName %[-a-zA-Z$._][-a-zA-Z$._0-9]* |
| 144 | |
| 145 | /* Global Value identifiers start with an @ sign */ |
| 146 | GlobalVarName @[-a-zA-Z$._][-a-zA-Z$._0-9]* |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 147 | |
| 148 | /* Label identifiers end with a colon */ |
| 149 | Label [-a-zA-Z$._0-9]+: |
| 150 | QuoteLabel \"[^\"]+\": |
| 151 | |
| 152 | /* String constants may contain any character except a double quote; backslashes are allowed */ |
| 153 | StringConstant \"[^\"]*\" |
Reid Spencer | 41dff5e | 2007-01-26 08:05:27 +0000 | [diff] [blame] | 154 | AtStringConstant @\"[^\"]*\" |
Reid Spencer | ed951ea | 2007-05-19 07:22:10 +0000 | [diff] [blame] | 155 | PctStringConstant %\"[^\"]*\" |
Reid Spencer | 41dff5e | 2007-01-26 08:05:27 +0000 | [diff] [blame] | 156 | |
| 157 | /* LocalVarID/GlobalVarID: match an unnamed local (%N) or global (@N) slot ID. */ |
| 158 | LocalVarID %[0-9]+ |
| 159 | GlobalVarID @[0-9]+ |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 160 | |
Reid Spencer | 41dff5e | 2007-01-26 08:05:27 +0000 | [diff] [blame] | 161 | /* Integer types are specified with i and a bitwidth */ |
Reid Spencer | 4db2063 | 2007-01-12 07:28:27 +0000 | [diff] [blame] | 162 | IntegerType i[0-9]+ |
Reid Spencer | a54b7cb | 2007-01-12 07:05:14 +0000 | [diff] [blame] | 163 | |
Reid Spencer | 41dff5e | 2007-01-26 08:05:27 +0000 | [diff] [blame] | 164 | /* PInteger/NInteger: match unsigned and minus-prefixed literal integer values. */ |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 165 | PInteger [0-9]+ |
| 166 | NInteger -[0-9]+ |
| 167 | |
| 168 | /* FPConstant - A Floating point constant. |
| 169 | */ |
| 170 | FPConstant [-+]?[0-9]+[.][0-9]*([eE][-+]?[0-9]+)? |
| 171 | |
| 172 | /* HexFPConstant - Floating point constant represented in IEEE format as a |
| 173 | * hexadecimal number for when exponential notation is not precise enough. |
| 174 | */ |
| 175 | HexFPConstant 0x[0-9A-Fa-f]+ |
| 176 | |
| 177 | /* HexIntConstant - Hexadecimal constant generated by the CFE to avoid forcing |
| 178 | * it to deal with 64 bit numbers. |
| 179 | */ |
| 180 | HexIntConstant [us]0x[0-9A-Fa-f]+ |
Reid Spencer | 38c91a9 | 2007-02-28 02:24:54 +0000 | [diff] [blame] | 181 | |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 182 | %% |
| 183 | |
| 184 | {Comment} { /* Comment text is matched and discarded; nothing is returned */ } |
| 185 | |
  /* Reserved words.  Each is matched literally and returned to the parser as
   * its own token code; none of these actions stores a value in llvmAsmlval.
   */
| 186 | begin { return BEGINTOK; } |
| 187 | end { return ENDTOK; } |
| 188 | true { return TRUETOK; } |
| 189 | false { return FALSETOK; } |
| 190 | declare { return DECLARE; } |
Reid Spencer | 6fd36ab | 2006-12-29 20:35:03 +0000 | [diff] [blame] | 191 | define { return DEFINE; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 192 | global { return GLOBAL; } |
| 193 | constant { return CONSTANT; } |
| 194 | internal { return INTERNAL; } |
| 195 | linkonce { return LINKONCE; } |
| 196 | weak { return WEAK; } |
| 197 | appending { return APPENDING; } |
Anton Korobeynikov | b74ed07 | 2006-09-14 18:23:27 +0000 | [diff] [blame] | 198 | dllimport { return DLLIMPORT; } |
| 199 | dllexport { return DLLEXPORT; } |
Anton Korobeynikov | 7f70559 | 2007-01-12 19:20:47 +0000 | [diff] [blame] | 200 | hidden { return HIDDEN; } |
Anton Korobeynikov | 6f9896f | 2007-04-29 18:35:00 +0000 | [diff] [blame] | 201 | protected { return PROTECTED; } |
Anton Korobeynikov | b74ed07 | 2006-09-14 18:23:27 +0000 | [diff] [blame] | 202 | extern_weak { return EXTERN_WEAK; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 203 | external { return EXTERNAL; } |
Lauro Ramos Venancio | c763552 | 2007-04-12 18:32:50 +0000 | [diff] [blame] | 204 | thread_local { return THREAD_LOCAL; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 205 | zeroinitializer { return ZEROINITIALIZER; } |
| 206 | \.\.\. { return DOTDOTDOT; } |
| 207 | undef { return UNDEF; } |
| 208 | null { return NULL_TOK; } |
| 209 | to { return TO; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 210 | tail { return TAIL; } |
| 211 | target { return TARGET; } |
| 212 | triple { return TRIPLE; } |
| 213 | deplibs { return DEPLIBS; } |
Chris Lattner | 1ae022f | 2006-10-22 06:08:13 +0000 | [diff] [blame] | 214 | datalayout { return DATALAYOUT; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 215 | volatile { return VOLATILE; } |
| 216 | align { return ALIGN; } |
| 217 | section { return SECTION; } |
Anton Korobeynikov | 77d0f97 | 2007-04-25 14:29:12 +0000 | [diff] [blame] | 218 | alias { return ALIAS; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 219 | module { return MODULE; } |
| 220 | asm { return ASM_TOK; } |
| 221 | sideeffect { return SIDEEFFECT; } |
| 222 | |
  /* Keywords whose token names end in _TOK (presumably the calling-convention
   * names -- confirm against the grammar).  Handled like the words above.
   */
| 223 | cc { return CC_TOK; } |
| 224 | ccc { return CCC_TOK; } |
| 225 | fastcc { return FASTCC_TOK; } |
| 226 | coldcc { return COLDCC_TOK; } |
Anton Korobeynikov | bcb9770 | 2006-09-17 20:25:45 +0000 | [diff] [blame] | 227 | x86_stdcallcc { return X86_STDCALLCC_TOK; } |
| 228 | x86_fastcallcc { return X86_FASTCALLCC_TOK; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 229 | |
Reid Spencer | 832254e | 2007-02-02 02:16:23 +0000 | [diff] [blame] | 230 | inreg { return INREG; } |
| 231 | sret { return SRET; } |
Reid Spencer | 67d8ed9 | 2007-03-22 02:14:08 +0000 | [diff] [blame] | 232 | nounwind { return NOUNWIND; } |
| 233 | noreturn { return NORETURN; } |
Reid Spencer | 832254e | 2007-02-02 02:16:23 +0000 | [diff] [blame] | 234 | |
  /* Built-in type names.  RET_TY stores the given Type in
   * llvmAsmlval.PrimType before returning the token; 'type' and 'opaque'
   * return bare tokens.
   */
Reid Spencer | a132e04 | 2006-12-03 05:46:11 +0000 | [diff] [blame] | 235 | void { RET_TY(Type::VoidTy, VOID); } |
Reid Spencer | a132e04 | 2006-12-03 05:46:11 +0000 | [diff] [blame] | 236 | float { RET_TY(Type::FloatTy, FLOAT); } |
| 237 | double { RET_TY(Type::DoubleTy,DOUBLE);} |
| 238 | label { RET_TY(Type::LabelTy, LABEL); } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 239 | type { return TYPE; } |
| 240 | opaque { return OPAQUE; } |
{IntegerType}   {
                  // The lexeme is 'i' followed by decimal digits; the digits
                  // give the requested bit width.
                  uint64_t Width = atoull(yytext + 1);
                  bool WidthInRange = Width >= IntegerType::MIN_INT_BITS &&
                                      Width <= IntegerType::MAX_INT_BITS;
                  if (!WidthInRange)
                    GenerateError("Bitwidth for integer type out of range!");
                  // Hand the integer type of that width to the parser as the
                  // token's PrimType value.
                  const Type *IntTy = IntegerType::get(Width);
                  RET_TY(IntTy, INTTYPE);
                }
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 248 | |
  /* Instruction mnemonics.  RET_TOK(field, Enum, TOKEN) stores
   * Instruction::Enum in llvmAsmlval.<field> and then returns TOKEN.
   */
| 249 | add { RET_TOK(BinaryOpVal, Add, ADD); } |
| 250 | sub { RET_TOK(BinaryOpVal, Sub, SUB); } |
| 251 | mul { RET_TOK(BinaryOpVal, Mul, MUL); } |
Reid Spencer | 3ed469c | 2006-11-02 20:25:50 +0000 | [diff] [blame] | 252 | udiv { RET_TOK(BinaryOpVal, UDiv, UDIV); } |
| 253 | sdiv { RET_TOK(BinaryOpVal, SDiv, SDIV); } |
| 254 | fdiv { RET_TOK(BinaryOpVal, FDiv, FDIV); } |
Reid Spencer | 3ed469c | 2006-11-02 20:25:50 +0000 | [diff] [blame] | 255 | urem { RET_TOK(BinaryOpVal, URem, UREM); } |
| 256 | srem { RET_TOK(BinaryOpVal, SRem, SREM); } |
| 257 | frem { RET_TOK(BinaryOpVal, FRem, FREM); } |
Reid Spencer | 832254e | 2007-02-02 02:16:23 +0000 | [diff] [blame] | 258 | shl { RET_TOK(BinaryOpVal, Shl, SHL); } |
| 259 | lshr { RET_TOK(BinaryOpVal, LShr, LSHR); } |
| 260 | ashr { RET_TOK(BinaryOpVal, AShr, ASHR); } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 261 | and { RET_TOK(BinaryOpVal, And, AND); } |
| 262 | or { RET_TOK(BinaryOpVal, Or , OR ); } |
| 263 | xor { RET_TOK(BinaryOpVal, Xor, XOR); } |
Reid Spencer | a132e04 | 2006-12-03 05:46:11 +0000 | [diff] [blame] | 264 | icmp { RET_TOK(OtherOpVal, ICmp, ICMP); } |
| 265 | fcmp { RET_TOK(OtherOpVal, FCmp, FCMP); } |
Reid Spencer | 832254e | 2007-02-02 02:16:23 +0000 | [diff] [blame] | 266 | |
  /* Comparison predicate words.  These return a bare token; no value is
   * stored in llvmAsmlval.
   */
Reid Spencer | 6e18b7d | 2006-12-03 06:59:29 +0000 | [diff] [blame] | 267 | eq { return EQ; } |
| 268 | ne { return NE; } |
| 269 | slt { return SLT; } |
| 270 | sgt { return SGT; } |
| 271 | sle { return SLE; } |
| 272 | sge { return SGE; } |
| 273 | ult { return ULT; } |
| 274 | ugt { return UGT; } |
| 275 | ule { return ULE; } |
| 276 | uge { return UGE; } |
| 277 | oeq { return OEQ; } |
| 278 | one { return ONE; } |
| 279 | olt { return OLT; } |
| 280 | ogt { return OGT; } |
| 281 | ole { return OLE; } |
| 282 | oge { return OGE; } |
| 283 | ord { return ORD; } |
| 284 | uno { return UNO; } |
| 285 | ueq { return UEQ; } |
| 286 | une { return UNE; } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 287 | |
  /* Remaining instruction mnemonics, grouped by the llvmAsmlval field that
   * RET_TOK fills in: OtherOpVal, CastOpVal, TermOpVal and MemOpVal.
   */
| 288 | phi { RET_TOK(OtherOpVal, PHI, PHI_TOK); } |
| 289 | call { RET_TOK(OtherOpVal, Call, CALL); } |
Reid Spencer | 3da59db | 2006-11-27 01:05:10 +0000 | [diff] [blame] | 290 | trunc { RET_TOK(CastOpVal, Trunc, TRUNC); } |
| 291 | zext { RET_TOK(CastOpVal, ZExt, ZEXT); } |
| 292 | sext { RET_TOK(CastOpVal, SExt, SEXT); } |
| 293 | fptrunc { RET_TOK(CastOpVal, FPTrunc, FPTRUNC); } |
| 294 | fpext { RET_TOK(CastOpVal, FPExt, FPEXT); } |
| 295 | uitofp { RET_TOK(CastOpVal, UIToFP, UITOFP); } |
| 296 | sitofp { RET_TOK(CastOpVal, SIToFP, SITOFP); } |
| 297 | fptoui { RET_TOK(CastOpVal, FPToUI, FPTOUI); } |
| 298 | fptosi { RET_TOK(CastOpVal, FPToSI, FPTOSI); } |
| 299 | inttoptr { RET_TOK(CastOpVal, IntToPtr, INTTOPTR); } |
| 300 | ptrtoint { RET_TOK(CastOpVal, PtrToInt, PTRTOINT); } |
| 301 | bitcast { RET_TOK(CastOpVal, BitCast, BITCAST); } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 302 | select { RET_TOK(OtherOpVal, Select, SELECT); } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 303 | va_arg { RET_TOK(OtherOpVal, VAArg , VAARG); } |
| 304 | ret { RET_TOK(TermOpVal, Ret, RET); } |
| 305 | br { RET_TOK(TermOpVal, Br, BR); } |
| 306 | switch { RET_TOK(TermOpVal, Switch, SWITCH); } |
| 307 | invoke { RET_TOK(TermOpVal, Invoke, INVOKE); } |
| 308 | unwind { RET_TOK(TermOpVal, Unwind, UNWIND); } |
| 309 | unreachable { RET_TOK(TermOpVal, Unreachable, UNREACHABLE); } |
| 310 | |
| 311 | malloc { RET_TOK(MemOpVal, Malloc, MALLOC); } |
| 312 | alloca { RET_TOK(MemOpVal, Alloca, ALLOCA); } |
| 313 | free { RET_TOK(MemOpVal, Free, FREE); } |
| 314 | load { RET_TOK(MemOpVal, Load, LOAD); } |
| 315 | store { RET_TOK(MemOpVal, Store, STORE); } |
| 316 | getelementptr { RET_TOK(MemOpVal, GetElementPtr, GETELEMENTPTR); } |
| 317 | |
| 318 | extractelement { RET_TOK(OtherOpVal, ExtractElement, EXTRACTELEMENT); } |
| 319 | insertelement { RET_TOK(OtherOpVal, InsertElement, INSERTELEMENT); } |
Chris Lattner | d5efe84 | 2006-04-08 01:18:56 +0000 | [diff] [blame] | 320 | shufflevector { RET_TOK(OtherOpVal, ShuffleVector, SHUFFLEVECTOR); } |
Chris Lattner | 32eecb0 | 2006-02-14 05:14:46 +0000 | [diff] [blame] | 321 | |
| 322 | |
{LocalVarName}  {
                  // yytext[0] is the '%' sigil; the name starts right after.
                  char *NameStart = yytext + 1;
                  UnEscapeLexed(NameStart);
                  // The parser receives a heap copy of the name.
                  llvmAsmlval.StrVal = strdup(NameStart);
                  return LOCALVAR;
                }
{GlobalVarName} {
                  // yytext[0] is the '@' sigil; the name starts right after.
                  char *NameStart = yytext + 1;
                  UnEscapeLexed(NameStart);
                  // The parser receives a heap copy of the name.
                  llvmAsmlval.StrVal = strdup(NameStart);
                  return GLOBALVAR;
                }
{Label}         {
                  // The lexeme ends in ':'; cut it off so only the label
                  // name remains in yytext.
                  size_t ColonPos = strlen(yytext) - 1;
                  yytext[ColonPos] = 0;
                  UnEscapeLexed(yytext);
                  // The parser receives a heap copy of the name.
                  llvmAsmlval.StrVal = strdup(yytext);
                  return LABELSTR;
                }
{QuoteLabel}    {
                  // The lexeme is "name": -- cut off the closing quote and
                  // the colon, and skip the opening quote below.
                  yytext[strlen(yytext)-2] = 0;   // nuke colon, end quote
                  // A quoted label may contain \xx escapes.  UnEscapeLexed
                  // rewrites the text in place and returns a pointer just
                  // past the last character it wrote; every escape makes the
                  // text shorter, so terminate it there.  Otherwise strdup
                  // would also copy the leftover tail of the original text.
                  char *NameEnd = UnEscapeLexed(yytext+1);
                  *NameEnd = 0;
                  llvmAsmlval.StrVal = strdup(yytext+1);
                  return LABELSTR;
                }
| 345 | |
{StringConstant} {
                   // The text is deliberately NOT unescaped here: it may
                   // contain a \00 escape, which C string handling could not
                   // represent.  A constant such as
                   // [sbyte] c"Hello World\00" is valid, for example.
                   size_t Len = strlen(yytext);
                   yytext[Len - 1] = 0;                     // drop closing quote
                   llvmAsmlval.StrVal = strdup(yytext + 1); // skip opening quote
                   return STRINGCONSTANT;
                 }
{AtStringConstant} {
                   // Lexeme is @"text": keep only what lies between the
                   // quotes, still escaped.
                   size_t Len = strlen(yytext);
                   yytext[Len - 1] = 0;                     // drop closing quote
                   llvmAsmlval.StrVal = strdup(yytext + 2); // skip '@' and quote
                   return ATSTRINGCONSTANT;
                 }
| 360 | |
{PctStringConstant} {
                   // Lexeme is %"text": keep only what lies between the
                   // quotes, still escaped.
                   size_t Len = strlen(yytext);
                   yytext[Len - 1] = 0;                     // drop closing quote
                   llvmAsmlval.StrVal = strdup(yytext + 2); // skip '%' and quote
                   return PCTSTRINGCONSTANT;
                 }
{PInteger}      {
                  int NumDigits = strlen(yytext);
                  // Size the temporary at 64 bits per 19 decimal digits,
                  // plus one bit.
                  uint32_t MaxBits = ((NumDigits * 64) / 19) + 1;
                  APInt Value(MaxBits, yytext, NumDigits, 10);
                  // Shrink to the bits actually in use, unless that is zero
                  // or already the full width.
                  uint32_t UsedBits = Value.getActiveBits();
                  if (UsedBits > 0 && UsedBits < MaxBits)
                    Value.trunc(UsedBits);
                  // Values of at most 64 bits travel as a plain uint64_t;
                  // wider ones as a heap-allocated APInt.
                  if (Value.getBitWidth() <= 64) {
                    llvmAsmlval.UInt64Val = Value.getZExtValue();
                    return EUINT64VAL;
                  }
                  llvmAsmlval.APIntVal = new APInt(Value);
                  return EUAPINTVAL;
                }
{NInteger}      {
                  int NumChars = strlen(yytext);   // includes the leading '-'
                  // Size the temporary at 64 bits per 19 decimal digits,
                  // plus two bits.
                  uint32_t MaxBits = (((NumChars - 1) * 64) / 19) + 2;
                  APInt Value(MaxBits, yytext, NumChars, 10);
                  // Shrink to the minimum signed width, unless that is zero
                  // or already the full width.
                  uint32_t NeededBits = Value.getMinSignedBits();
                  if (NeededBits > 0 && NeededBits < MaxBits)
                    Value.trunc(NeededBits);
                  // Values of at most 64 bits travel as a plain int64_t;
                  // wider ones as a heap-allocated APInt.
                  if (Value.getBitWidth() <= 64) {
                    llvmAsmlval.SInt64Val = Value.getSExtValue();
                    return ESINT64VAL;
                  }
                  llvmAsmlval.APIntVal = new APInt(Value);
                  return ESAPINTVAL;
                }
| 394 | |
{HexIntConstant} {
                   // The lexeme is 'u' or 's', then "0x", then the hex
                   // digits, so the digits start at yytext+3.  Their count is
                   // the length of that tail; subtracting 3 again would give
                   // a wrong (for short constants, negative) digit count.
                   int len = strlen(yytext+3);
                   uint32_t bits = len * 4;        // four bits per hex digit
                   APInt Tmp(bits, yytext+3, len, 16);
                   // Shrink to the bits actually in use, unless that is zero
                   // or already the full width.
                   uint32_t activeBits = Tmp.getActiveBits();
                   if (activeBits > 0 && activeBits < bits)
                     Tmp.trunc(activeBits);
                   // Wider than 64 bits: pass a heap-allocated APInt.
                   // Otherwise pass a plain 64-bit value.  The leading letter
                   // selects the signed or unsigned token in both cases.
                   if (Tmp.getBitWidth() > 64) {
                     llvmAsmlval.APIntVal = new APInt(Tmp);
                     return yytext[0] == 's' ? ESAPINTVAL : EUAPINTVAL;
                   } else if (yytext[0] == 's') {
                     llvmAsmlval.SInt64Val = Tmp.getSExtValue();
                     return ESINT64VAL;
                   } else {
                     llvmAsmlval.UInt64Val = Tmp.getZExtValue();
                     return EUINT64VAL;
                   }
                 }
| 412 | |
{LocalVarID}    {
                  // Digits follow the '%' sigil.
                  uint64_t SlotNum = atoull(yytext + 1);
                  // The parser takes the slot number as an unsigned; report
                  // an error if narrowing would change the value.
                  unsigned Narrowed = (unsigned)SlotNum;
                  if (Narrowed != SlotNum)
                    GenerateError("Invalid value number (too large)!");
                  llvmAsmlval.UIntVal = Narrowed;
                  return LOCALVAL_ID;
                }
{GlobalVarID}   {
                  // Digits follow the '@' sigil.
                  uint64_t SlotNum = atoull(yytext + 1);
                  // The parser takes the slot number as an unsigned; report
                  // an error if narrowing would change the value.
                  unsigned Narrowed = (unsigned)SlotNum;
                  if (Narrowed != SlotNum)
                    GenerateError("Invalid value number (too large)!");
                  llvmAsmlval.UIntVal = Narrowed;
                  return GLOBALVAL_ID;
                }
| 427 | |
  /* Floating point literals.  Decimal text is converted with atof.  A hex
   * literal is passed whole, including its leading "0x", to HexToFP.  Both
   * store the result in llvmAsmlval.FPVal and return FPVAL.
   */
| 428 | {FPConstant} { llvmAsmlval.FPVal = atof(yytext); return FPVAL; } |
| 429 | {HexFPConstant} { llvmAsmlval.FPVal = HexToFP(yytext); return FPVAL; } |
| 430 | |
| 431 | <<EOF>> { |
| 432 | /* At end of input, delete flex's current buffer so its memory is |
| 433 | * released once we are done reading, then return EOF to the caller. |
| 434 | */ |
| 435 | yy_delete_buffer(YY_CURRENT_BUFFER); |
| 436 | return EOF; |
| 437 | } |
| 438 | |
| 439 | [ \r\t\n] { /* Whitespace is matched and discarded; nothing is returned */ } |
  /* Any other single character is returned as its own character code. */
| 440 | . { return yytext[0]; } |
| 441 | |
| 442 | %% |