| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 1 | //===- MILexer.h - Lexer for machine instructions -------------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file declares the function that lexes the machine instruction source |
| 11 | // string. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #ifndef LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H |
| 16 | #define LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H |
| 17 | |
| Alex Lorenz | 240fc1e | 2015-06-23 23:42:28 +0000 | [diff] [blame] | 18 | #include "llvm/ADT/APSInt.h" |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 19 | #include "llvm/ADT/StringRef.h" |
| 20 | #include "llvm/ADT/STLExtras.h" |
| 21 | #include <functional> |
| 22 | |
| 23 | namespace llvm { |
| 24 | |
| 25 | class Twine; |
| 26 | |
| 27 | /// A token produced by the machine instruction lexer. |
| 28 | struct MIToken { |
| 29 | enum TokenKind { |
| 30 | // Markers |
| 31 | Eof, |
| 32 | Error, |
| 33 | |
| Alex Lorenz | f3db51de | 2015-06-23 16:35:26 +0000 | [diff] [blame] | 34 | // Tokens with no info. |
| 35 | comma, |
| 36 | equal, |
| Alex Lorenz | 12b554e | 2015-06-24 17:34:58 +0000 | [diff] [blame] | 37 | underscore, |
| Alex Lorenz | 2eacca8 | 2015-07-13 23:24:34 +0000 | [diff] [blame] | 38 | colon, |
| Alex Lorenz | f3db51de | 2015-06-23 16:35:26 +0000 | [diff] [blame] | 39 | |
| Alex Lorenz | cb268d4 | 2015-07-06 23:07:26 +0000 | [diff] [blame] | 40 | // Keywords |
| 41 | kw_implicit, |
| 42 | kw_implicit_define, |
| Alex Lorenz | cbbfd0b | 2015-07-07 20:34:53 +0000 | [diff] [blame] | 43 | kw_dead, |
| Alex Lorenz | 495ad87 | 2015-07-08 21:23:34 +0000 | [diff] [blame] | 44 | kw_killed, |
| Alex Lorenz | 4d026b89 | 2015-07-08 23:58:31 +0000 | [diff] [blame] | 45 | kw_undef, |
| Alex Lorenz | e5a4466 | 2015-07-17 00:24:15 +0000 | [diff] [blame] | 46 | kw_frame_setup, |
| Alex Lorenz | f4baeb5 | 2015-07-21 22:28:27 +0000 | [diff] [blame^] | 47 | kw_cfi_def_cfa_offset, |
| Alex Lorenz | cb268d4 | 2015-07-06 23:07:26 +0000 | [diff] [blame] | 48 | |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 49 | // Identifier tokens |
| Alex Lorenz | f3db51de | 2015-06-23 16:35:26 +0000 | [diff] [blame] | 50 | Identifier, |
| Alex Lorenz | 240fc1e | 2015-06-23 23:42:28 +0000 | [diff] [blame] | 51 | NamedRegister, |
| Alex Lorenz | 33f0aef | 2015-06-26 16:46:11 +0000 | [diff] [blame] | 52 | MachineBasicBlock, |
| Alex Lorenz | 7feaf7c | 2015-07-16 23:37:45 +0000 | [diff] [blame] | 53 | StackObject, |
| 54 | FixedStackObject, |
| Alex Lorenz | 5d6108e | 2015-06-26 22:56:48 +0000 | [diff] [blame] | 55 | NamedGlobalValue, |
| Alex Lorenz | b29554d | 2015-07-20 20:31:01 +0000 | [diff] [blame] | 56 | QuotedNamedGlobalValue, |
| Alex Lorenz | 5d6108e | 2015-06-26 22:56:48 +0000 | [diff] [blame] | 57 | GlobalValue, |
| Alex Lorenz | 6ede374 | 2015-07-21 16:59:53 +0000 | [diff] [blame] | 58 | ExternalSymbol, |
| 59 | QuotedExternalSymbol, |
| Alex Lorenz | 240fc1e | 2015-06-23 23:42:28 +0000 | [diff] [blame] | 60 | |
| 61 | // Other tokens |
| Alex Lorenz | 5346451 | 2015-07-10 22:51:20 +0000 | [diff] [blame] | 62 | IntegerLiteral, |
| Alex Lorenz | 31d7068 | 2015-07-15 23:38:35 +0000 | [diff] [blame] | 63 | VirtualRegister, |
| Alex Lorenz | ab98049 | 2015-07-20 20:51:18 +0000 | [diff] [blame] | 64 | ConstantPoolItem, |
| Alex Lorenz | 31d7068 | 2015-07-15 23:38:35 +0000 | [diff] [blame] | 65 | JumpTableIndex |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 66 | }; |
| 67 | |
| 68 | private: |
| 69 | TokenKind Kind; |
| Alex Lorenz | 33f0aef | 2015-06-26 16:46:11 +0000 | [diff] [blame] | 70 | unsigned StringOffset; |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 71 | StringRef Range; |
| Alex Lorenz | 240fc1e | 2015-06-23 23:42:28 +0000 | [diff] [blame] | 72 | APSInt IntVal; |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 73 | |
| 74 | public: |
| Alex Lorenz | 33f0aef | 2015-06-26 16:46:11 +0000 | [diff] [blame] | 75 | MIToken(TokenKind Kind, StringRef Range, unsigned StringOffset = 0) |
| 76 | : Kind(Kind), StringOffset(StringOffset), Range(Range) {} |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 77 | |
| Alex Lorenz | 33f0aef | 2015-06-26 16:46:11 +0000 | [diff] [blame] | 78 | MIToken(TokenKind Kind, StringRef Range, const APSInt &IntVal, |
| 79 | unsigned StringOffset = 0) |
| 80 | : Kind(Kind), StringOffset(StringOffset), Range(Range), IntVal(IntVal) {} |
| Alex Lorenz | 240fc1e | 2015-06-23 23:42:28 +0000 | [diff] [blame] | 81 | |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 82 | TokenKind kind() const { return Kind; } |
| 83 | |
| 84 | bool isError() const { return Kind == Error; } |
| 85 | |
| Alex Lorenz | 12b554e | 2015-06-24 17:34:58 +0000 | [diff] [blame] | 86 | bool isRegister() const { |
| Alex Lorenz | 5346451 | 2015-07-10 22:51:20 +0000 | [diff] [blame] | 87 | return Kind == NamedRegister || Kind == underscore || |
| 88 | Kind == VirtualRegister; |
| Alex Lorenz | 12b554e | 2015-06-24 17:34:58 +0000 | [diff] [blame] | 89 | } |
| Alex Lorenz | f3db51de | 2015-06-23 16:35:26 +0000 | [diff] [blame] | 90 | |
| Alex Lorenz | cb268d4 | 2015-07-06 23:07:26 +0000 | [diff] [blame] | 91 | bool isRegisterFlag() const { |
| Alex Lorenz | 495ad87 | 2015-07-08 21:23:34 +0000 | [diff] [blame] | 92 | return Kind == kw_implicit || Kind == kw_implicit_define || |
| Alex Lorenz | 4d026b89 | 2015-07-08 23:58:31 +0000 | [diff] [blame] | 93 | Kind == kw_dead || Kind == kw_killed || Kind == kw_undef; |
| Alex Lorenz | cb268d4 | 2015-07-06 23:07:26 +0000 | [diff] [blame] | 94 | } |
| 95 | |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 96 | bool is(TokenKind K) const { return Kind == K; } |
| 97 | |
| 98 | bool isNot(TokenKind K) const { return Kind != K; } |
| 99 | |
| 100 | StringRef::iterator location() const { return Range.begin(); } |
| 101 | |
| Alex Lorenz | 6ede374 | 2015-07-21 16:59:53 +0000 | [diff] [blame] | 102 | bool isStringValueQuoted() const { |
| 103 | return Kind == QuotedNamedGlobalValue || Kind == QuotedExternalSymbol; |
| 104 | } |
| Alex Lorenz | b29554d | 2015-07-20 20:31:01 +0000 | [diff] [blame] | 105 | |
| 106 | /// Return the token's raw string value. |
| 107 | /// |
| 108 | /// If the string value is quoted, this method returns that quoted string as |
| 109 | /// it is, without unescaping the string value. |
| 110 | StringRef rawStringValue() const { return Range.drop_front(StringOffset); } |
| 111 | |
| 112 | /// Return token's string value. |
| 113 | /// |
| 114 | /// Expects the string value to be unquoted. |
| 115 | StringRef stringValue() const { |
| 116 | assert(!isStringValueQuoted() && "String value is quoted"); |
| 117 | return Range.drop_front(StringOffset); |
| 118 | } |
| 119 | |
| 120 | /// Unescapes the token's string value. |
| 121 | /// |
| 122 | /// Expects the string value to be quoted. |
| 123 | void unescapeQuotedStringValue(std::string &Str) const; |
| Alex Lorenz | 240fc1e | 2015-06-23 23:42:28 +0000 | [diff] [blame] | 124 | |
| 125 | const APSInt &integerValue() const { return IntVal; } |
| Alex Lorenz | 33f0aef | 2015-06-26 16:46:11 +0000 | [diff] [blame] | 126 | |
| 127 | bool hasIntegerValue() const { |
| Alex Lorenz | 5d6108e | 2015-06-26 22:56:48 +0000 | [diff] [blame] | 128 | return Kind == IntegerLiteral || Kind == MachineBasicBlock || |
| Alex Lorenz | 7feaf7c | 2015-07-16 23:37:45 +0000 | [diff] [blame] | 129 | Kind == StackObject || Kind == FixedStackObject || |
| Alex Lorenz | 31d7068 | 2015-07-15 23:38:35 +0000 | [diff] [blame] | 130 | Kind == GlobalValue || Kind == VirtualRegister || |
| Alex Lorenz | ab98049 | 2015-07-20 20:51:18 +0000 | [diff] [blame] | 131 | Kind == ConstantPoolItem || Kind == JumpTableIndex; |
| Alex Lorenz | 33f0aef | 2015-06-26 16:46:11 +0000 | [diff] [blame] | 132 | } |
| Alex Lorenz | 91370c5 | 2015-06-22 20:37:46 +0000 | [diff] [blame] | 133 | }; |
| 134 | |
| 135 | /// Consume a single machine instruction token in the given source and return |
| 136 | /// the remaining source string. |
| 137 | StringRef lexMIToken( |
| 138 | StringRef Source, MIToken &Token, |
| 139 | function_ref<void(StringRef::iterator, const Twine &)> ErrorCallback); |
| 140 | |
| 141 | } // end namespace llvm |
| 142 | |
| 143 | #endif |