Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 1 | //===- Token.h - MLIR Token Interface ---------------------------*- C++ -*-===// |
| 2 | // |
| 3 | // Copyright 2019 The MLIR Authors. |
| 4 | // |
| 5 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 6 | // you may not use this file except in compliance with the License. |
| 7 | // You may obtain a copy of the License at |
| 8 | // |
| 9 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 10 | // |
| 11 | // Unless required by applicable law or agreed to in writing, software |
| 12 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 13 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 14 | // See the License for the specific language governing permissions and |
| 15 | // limitations under the License. |
| 16 | // ============================================================================= |
| 17 | |
| 18 | #ifndef MLIR_LIB_PARSER_TOKEN_H |
| 19 | #define MLIR_LIB_PARSER_TOKEN_H |
| 20 | |
| 21 | #include "mlir/Support/LLVM.h" |
| 22 | #include "llvm/ADT/StringRef.h" |
| 23 | #include "llvm/Support/SMLoc.h" |
| 24 | |
| 25 | namespace mlir { |
| 26 | |
| 27 | /// This represents a token in the MLIR syntax. |
| 28 | class Token { |
| 29 | public: |
| 30 | enum TokenKind { |
| 31 | // Markers |
| 32 | eof, error, |
| 33 | |
| 34 | // Identifiers. |
| 35 | bare_identifier, // foo |
| 36 | at_identifier, // @foo |
| 37 | // TODO: @@foo, etc. |
| 38 | |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 39 | integer, // 42 |
| 40 | |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 41 | // Punctuation. |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 42 | arrow, // -> |
Chris Lattner | 4c95a50 | 2018-06-23 16:03:42 -0700 | [diff] [blame] | 43 | colon, // : |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 44 | comma, // , |
| 45 | question, // ? |
| 46 | questionquestion, // ?? |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 47 | l_paren, r_paren, // ( ) |
Chris Lattner | 4c95a50 | 2018-06-23 16:03:42 -0700 | [diff] [blame] | 48 | l_brace, r_brace, // { } |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 49 | less, greater, // < > |
| 50 | // TODO: More punctuation. |
| 51 | |
| 52 | // Keywords. |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 53 | kw_bf16, |
Chris Lattner | f6d80a0 | 2018-06-24 11:18:29 -0700 | [diff] [blame^] | 54 | kw_br, |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 55 | kw_cfgfunc, |
| 56 | kw_extfunc, |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 57 | kw_f16, |
| 58 | kw_f32, |
| 59 | kw_f64, |
| 60 | kw_i1, |
| 61 | kw_i16, |
| 62 | kw_i32, |
| 63 | kw_i64, |
| 64 | kw_i8, |
| 65 | kw_int, |
| 66 | kw_memref, |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 67 | kw_mlfunc, |
Chris Lattner | 4c95a50 | 2018-06-23 16:03:42 -0700 | [diff] [blame] | 68 | kw_return, |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 69 | kw_tensor, |
| 70 | kw_vector, |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 71 | }; |
| 72 | |
| 73 | Token(TokenKind kind, StringRef spelling) |
| 74 | : kind(kind), spelling(spelling) {} |
| 75 | |
| 76 | // Return the bytes that make up this token. |
| 77 | StringRef getSpelling() const { return spelling; } |
| 78 | |
| 79 | // Token classification. |
| 80 | TokenKind getKind() const { return kind; } |
| 81 | bool is(TokenKind K) const { return kind == K; } |
| 82 | |
| 83 | bool isAny(TokenKind k1, TokenKind k2) const { |
| 84 | return is(k1) || is(k2); |
| 85 | } |
| 86 | |
| 87 | /// Return true if this token is one of the specified kinds. |
| 88 | template <typename ...T> |
| 89 | bool isAny(TokenKind k1, TokenKind k2, TokenKind k3, T... others) const { |
| 90 | if (is(k1)) |
| 91 | return true; |
| 92 | return isAny(k2, k3, others...); |
| 93 | } |
| 94 | |
| 95 | bool isNot(TokenKind k) const { return kind != k; } |
| 96 | |
| 97 | /// Return true if this token isn't one of the specified kinds. |
| 98 | template <typename ...T> |
| 99 | bool isNot(TokenKind k1, TokenKind k2, T... others) const { |
| 100 | return !isAny(k1, k2, others...); |
| 101 | } |
| 102 | |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 103 | // Helpers to decode specific sorts of tokens. |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 104 | |
Chris Lattner | bb8fafc | 2018-06-22 15:52:02 -0700 | [diff] [blame] | 105 | /// For an integer token, return its value as an unsigned. If it doesn't fit, |
| 106 | /// return None. |
| 107 | Optional<unsigned> getUnsignedIntegerValue(); |
| 108 | |
| 109 | // Location processing. |
Chris Lattner | e79379a | 2018-06-22 10:39:19 -0700 | [diff] [blame] | 110 | llvm::SMLoc getLoc() const; |
| 111 | llvm::SMLoc getEndLoc() const; |
| 112 | llvm::SMRange getLocRange() const; |
| 113 | |
| 114 | private: |
| 115 | /// Discriminator that indicates the sort of token this is. |
| 116 | TokenKind kind; |
| 117 | |
| 118 | /// A reference to the entire token contents; this is always a pointer into |
| 119 | /// a memory buffer owned by the source manager. |
| 120 | StringRef spelling; |
| 121 | }; |
| 122 | |
| 123 | } // end namespace mlir |
| 124 | |
| 125 | #endif // MLIR_LIB_PARSER_TOKEN_H |