blob: dde07222bed5118893927e0797b2deab25d27fe8 [file] [log] [blame]
Chris Lattnere79379a2018-06-22 10:39:19 -07001//===- Token.h - MLIR Token Interface ---------------------------*- C++ -*-===//
2//
3// Copyright 2019 The MLIR Authors.
4//
5// Licensed under the Apache License, Version 2.0 (the "License");
6// you may not use this file except in compliance with the License.
7// You may obtain a copy of the License at
8//
9// http://www.apache.org/licenses/LICENSE-2.0
10//
11// Unless required by applicable law or agreed to in writing, software
12// distributed under the License is distributed on an "AS IS" BASIS,
13// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14// See the License for the specific language governing permissions and
15// limitations under the License.
16// =============================================================================
17
18#ifndef MLIR_LIB_PARSER_TOKEN_H
19#define MLIR_LIB_PARSER_TOKEN_H
20
21#include "mlir/Support/LLVM.h"
22#include "llvm/ADT/StringRef.h"
23#include "llvm/Support/SMLoc.h"
24
25namespace mlir {
26
27/// This represents a token in the MLIR syntax.
28class Token {
29public:
30 enum TokenKind {
31 // Markers
32 eof, error,
33
34 // Identifiers.
35 bare_identifier, // foo
36 at_identifier, // @foo
37 // TODO: @@foo, etc.
38
Chris Lattnerbb8fafc2018-06-22 15:52:02 -070039 integer, // 42
40
Chris Lattnere79379a2018-06-22 10:39:19 -070041 // Punctuation.
Chris Lattnerbb8fafc2018-06-22 15:52:02 -070042 arrow, // ->
Chris Lattner4c95a502018-06-23 16:03:42 -070043 colon, // :
Chris Lattnerbb8fafc2018-06-22 15:52:02 -070044 comma, // ,
45 question, // ?
46 questionquestion, // ??
Chris Lattnere79379a2018-06-22 10:39:19 -070047 l_paren, r_paren, // ( )
Chris Lattner4c95a502018-06-23 16:03:42 -070048 l_brace, r_brace, // { }
Chris Lattnere79379a2018-06-22 10:39:19 -070049 less, greater, // < >
50 // TODO: More punctuation.
51
52 // Keywords.
Chris Lattnerbb8fafc2018-06-22 15:52:02 -070053 kw_bf16,
Chris Lattnerf6d80a02018-06-24 11:18:29 -070054 kw_br,
Chris Lattnere79379a2018-06-22 10:39:19 -070055 kw_cfgfunc,
56 kw_extfunc,
Chris Lattnerbb8fafc2018-06-22 15:52:02 -070057 kw_f16,
58 kw_f32,
59 kw_f64,
60 kw_i1,
61 kw_i16,
62 kw_i32,
63 kw_i64,
64 kw_i8,
65 kw_int,
66 kw_memref,
Chris Lattnere79379a2018-06-22 10:39:19 -070067 kw_mlfunc,
Chris Lattner4c95a502018-06-23 16:03:42 -070068 kw_return,
Chris Lattnerbb8fafc2018-06-22 15:52:02 -070069 kw_tensor,
70 kw_vector,
Chris Lattnere79379a2018-06-22 10:39:19 -070071 };
72
73 Token(TokenKind kind, StringRef spelling)
74 : kind(kind), spelling(spelling) {}
75
76 // Return the bytes that make up this token.
77 StringRef getSpelling() const { return spelling; }
78
79 // Token classification.
80 TokenKind getKind() const { return kind; }
81 bool is(TokenKind K) const { return kind == K; }
82
83 bool isAny(TokenKind k1, TokenKind k2) const {
84 return is(k1) || is(k2);
85 }
86
87 /// Return true if this token is one of the specified kinds.
88 template <typename ...T>
89 bool isAny(TokenKind k1, TokenKind k2, TokenKind k3, T... others) const {
90 if (is(k1))
91 return true;
92 return isAny(k2, k3, others...);
93 }
94
95 bool isNot(TokenKind k) const { return kind != k; }
96
97 /// Return true if this token isn't one of the specified kinds.
98 template <typename ...T>
99 bool isNot(TokenKind k1, TokenKind k2, T... others) const {
100 return !isAny(k1, k2, others...);
101 }
102
Chris Lattnerbb8fafc2018-06-22 15:52:02 -0700103 // Helpers to decode specific sorts of tokens.
Chris Lattnere79379a2018-06-22 10:39:19 -0700104
Chris Lattnerbb8fafc2018-06-22 15:52:02 -0700105 /// For an integer token, return its value as an unsigned. If it doesn't fit,
106 /// return None.
107 Optional<unsigned> getUnsignedIntegerValue();
108
109 // Location processing.
Chris Lattnere79379a2018-06-22 10:39:19 -0700110 llvm::SMLoc getLoc() const;
111 llvm::SMLoc getEndLoc() const;
112 llvm::SMRange getLocRange() const;
113
114private:
115 /// Discriminator that indicates the sort of token this is.
116 TokenKind kind;
117
118 /// A reference to the entire token contents; this is always a pointer into
119 /// a memory buffer owned by the source manager.
120 StringRef spelling;
121};
122
123} // end namespace mlir
124
125#endif // MLIR_LIB_PARSER_TOKEN_H