//===- TGLexer.h - Lexer for TableGen Files ---------------------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file declares TGLexer, the lexer for TableGen files, together with the
// tgtok::TokKind token kinds it produces.
//
//===----------------------------------------------------------------------===//
| 13 | |
| 14 | #ifndef TGLEXER_H |
| 15 | #define TGLEXER_H |
| 16 | |
Michael J. Spencer | 3cc52ea | 2010-11-29 18:47:54 +0000 | [diff] [blame] | 17 | #include "llvm/Support/DataTypes.h" |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 18 | #include <string> |
Joerg Sonnenberger | dd13790 | 2011-06-01 13:10:15 +0000 | [diff] [blame] | 19 | #include <vector> |
Chris Lattner | 8dcf751 | 2007-11-22 23:19:05 +0000 | [diff] [blame] | 20 | #include <cassert> |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 21 | |
| 22 | namespace llvm { |
| 23 | class MemoryBuffer; |
Chris Lattner | 8070ea3 | 2009-06-21 03:41:50 +0000 | [diff] [blame] | 24 | class SourceMgr; |
Chris Lattner | 1e3a8a4 | 2009-06-21 03:39:35 +0000 | [diff] [blame] | 25 | class SMLoc; |
Benjamin Kramer | d1e1703 | 2010-09-27 17:42:11 +0000 | [diff] [blame] | 26 | class Twine; |
| 27 | |
/// tgtok - Namespace holding the token kinds produced by TGLexer.
namespace tgtok {
  /// TokKind - The kind of a lexed token.
  ///
  /// The enumerators are grouped by the payload that accompanies them:
  /// most carry no extra information, IntVal carries an integer value, and
  /// Id/StrVal/VarName/CodeFragment carry a string value (these are exactly
  /// the kinds TGLexer::getCurStrVal() accepts).
  ///
  /// Enumerators have implicit values, so their order determines their
  /// numeric value; append rather than reorder if that value matters.
  enum TokKind {
    // Markers
    Eof, Error,

    // Tokens with no info.
    minus, plus,        // - +
    l_square, r_square, // [ ]
    l_brace, r_brace,   // { }
    l_paren, r_paren,   // ( )
    less, greater,      // < >
    colon, semi,        // : ;
    comma, period,      // , .
    equal, question,    // = ?
    paste,              // #

    // Keywords.
    Bit, Bits, Class, Code, Dag, Def, Defm, Field, In, Int, Let, List,
    MultiClass, String,

    // !keywords.
    XConcat, XSRA, XSRL, XSHL, XStrConcat, XCast, XSubst,
    XForEach, XHead, XTail, XEmpty, XIf, XEq,

    // Integer value.
    IntVal,

    // String valued tokens.
    Id, StrVal, VarName, CodeFragment
  };
}
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 59 | |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 60 | /// TGLexer - TableGen Lexer class. |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 61 | class TGLexer { |
Chris Lattner | 8070ea3 | 2009-06-21 03:41:50 +0000 | [diff] [blame] | 62 | SourceMgr &SrcMgr; |
Chris Lattner | aa739d2 | 2009-03-13 07:05:43 +0000 | [diff] [blame] | 63 | |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 64 | const char *CurPtr; |
Chris Lattner | aa739d2 | 2009-03-13 07:05:43 +0000 | [diff] [blame] | 65 | const MemoryBuffer *CurBuf; |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 66 | |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 67 | // Information about the current token. |
| 68 | const char *TokStart; |
| 69 | tgtok::TokKind CurCode; |
| 70 | std::string CurStrVal; // This is valid for ID, STRVAL, VARNAME, CODEFRAGMENT |
Dan Gohman | 63f9720 | 2008-10-17 01:33:43 +0000 | [diff] [blame] | 71 | int64_t CurIntVal; // This is valid for INTVAL. |
Chris Lattner | aa739d2 | 2009-03-13 07:05:43 +0000 | [diff] [blame] | 72 | |
| 73 | /// CurBuffer - This is the current buffer index we're lexing from as managed |
| 74 | /// by the SourceMgr object. |
| 75 | int CurBuffer; |
Joerg Sonnenberger | dd13790 | 2011-06-01 13:10:15 +0000 | [diff] [blame] | 76 | /// Dependencies - This is the list of all included files. |
| 77 | std::vector<std::string> Dependencies; |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 78 | |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 79 | public: |
Chris Lattner | 8070ea3 | 2009-06-21 03:41:50 +0000 | [diff] [blame] | 80 | TGLexer(SourceMgr &SrcMgr); |
Chris Lattner | aa739d2 | 2009-03-13 07:05:43 +0000 | [diff] [blame] | 81 | ~TGLexer() {} |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 82 | |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 83 | tgtok::TokKind Lex() { |
| 84 | return CurCode = LexToken(); |
| 85 | } |
Joerg Sonnenberger | dd13790 | 2011-06-01 13:10:15 +0000 | [diff] [blame] | 86 | |
| 87 | const std::vector<std::string> &getDependencies() const { |
| 88 | return Dependencies; |
| 89 | } |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 90 | |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 91 | tgtok::TokKind getCode() const { return CurCode; } |
| 92 | |
| 93 | const std::string &getCurStrVal() const { |
| 94 | assert((CurCode == tgtok::Id || CurCode == tgtok::StrVal || |
| 95 | CurCode == tgtok::VarName || CurCode == tgtok::CodeFragment) && |
| 96 | "This token doesn't have a string value"); |
| 97 | return CurStrVal; |
| 98 | } |
Dan Gohman | 63f9720 | 2008-10-17 01:33:43 +0000 | [diff] [blame] | 99 | int64_t getCurIntVal() const { |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 100 | assert(CurCode == tgtok::IntVal && "This token isn't an integer"); |
| 101 | return CurIntVal; |
| 102 | } |
| 103 | |
Chris Lattner | 1e3a8a4 | 2009-06-21 03:39:35 +0000 | [diff] [blame] | 104 | SMLoc getLoc() const; |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 105 | |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 106 | private: |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 107 | /// LexToken - Read the next token and return its code. |
| 108 | tgtok::TokKind LexToken(); |
| 109 | |
Benjamin Kramer | d1e1703 | 2010-09-27 17:42:11 +0000 | [diff] [blame] | 110 | tgtok::TokKind ReturnError(const char *Loc, const Twine &Msg); |
Chris Lattner | c8a9bbc | 2007-11-19 07:38:58 +0000 | [diff] [blame] | 111 | |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 112 | int getNextChar(); |
David Greene | a761f92 | 2011-10-19 13:03:35 +0000 | [diff] [blame] | 113 | int peekNextChar(int Index); |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 114 | void SkipBCPLComment(); |
| 115 | bool SkipCComment(); |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 116 | tgtok::TokKind LexIdentifier(); |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 117 | bool LexInclude(); |
Chris Lattner | f460165 | 2007-11-22 20:49:04 +0000 | [diff] [blame] | 118 | tgtok::TokKind LexString(); |
| 119 | tgtok::TokKind LexVarName(); |
| 120 | tgtok::TokKind LexNumber(); |
| 121 | tgtok::TokKind LexBracket(); |
| 122 | tgtok::TokKind LexExclaim(); |
Chris Lattner | a805874 | 2007-11-18 02:57:27 +0000 | [diff] [blame] | 123 | }; |
| 124 | |
| 125 | } // end namespace llvm |
| 126 | |
| 127 | #endif |