blob: 5d0002d4d85f52d3325acf9b52627959c2ee5779 [file] [log] [blame]
Chris Lattnera59e8772009-06-21 07:19:10 +00001//===- AsmLexer.h - Lexer for Assembly Files --------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This class declares the lexer for assembly files.
11//
12//===----------------------------------------------------------------------===//
13
14#ifndef ASMLEXER_H
15#define ASMLEXER_H
16
17#include "llvm/Support/DataTypes.h"
18#include <string>
19#include <cassert>
20
21namespace llvm {
22class MemoryBuffer;
23class SourceMgr;
24class SMLoc;
25
26namespace asmtok {
27 enum TokKind {
28 // Markers
29 Eof, Error,
30
Chris Lattner10a907d2009-06-21 19:56:35 +000031 // String values.
Chris Lattnera59e8772009-06-21 07:19:10 +000032 Identifier,
Chris Lattner4651bca2009-06-21 19:21:25 +000033 Register,
Chris Lattner10a907d2009-06-21 19:56:35 +000034 String,
35
36 // Integer values.
Chris Lattnera59e8772009-06-21 07:19:10 +000037 IntVal,
38
Chris Lattner10a907d2009-06-21 19:56:35 +000039 // No-value.
Chris Lattner4651bca2009-06-21 19:21:25 +000040 EndOfStatement,
Chris Lattnera59e8772009-06-21 07:19:10 +000041 Colon,
Chris Lattner74ec1a32009-06-22 06:32:03 +000042 Plus, Minus, Tilde,
Chris Lattner4651bca2009-06-21 19:21:25 +000043 Slash, // '/'
44 LParen, RParen,
Daniel Dunbar475839e2009-06-29 20:37:27 +000045 Star, Comma, Dollar, Equal, EqualEqual,
Chris Lattner8dfbe6c2009-06-23 05:57:07 +000046
Daniel Dunbar475839e2009-06-29 20:37:27 +000047 Pipe, PipePipe, Caret,
48 Amp, AmpAmp, Exclaim, ExclaimEqual, Percent,
49 Less, LessEqual, LessLess, LessGreater,
50 Greater, GreaterEqual, GreaterGreater
Chris Lattnera59e8772009-06-21 07:19:10 +000051 };
52}
53
54/// AsmLexer - Lexer class for assembly files.
55class AsmLexer {
56 SourceMgr &SrcMgr;
57
58 const char *CurPtr;
59 const MemoryBuffer *CurBuf;
Chris Lattnerfaf32c12009-06-24 00:33:19 +000060 // A llvm::StringSet<>, which provides uniqued and null-terminated strings.
61 void *TheStringSet;
Chris Lattnera59e8772009-06-21 07:19:10 +000062
63 // Information about the current token.
64 const char *TokStart;
65 asmtok::TokKind CurKind;
Chris Lattnerfaf32c12009-06-24 00:33:19 +000066 const char *CurStrVal; // This is valid for Identifier.
Chris Lattnera59e8772009-06-21 07:19:10 +000067 int64_t CurIntVal;
68
69 /// CurBuffer - This is the current buffer index we're lexing from as managed
70 /// by the SourceMgr object.
71 int CurBuffer;
72
Chris Lattnerfaf32c12009-06-24 00:33:19 +000073 void operator=(const AsmLexer&); // DO NOT IMPLEMENT
74 AsmLexer(const AsmLexer&); // DO NOT IMPLEMENT
Chris Lattnera59e8772009-06-21 07:19:10 +000075public:
76 AsmLexer(SourceMgr &SrcMgr);
Chris Lattnerfaf32c12009-06-24 00:33:19 +000077 ~AsmLexer();
Chris Lattnera59e8772009-06-21 07:19:10 +000078
79 asmtok::TokKind Lex() {
80 return CurKind = LexToken();
81 }
82
83 asmtok::TokKind getKind() const { return CurKind; }
Chris Lattnerb0789ed2009-06-21 20:54:55 +000084 bool is(asmtok::TokKind K) const { return CurKind == K; }
85 bool isNot(asmtok::TokKind K) const { return CurKind != K; }
Chris Lattnera59e8772009-06-21 07:19:10 +000086
Chris Lattnerfaf32c12009-06-24 00:33:19 +000087 const char *getCurStrVal() const {
Chris Lattner10a907d2009-06-21 19:56:35 +000088 assert((CurKind == asmtok::Identifier || CurKind == asmtok::Register ||
89 CurKind == asmtok::String) &&
Chris Lattnera59e8772009-06-21 07:19:10 +000090 "This token doesn't have a string value");
91 return CurStrVal;
92 }
93 int64_t getCurIntVal() const {
94 assert(CurKind == asmtok::IntVal && "This token isn't an integer");
95 return CurIntVal;
96 }
97
98 SMLoc getLoc() const;
99
Chris Lattner14ee48a2009-06-21 21:22:11 +0000100 void PrintMessage(SMLoc Loc, const std::string &Msg) const;
Chris Lattnera59e8772009-06-21 07:19:10 +0000101
102private:
103 int getNextChar();
Chris Lattner4651bca2009-06-21 19:21:25 +0000104 asmtok::TokKind ReturnError(const char *Loc, const std::string &Msg);
Chris Lattnera59e8772009-06-21 07:19:10 +0000105
106 /// LexToken - Read the next token and return its code.
107 asmtok::TokKind LexToken();
Chris Lattner4651bca2009-06-21 19:21:25 +0000108 asmtok::TokKind LexIdentifier();
109 asmtok::TokKind LexPercent();
110 asmtok::TokKind LexSlash();
Daniel Dunbar1ad7edc2009-06-29 22:00:57 +0000111 asmtok::TokKind LexLineComment();
Chris Lattner4651bca2009-06-21 19:21:25 +0000112 asmtok::TokKind LexDigit();
Chris Lattner10a907d2009-06-21 19:56:35 +0000113 asmtok::TokKind LexQuote();
Chris Lattnera59e8772009-06-21 07:19:10 +0000114};
115
116} // end namespace llvm
117
118#endif