Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 1 | #include "llvm/ADT/STLExtras.h" |
Will Dietz | 981af00 | 2013-10-12 00:55:57 +0000 | [diff] [blame] | 2 | #include <cctype> |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 3 | #include <cstdio> |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 4 | #include <cstdlib> |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 5 | #include <map> |
David Blaikie | 96a9d8c | 2015-11-03 16:23:21 +0000 | [diff] [blame] | 6 | #include <memory> |
Chandler Carruth | 605e30e | 2012-12-04 10:16:57 +0000 | [diff] [blame] | 7 | #include <string> |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 8 | #include <vector> |
| 9 | |
| 10 | //===----------------------------------------------------------------------===// |
| 11 | // Lexer |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
// Token codes produced by the lexer. Characters the lexer does not recognise
// are returned as their own value in the range [0-255]; everything it does
// recognise is reported as one of the negative codes below.
enum Token {
  tok_eof = -1, // end of input

  // commands
  tok_def = -2,    // the "def" keyword
  tok_extern = -3, // the "extern" keyword

  // primary
  tok_identifier = -4, // identifier; its spelling is left in IdentifierStr
  tok_number = -5      // numeric literal; its value is left in NumVal
};
| 27 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 28 | static std::string IdentifierStr; // Filled in if tok_identifier |
| 29 | static double NumVal; // Filled in if tok_number |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 30 | |
| 31 | /// gettok - Return the next token from standard input. |
| 32 | static int gettok() { |
| 33 | static int LastChar = ' '; |
| 34 | |
| 35 | // Skip any whitespace. |
| 36 | while (isspace(LastChar)) |
| 37 | LastChar = getchar(); |
| 38 | |
| 39 | if (isalpha(LastChar)) { // identifier: [a-zA-Z][a-zA-Z0-9]* |
| 40 | IdentifierStr = LastChar; |
| 41 | while (isalnum((LastChar = getchar()))) |
| 42 | IdentifierStr += LastChar; |
| 43 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 44 | if (IdentifierStr == "def") |
| 45 | return tok_def; |
| 46 | if (IdentifierStr == "extern") |
| 47 | return tok_extern; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 48 | return tok_identifier; |
| 49 | } |
| 50 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 51 | if (isdigit(LastChar) || LastChar == '.') { // Number: [0-9.]+ |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 52 | std::string NumStr; |
| 53 | do { |
| 54 | NumStr += LastChar; |
| 55 | LastChar = getchar(); |
| 56 | } while (isdigit(LastChar) || LastChar == '.'); |
| 57 | |
Hans Wennborg | cc9deb4 | 2015-09-29 18:02:48 +0000 | [diff] [blame] | 58 | NumVal = strtod(NumStr.c_str(), nullptr); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 59 | return tok_number; |
| 60 | } |
| 61 | |
| 62 | if (LastChar == '#') { |
| 63 | // Comment until end of line. |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 64 | do |
| 65 | LastChar = getchar(); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 66 | while (LastChar != EOF && LastChar != '\n' && LastChar != '\r'); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 67 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 68 | if (LastChar != EOF) |
| 69 | return gettok(); |
| 70 | } |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 71 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 72 | // Check for end of file. Don't eat the EOF. |
| 73 | if (LastChar == EOF) |
| 74 | return tok_eof; |
| 75 | |
| 76 | // Otherwise, just return the character as its ascii value. |
| 77 | int ThisChar = LastChar; |
| 78 | LastChar = getchar(); |
| 79 | return ThisChar; |
| 80 | } |
| 81 | |
| 82 | //===----------------------------------------------------------------------===// |
| 83 | // Abstract Syntax Tree (aka Parse Tree) |
| 84 | //===----------------------------------------------------------------------===// |
namespace {
/// ExprAST - Base class for all expression nodes.
///
/// Nodes are held through std::unique_ptr<ExprAST>, so the destructor is
/// virtual to allow destroying a derived node through a base pointer.
class ExprAST {
public:
  virtual ~ExprAST() = default;
};

/// NumberExprAST - Expression class for numeric literals like "1.0".
class NumberExprAST : public ExprAST {
  double Val;

public:
  /// Explicit so that a double is never silently converted into an AST node.
  explicit NumberExprAST(double Val) : Val(Val) {}
};

/// VariableExprAST - Expression class for referencing a variable, like "a".
class VariableExprAST : public ExprAST {
  std::string Name;

public:
  /// Explicit so that a string is never silently converted into an AST node.
  explicit VariableExprAST(const std::string &Name) : Name(Name) {}
};

/// BinaryExprAST - Expression class for a binary operator.
class BinaryExprAST : public ExprAST {
  char Op;
  std::unique_ptr<ExprAST> LHS, RHS;

public:
  /// Takes ownership of both operand subtrees.
  BinaryExprAST(char Op, std::unique_ptr<ExprAST> LHS,
                std::unique_ptr<ExprAST> RHS)
      : Op(Op), LHS(std::move(LHS)), RHS(std::move(RHS)) {}
};

/// CallExprAST - Expression class for function calls.
class CallExprAST : public ExprAST {
  std::string Callee;
  std::vector<std::unique_ptr<ExprAST>> Args;

public:
  /// Takes ownership of the argument expressions.
  CallExprAST(const std::string &Callee,
              std::vector<std::unique_ptr<ExprAST>> Args)
      : Callee(Callee), Args(std::move(Args)) {}
};

/// PrototypeAST - This class represents the "prototype" for a function,
/// which captures its name, and its argument names (thus implicitly the number
/// of arguments the function takes).
class PrototypeAST {
  std::string Name;
  std::vector<std::string> Args;

public:
  PrototypeAST(const std::string &Name, std::vector<std::string> Args)
      : Name(Name), Args(std::move(Args)) {}
};

/// FunctionAST - This class represents a function definition itself.
class FunctionAST {
  std::unique_ptr<PrototypeAST> Proto;
  std::unique_ptr<ExprAST> Body;

public:
  /// Takes ownership of the prototype and of the body expression.
  FunctionAST(std::unique_ptr<PrototypeAST> Proto,
              std::unique_ptr<ExprAST> Body)
      : Proto(std::move(Proto)), Body(std::move(Body)) {}
};
} // end anonymous namespace
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 153 | |
| 154 | //===----------------------------------------------------------------------===// |
| 155 | // Parser |
| 156 | //===----------------------------------------------------------------------===// |
| 157 | |
| 158 | /// CurTok/getNextToken - Provide a simple token buffer. CurTok is the current |
| 159 | /// token the parser is looking at. getNextToken reads another token from the |
| 160 | /// lexer and updates CurTok with its results. |
| 161 | static int CurTok; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 162 | static int getNextToken() { return CurTok = gettok(); } |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 163 | |
| 164 | /// BinopPrecedence - This holds the precedence for each binary operator that is |
| 165 | /// defined. |
| 166 | static std::map<char, int> BinopPrecedence; |
| 167 | |
| 168 | /// GetTokPrecedence - Get the precedence of the pending binary operator token. |
| 169 | static int GetTokPrecedence() { |
| 170 | if (!isascii(CurTok)) |
| 171 | return -1; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 172 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 173 | // Make sure it's a declared binop. |
| 174 | int TokPrec = BinopPrecedence[CurTok]; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 175 | if (TokPrec <= 0) |
| 176 | return -1; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 177 | return TokPrec; |
| 178 | } |
| 179 | |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 180 | /// LogError* - These are little helper functions for error handling. |
| 181 | std::unique_ptr<ExprAST> LogError(const char *Str) { |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 182 | fprintf(stderr, "Error: %s\n", Str); |
| 183 | return nullptr; |
| 184 | } |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 185 | std::unique_ptr<PrototypeAST> LogErrorP(const char *Str) { |
| 186 | LogError(Str); |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 187 | return nullptr; |
| 188 | } |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 189 | |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 190 | static std::unique_ptr<ExprAST> ParseExpression(); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 191 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 192 | /// numberexpr ::= number |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 193 | static std::unique_ptr<ExprAST> ParseNumberExpr() { |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 194 | auto Result = llvm::make_unique<NumberExprAST>(NumVal); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 195 | getNextToken(); // consume the number |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 196 | return std::move(Result); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 197 | } |
| 198 | |
| 199 | /// parenexpr ::= '(' expression ')' |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 200 | static std::unique_ptr<ExprAST> ParseParenExpr() { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 201 | getNextToken(); // eat (. |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 202 | auto V = ParseExpression(); |
| 203 | if (!V) |
| 204 | return nullptr; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 205 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 206 | if (CurTok != ')') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 207 | return LogError("expected ')'"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 208 | getNextToken(); // eat ). |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 209 | return V; |
| 210 | } |
| 211 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 212 | /// identifierexpr |
| 213 | /// ::= identifier |
| 214 | /// ::= identifier '(' expression* ')' |
| 215 | static std::unique_ptr<ExprAST> ParseIdentifierExpr() { |
| 216 | std::string IdName = IdentifierStr; |
| 217 | |
| 218 | getNextToken(); // eat identifier. |
| 219 | |
| 220 | if (CurTok != '(') // Simple variable ref. |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 221 | return llvm::make_unique<VariableExprAST>(IdName); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 222 | |
| 223 | // Call. |
| 224 | getNextToken(); // eat ( |
| 225 | std::vector<std::unique_ptr<ExprAST>> Args; |
| 226 | if (CurTok != ')') { |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 227 | while (true) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 228 | if (auto Arg = ParseExpression()) |
| 229 | Args.push_back(std::move(Arg)); |
| 230 | else |
| 231 | return nullptr; |
| 232 | |
| 233 | if (CurTok == ')') |
| 234 | break; |
| 235 | |
| 236 | if (CurTok != ',') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 237 | return LogError("Expected ')' or ',' in argument list"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 238 | getNextToken(); |
| 239 | } |
| 240 | } |
| 241 | |
| 242 | // Eat the ')'. |
| 243 | getNextToken(); |
| 244 | |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 245 | return llvm::make_unique<CallExprAST>(IdName, std::move(Args)); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 246 | } |
| 247 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 248 | /// primary |
| 249 | /// ::= identifierexpr |
| 250 | /// ::= numberexpr |
| 251 | /// ::= parenexpr |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 252 | static std::unique_ptr<ExprAST> ParsePrimary() { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 253 | switch (CurTok) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 254 | default: |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 255 | return LogError("unknown token when expecting an expression"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 256 | case tok_identifier: |
| 257 | return ParseIdentifierExpr(); |
| 258 | case tok_number: |
| 259 | return ParseNumberExpr(); |
| 260 | case '(': |
| 261 | return ParseParenExpr(); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 262 | } |
| 263 | } |
| 264 | |
| 265 | /// binoprhs |
| 266 | /// ::= ('+' primary)* |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 267 | static std::unique_ptr<ExprAST> ParseBinOpRHS(int ExprPrec, |
| 268 | std::unique_ptr<ExprAST> LHS) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 269 | // If this is a binop, find its precedence. |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 270 | while (true) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 271 | int TokPrec = GetTokPrecedence(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 272 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 273 | // If this is a binop that binds at least as tightly as the current binop, |
| 274 | // consume it, otherwise we are done. |
| 275 | if (TokPrec < ExprPrec) |
| 276 | return LHS; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 277 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 278 | // Okay, we know this is a binop. |
| 279 | int BinOp = CurTok; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 280 | getNextToken(); // eat binop |
| 281 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 282 | // Parse the primary expression after the binary operator. |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 283 | auto RHS = ParsePrimary(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 284 | if (!RHS) |
| 285 | return nullptr; |
| 286 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 287 | // If BinOp binds less tightly with RHS than the operator after RHS, let |
| 288 | // the pending operator take RHS as its LHS. |
| 289 | int NextPrec = GetTokPrecedence(); |
| 290 | if (TokPrec < NextPrec) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 291 | RHS = ParseBinOpRHS(TokPrec + 1, std::move(RHS)); |
| 292 | if (!RHS) |
| 293 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 294 | } |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 295 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 296 | // Merge LHS/RHS. |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 297 | LHS = llvm::make_unique<BinaryExprAST>(BinOp, std::move(LHS), |
| 298 | std::move(RHS)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 299 | } |
| 300 | } |
| 301 | |
| 302 | /// expression |
| 303 | /// ::= primary binoprhs |
| 304 | /// |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 305 | static std::unique_ptr<ExprAST> ParseExpression() { |
| 306 | auto LHS = ParsePrimary(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 307 | if (!LHS) |
| 308 | return nullptr; |
| 309 | |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 310 | return ParseBinOpRHS(0, std::move(LHS)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 311 | } |
| 312 | |
| 313 | /// prototype |
| 314 | /// ::= id '(' id* ')' |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 315 | static std::unique_ptr<PrototypeAST> ParsePrototype() { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 316 | if (CurTok != tok_identifier) |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 317 | return LogErrorP("Expected function name in prototype"); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 318 | |
| 319 | std::string FnName = IdentifierStr; |
| 320 | getNextToken(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 321 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 322 | if (CurTok != '(') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 323 | return LogErrorP("Expected '(' in prototype"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 324 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 325 | std::vector<std::string> ArgNames; |
| 326 | while (getNextToken() == tok_identifier) |
| 327 | ArgNames.push_back(IdentifierStr); |
| 328 | if (CurTok != ')') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 329 | return LogErrorP("Expected ')' in prototype"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 330 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 331 | // success. |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 332 | getNextToken(); // eat ')'. |
| 333 | |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 334 | return llvm::make_unique<PrototypeAST>(FnName, std::move(ArgNames)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 335 | } |
| 336 | |
| 337 | /// definition ::= 'def' prototype expression |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 338 | static std::unique_ptr<FunctionAST> ParseDefinition() { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 339 | getNextToken(); // eat def. |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 340 | auto Proto = ParsePrototype(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 341 | if (!Proto) |
| 342 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 343 | |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 344 | if (auto E = ParseExpression()) |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 345 | return llvm::make_unique<FunctionAST>(std::move(Proto), std::move(E)); |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 346 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 347 | } |
| 348 | |
| 349 | /// toplevelexpr ::= expression |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 350 | static std::unique_ptr<FunctionAST> ParseTopLevelExpr() { |
| 351 | if (auto E = ParseExpression()) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 352 | // Make an anonymous proto. |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame^] | 353 | auto Proto = llvm::make_unique<PrototypeAST>("__anon_expr", |
| 354 | std::vector<std::string>()); |
| 355 | return llvm::make_unique<FunctionAST>(std::move(Proto), std::move(E)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 356 | } |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 357 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 358 | } |
| 359 | |
| 360 | /// external ::= 'extern' prototype |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 361 | static std::unique_ptr<PrototypeAST> ParseExtern() { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 362 | getNextToken(); // eat extern. |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 363 | return ParsePrototype(); |
| 364 | } |
| 365 | |
| 366 | //===----------------------------------------------------------------------===// |
| 367 | // Top-Level parsing |
| 368 | //===----------------------------------------------------------------------===// |
| 369 | |
| 370 | static void HandleDefinition() { |
| 371 | if (ParseDefinition()) { |
| 372 | fprintf(stderr, "Parsed a function definition.\n"); |
| 373 | } else { |
| 374 | // Skip token for error recovery. |
| 375 | getNextToken(); |
| 376 | } |
| 377 | } |
| 378 | |
| 379 | static void HandleExtern() { |
| 380 | if (ParseExtern()) { |
| 381 | fprintf(stderr, "Parsed an extern\n"); |
| 382 | } else { |
| 383 | // Skip token for error recovery. |
| 384 | getNextToken(); |
| 385 | } |
| 386 | } |
| 387 | |
| 388 | static void HandleTopLevelExpression() { |
| 389 | // Evaluate a top-level expression into an anonymous function. |
| 390 | if (ParseTopLevelExpr()) { |
| 391 | fprintf(stderr, "Parsed a top-level expr\n"); |
| 392 | } else { |
| 393 | // Skip token for error recovery. |
| 394 | getNextToken(); |
| 395 | } |
| 396 | } |
| 397 | |
| 398 | /// top ::= definition | external | expression | ';' |
| 399 | static void MainLoop() { |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 400 | while (true) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 401 | fprintf(stderr, "ready> "); |
| 402 | switch (CurTok) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 403 | case tok_eof: |
| 404 | return; |
| 405 | case ';': // ignore top-level semicolons. |
| 406 | getNextToken(); |
| 407 | break; |
| 408 | case tok_def: |
| 409 | HandleDefinition(); |
| 410 | break; |
| 411 | case tok_extern: |
| 412 | HandleExtern(); |
| 413 | break; |
| 414 | default: |
| 415 | HandleTopLevelExpression(); |
| 416 | break; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 417 | } |
| 418 | } |
| 419 | } |
| 420 | |
| 421 | //===----------------------------------------------------------------------===// |
| 422 | // Main driver code. |
| 423 | //===----------------------------------------------------------------------===// |
| 424 | |
| 425 | int main() { |
| 426 | // Install standard binary operators. |
| 427 | // 1 is lowest precedence. |
| 428 | BinopPrecedence['<'] = 10; |
| 429 | BinopPrecedence['+'] = 20; |
| 430 | BinopPrecedence['-'] = 20; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 431 | BinopPrecedence['*'] = 40; // highest. |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 432 | |
| 433 | // Prime the first token. |
| 434 | fprintf(stderr, "ready> "); |
| 435 | getNextToken(); |
| 436 | |
| 437 | // Run the main "interpreter loop" now. |
| 438 | MainLoop(); |
| 439 | |
| 440 | return 0; |
| 441 | } |