Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 1 | #include "llvm/ADT/STLExtras.h" |
Eugene Zelenko | ae7ac95 | 2016-11-18 21:57:58 +0000 | [diff] [blame] | 2 | #include <algorithm> |
Will Dietz | 981af00 | 2013-10-12 00:55:57 +0000 | [diff] [blame] | 3 | #include <cctype> |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 4 | #include <cstdio> |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 5 | #include <cstdlib> |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 6 | #include <map> |
David Blaikie | 96a9d8c | 2015-11-03 16:23:21 +0000 | [diff] [blame] | 7 | #include <memory> |
Chandler Carruth | 605e30e | 2012-12-04 10:16:57 +0000 | [diff] [blame] | 8 | #include <string> |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 9 | #include <vector> |
| 10 | |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | // Lexer |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
// Token codes handed out by the lexer. Known constructs get one of the
// negative values below; any other character is returned as its own value in
// the range [0-255], so the two sets can never collide.
enum Token {
  // end of input
  tok_eof = -1,

  // keywords that introduce a top-level command
  tok_def = -2,
  tok_extern = -3,

  // primary expression building blocks
  tok_identifier = -4,
  tok_number = -5
};
| 28 | |
// Side-channel results of the lexer: gettok() fills in the matching variable
// before it returns tok_identifier or tok_number.
static std::string IdentifierStr; // Spelling of the last identifier lexed.
static double NumVal;             // Value of the last numeric literal lexed.
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 31 | |
| 32 | /// gettok - Return the next token from standard input. |
| 33 | static int gettok() { |
| 34 | static int LastChar = ' '; |
| 35 | |
| 36 | // Skip any whitespace. |
| 37 | while (isspace(LastChar)) |
| 38 | LastChar = getchar(); |
| 39 | |
| 40 | if (isalpha(LastChar)) { // identifier: [a-zA-Z][a-zA-Z0-9]* |
| 41 | IdentifierStr = LastChar; |
| 42 | while (isalnum((LastChar = getchar()))) |
| 43 | IdentifierStr += LastChar; |
| 44 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 45 | if (IdentifierStr == "def") |
| 46 | return tok_def; |
| 47 | if (IdentifierStr == "extern") |
| 48 | return tok_extern; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 49 | return tok_identifier; |
| 50 | } |
| 51 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 52 | if (isdigit(LastChar) || LastChar == '.') { // Number: [0-9.]+ |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 53 | std::string NumStr; |
| 54 | do { |
| 55 | NumStr += LastChar; |
| 56 | LastChar = getchar(); |
| 57 | } while (isdigit(LastChar) || LastChar == '.'); |
| 58 | |
Hans Wennborg | cc9deb4 | 2015-09-29 18:02:48 +0000 | [diff] [blame] | 59 | NumVal = strtod(NumStr.c_str(), nullptr); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 60 | return tok_number; |
| 61 | } |
| 62 | |
| 63 | if (LastChar == '#') { |
| 64 | // Comment until end of line. |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 65 | do |
| 66 | LastChar = getchar(); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 67 | while (LastChar != EOF && LastChar != '\n' && LastChar != '\r'); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 68 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 69 | if (LastChar != EOF) |
| 70 | return gettok(); |
| 71 | } |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 72 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 73 | // Check for end of file. Don't eat the EOF. |
| 74 | if (LastChar == EOF) |
| 75 | return tok_eof; |
| 76 | |
| 77 | // Otherwise, just return the character as its ascii value. |
| 78 | int ThisChar = LastChar; |
| 79 | LastChar = getchar(); |
| 80 | return ThisChar; |
| 81 | } |
| 82 | |
| 83 | //===----------------------------------------------------------------------===// |
| 84 | // Abstract Syntax Tree (aka Parse Tree) |
| 85 | //===----------------------------------------------------------------------===// |
Eugene Zelenko | ae7ac95 | 2016-11-18 21:57:58 +0000 | [diff] [blame] | 86 | |
namespace {

/// ExprAST - Common base of every expression node. It only provides a virtual
/// destructor so nodes can be owned and destroyed through a base pointer.
class ExprAST {
public:
  virtual ~ExprAST() = default;
};

/// NumberExprAST - A numeric literal such as "1.0".
class NumberExprAST : public ExprAST {
public:
  NumberExprAST(double Val) : Val(Val) {}

private:
  double Val; // the literal's value
};

/// VariableExprAST - A reference to a variable by name, such as "a".
class VariableExprAST : public ExprAST {
public:
  VariableExprAST(const std::string &Name) : Name(Name) {}

private:
  std::string Name; // the referenced variable's name
};

/// BinaryExprAST - A binary operator applied to two operand expressions.
class BinaryExprAST : public ExprAST {
public:
  BinaryExprAST(char Op, std::unique_ptr<ExprAST> LHS,
                std::unique_ptr<ExprAST> RHS)
      : Op(Op), LHS(std::move(LHS)), RHS(std::move(RHS)) {}

private:
  char Op;                      // operator character, e.g. '+'
  std::unique_ptr<ExprAST> LHS; // owned left operand
  std::unique_ptr<ExprAST> RHS; // owned right operand
};

/// CallExprAST - A call of a named function with a list of argument
/// expressions.
class CallExprAST : public ExprAST {
public:
  CallExprAST(const std::string &Callee,
              std::vector<std::unique_ptr<ExprAST>> Args)
      : Callee(Callee), Args(std::move(Args)) {}

private:
  std::string Callee;                         // name of the called function
  std::vector<std::unique_ptr<ExprAST>> Args; // owned argument expressions
};

/// PrototypeAST - The "prototype" of a function: its name and the names of its
/// arguments (and therefore, implicitly, how many arguments it takes).
class PrototypeAST {
public:
  PrototypeAST(const std::string &Name, std::vector<std::string> Args)
      : Name(Name), Args(std::move(Args)) {}

private:
  std::string Name;              // function name
  std::vector<std::string> Args; // argument names, in order
};

/// FunctionAST - A complete function definition: a prototype together with the
/// expression that forms the body.
class FunctionAST {
public:
  FunctionAST(std::unique_ptr<PrototypeAST> Proto,
              std::unique_ptr<ExprAST> Body)
      : Proto(std::move(Proto)), Body(std::move(Body)) {}

private:
  std::unique_ptr<PrototypeAST> Proto; // owned prototype
  std::unique_ptr<ExprAST> Body;       // owned body expression
};

} // end anonymous namespace
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 157 | |
| 158 | //===----------------------------------------------------------------------===// |
| 159 | // Parser |
| 160 | //===----------------------------------------------------------------------===// |
| 161 | |
| 162 | /// CurTok/getNextToken - Provide a simple token buffer. CurTok is the current |
| 163 | /// token the parser is looking at. getNextToken reads another token from the |
| 164 | /// lexer and updates CurTok with its results. |
| 165 | static int CurTok; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 166 | static int getNextToken() { return CurTok = gettok(); } |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 167 | |
| 168 | /// BinopPrecedence - This holds the precedence for each binary operator that is |
| 169 | /// defined. |
| 170 | static std::map<char, int> BinopPrecedence; |
| 171 | |
| 172 | /// GetTokPrecedence - Get the precedence of the pending binary operator token. |
| 173 | static int GetTokPrecedence() { |
| 174 | if (!isascii(CurTok)) |
| 175 | return -1; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 176 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 177 | // Make sure it's a declared binop. |
| 178 | int TokPrec = BinopPrecedence[CurTok]; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 179 | if (TokPrec <= 0) |
| 180 | return -1; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 181 | return TokPrec; |
| 182 | } |
| 183 | |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 184 | /// LogError* - These are little helper functions for error handling. |
| 185 | std::unique_ptr<ExprAST> LogError(const char *Str) { |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 186 | fprintf(stderr, "Error: %s\n", Str); |
| 187 | return nullptr; |
| 188 | } |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 189 | std::unique_ptr<PrototypeAST> LogErrorP(const char *Str) { |
| 190 | LogError(Str); |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 191 | return nullptr; |
| 192 | } |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 193 | |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 194 | static std::unique_ptr<ExprAST> ParseExpression(); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 195 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 196 | /// numberexpr ::= number |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 197 | static std::unique_ptr<ExprAST> ParseNumberExpr() { |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 198 | auto Result = llvm::make_unique<NumberExprAST>(NumVal); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 199 | getNextToken(); // consume the number |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 200 | return std::move(Result); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 201 | } |
| 202 | |
| 203 | /// parenexpr ::= '(' expression ')' |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 204 | static std::unique_ptr<ExprAST> ParseParenExpr() { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 205 | getNextToken(); // eat (. |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 206 | auto V = ParseExpression(); |
| 207 | if (!V) |
| 208 | return nullptr; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 209 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 210 | if (CurTok != ')') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 211 | return LogError("expected ')'"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 212 | getNextToken(); // eat ). |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 213 | return V; |
| 214 | } |
| 215 | |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 216 | /// identifierexpr |
| 217 | /// ::= identifier |
| 218 | /// ::= identifier '(' expression* ')' |
| 219 | static std::unique_ptr<ExprAST> ParseIdentifierExpr() { |
| 220 | std::string IdName = IdentifierStr; |
| 221 | |
| 222 | getNextToken(); // eat identifier. |
| 223 | |
| 224 | if (CurTok != '(') // Simple variable ref. |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 225 | return llvm::make_unique<VariableExprAST>(IdName); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 226 | |
| 227 | // Call. |
| 228 | getNextToken(); // eat ( |
| 229 | std::vector<std::unique_ptr<ExprAST>> Args; |
| 230 | if (CurTok != ')') { |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 231 | while (true) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 232 | if (auto Arg = ParseExpression()) |
| 233 | Args.push_back(std::move(Arg)); |
| 234 | else |
| 235 | return nullptr; |
| 236 | |
| 237 | if (CurTok == ')') |
| 238 | break; |
| 239 | |
| 240 | if (CurTok != ',') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 241 | return LogError("Expected ')' or ',' in argument list"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 242 | getNextToken(); |
| 243 | } |
| 244 | } |
| 245 | |
| 246 | // Eat the ')'. |
| 247 | getNextToken(); |
| 248 | |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 249 | return llvm::make_unique<CallExprAST>(IdName, std::move(Args)); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 250 | } |
| 251 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 252 | /// primary |
| 253 | /// ::= identifierexpr |
| 254 | /// ::= numberexpr |
| 255 | /// ::= parenexpr |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 256 | static std::unique_ptr<ExprAST> ParsePrimary() { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 257 | switch (CurTok) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 258 | default: |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 259 | return LogError("unknown token when expecting an expression"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 260 | case tok_identifier: |
| 261 | return ParseIdentifierExpr(); |
| 262 | case tok_number: |
| 263 | return ParseNumberExpr(); |
| 264 | case '(': |
| 265 | return ParseParenExpr(); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 266 | } |
| 267 | } |
| 268 | |
| 269 | /// binoprhs |
| 270 | /// ::= ('+' primary)* |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 271 | static std::unique_ptr<ExprAST> ParseBinOpRHS(int ExprPrec, |
| 272 | std::unique_ptr<ExprAST> LHS) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 273 | // If this is a binop, find its precedence. |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 274 | while (true) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 275 | int TokPrec = GetTokPrecedence(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 276 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 277 | // If this is a binop that binds at least as tightly as the current binop, |
| 278 | // consume it, otherwise we are done. |
| 279 | if (TokPrec < ExprPrec) |
| 280 | return LHS; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 281 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 282 | // Okay, we know this is a binop. |
| 283 | int BinOp = CurTok; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 284 | getNextToken(); // eat binop |
| 285 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 286 | // Parse the primary expression after the binary operator. |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 287 | auto RHS = ParsePrimary(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 288 | if (!RHS) |
| 289 | return nullptr; |
| 290 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 291 | // If BinOp binds less tightly with RHS than the operator after RHS, let |
| 292 | // the pending operator take RHS as its LHS. |
| 293 | int NextPrec = GetTokPrecedence(); |
| 294 | if (TokPrec < NextPrec) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 295 | RHS = ParseBinOpRHS(TokPrec + 1, std::move(RHS)); |
| 296 | if (!RHS) |
| 297 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 298 | } |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 299 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 300 | // Merge LHS/RHS. |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 301 | LHS = llvm::make_unique<BinaryExprAST>(BinOp, std::move(LHS), |
| 302 | std::move(RHS)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 303 | } |
| 304 | } |
| 305 | |
| 306 | /// expression |
| 307 | /// ::= primary binoprhs |
| 308 | /// |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 309 | static std::unique_ptr<ExprAST> ParseExpression() { |
| 310 | auto LHS = ParsePrimary(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 311 | if (!LHS) |
| 312 | return nullptr; |
| 313 | |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 314 | return ParseBinOpRHS(0, std::move(LHS)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 315 | } |
| 316 | |
| 317 | /// prototype |
| 318 | /// ::= id '(' id* ')' |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 319 | static std::unique_ptr<PrototypeAST> ParsePrototype() { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 320 | if (CurTok != tok_identifier) |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 321 | return LogErrorP("Expected function name in prototype"); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 322 | |
| 323 | std::string FnName = IdentifierStr; |
| 324 | getNextToken(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 325 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 326 | if (CurTok != '(') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 327 | return LogErrorP("Expected '(' in prototype"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 328 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 329 | std::vector<std::string> ArgNames; |
| 330 | while (getNextToken() == tok_identifier) |
| 331 | ArgNames.push_back(IdentifierStr); |
| 332 | if (CurTok != ')') |
Lang Hames | 5d045a9 | 2016-03-25 17:41:26 +0000 | [diff] [blame] | 333 | return LogErrorP("Expected ')' in prototype"); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 334 | |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 335 | // success. |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 336 | getNextToken(); // eat ')'. |
| 337 | |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 338 | return llvm::make_unique<PrototypeAST>(FnName, std::move(ArgNames)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 339 | } |
| 340 | |
| 341 | /// definition ::= 'def' prototype expression |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 342 | static std::unique_ptr<FunctionAST> ParseDefinition() { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 343 | getNextToken(); // eat def. |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 344 | auto Proto = ParsePrototype(); |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 345 | if (!Proto) |
| 346 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 347 | |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 348 | if (auto E = ParseExpression()) |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 349 | return llvm::make_unique<FunctionAST>(std::move(Proto), std::move(E)); |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 350 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 351 | } |
| 352 | |
| 353 | /// toplevelexpr ::= expression |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 354 | static std::unique_ptr<FunctionAST> ParseTopLevelExpr() { |
| 355 | if (auto E = ParseExpression()) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 356 | // Make an anonymous proto. |
Lang Hames | bcdb994 | 2016-09-19 23:00:27 +0000 | [diff] [blame] | 357 | auto Proto = llvm::make_unique<PrototypeAST>("__anon_expr", |
| 358 | std::vector<std::string>()); |
| 359 | return llvm::make_unique<FunctionAST>(std::move(Proto), std::move(E)); |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 360 | } |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 361 | return nullptr; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 362 | } |
| 363 | |
| 364 | /// external ::= 'extern' prototype |
Lang Hames | 09bf4c1 | 2015-08-18 18:11:06 +0000 | [diff] [blame] | 365 | static std::unique_ptr<PrototypeAST> ParseExtern() { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 366 | getNextToken(); // eat extern. |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 367 | return ParsePrototype(); |
| 368 | } |
| 369 | |
| 370 | //===----------------------------------------------------------------------===// |
| 371 | // Top-Level parsing |
| 372 | //===----------------------------------------------------------------------===// |
| 373 | |
| 374 | static void HandleDefinition() { |
| 375 | if (ParseDefinition()) { |
| 376 | fprintf(stderr, "Parsed a function definition.\n"); |
| 377 | } else { |
| 378 | // Skip token for error recovery. |
| 379 | getNextToken(); |
| 380 | } |
| 381 | } |
| 382 | |
| 383 | static void HandleExtern() { |
| 384 | if (ParseExtern()) { |
| 385 | fprintf(stderr, "Parsed an extern\n"); |
| 386 | } else { |
| 387 | // Skip token for error recovery. |
| 388 | getNextToken(); |
| 389 | } |
| 390 | } |
| 391 | |
| 392 | static void HandleTopLevelExpression() { |
| 393 | // Evaluate a top-level expression into an anonymous function. |
| 394 | if (ParseTopLevelExpr()) { |
| 395 | fprintf(stderr, "Parsed a top-level expr\n"); |
| 396 | } else { |
| 397 | // Skip token for error recovery. |
| 398 | getNextToken(); |
| 399 | } |
| 400 | } |
| 401 | |
| 402 | /// top ::= definition | external | expression | ';' |
| 403 | static void MainLoop() { |
Eugene Zelenko | f981ec4 | 2016-05-19 01:08:04 +0000 | [diff] [blame] | 404 | while (true) { |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 405 | fprintf(stderr, "ready> "); |
| 406 | switch (CurTok) { |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 407 | case tok_eof: |
| 408 | return; |
| 409 | case ';': // ignore top-level semicolons. |
| 410 | getNextToken(); |
| 411 | break; |
| 412 | case tok_def: |
| 413 | HandleDefinition(); |
| 414 | break; |
| 415 | case tok_extern: |
| 416 | HandleExtern(); |
| 417 | break; |
| 418 | default: |
| 419 | HandleTopLevelExpression(); |
| 420 | break; |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 421 | } |
| 422 | } |
| 423 | } |
| 424 | |
| 425 | //===----------------------------------------------------------------------===// |
| 426 | // Main driver code. |
| 427 | //===----------------------------------------------------------------------===// |
| 428 | |
| 429 | int main() { |
| 430 | // Install standard binary operators. |
| 431 | // 1 is lowest precedence. |
| 432 | BinopPrecedence['<'] = 10; |
| 433 | BinopPrecedence['+'] = 20; |
| 434 | BinopPrecedence['-'] = 20; |
Lang Hames | 59b0da8 | 2015-08-19 18:15:58 +0000 | [diff] [blame] | 435 | BinopPrecedence['*'] = 40; // highest. |
Erick Tryzelaar | 21e83ea | 2009-09-22 21:15:19 +0000 | [diff] [blame] | 436 | |
| 437 | // Prime the first token. |
| 438 | fprintf(stderr, "ready> "); |
| 439 | getNextToken(); |
| 440 | |
| 441 | // Run the main "interpreter loop" now. |
| 442 | MainLoop(); |
| 443 | |
| 444 | return 0; |
| 445 | } |