blob: f8000c41a6fc1241385bfdd9551f6faa8a570537 [file] [log] [blame]
David Blaikiea27771b2018-04-24 00:48:59 +00001#include "../include/KaleidoscopeJIT.h"
Eugene Zelenkof981ec42016-05-19 01:08:04 +00002#include "llvm/ADT/APFloat.h"
Lang Hames09bf4c12015-08-18 18:11:06 +00003#include "llvm/ADT/STLExtras.h"
Eugene Zelenkof981ec42016-05-19 01:08:04 +00004#include "llvm/IR/BasicBlock.h"
5#include "llvm/IR/Constants.h"
6#include "llvm/IR/DerivedTypes.h"
7#include "llvm/IR/Function.h"
Chandler Carruth005f27a2013-01-02 11:56:33 +00008#include "llvm/IR/IRBuilder.h"
9#include "llvm/IR/LLVMContext.h"
Chandler Carruth30d69c22015-02-13 10:01:29 +000010#include "llvm/IR/LegacyPassManager.h"
Chandler Carruth005f27a2013-01-02 11:56:33 +000011#include "llvm/IR/Module.h"
Eugene Zelenkof981ec42016-05-19 01:08:04 +000012#include "llvm/IR/Type.h"
Chandler Carruth20d4e6b2014-01-13 09:58:03 +000013#include "llvm/IR/Verifier.h"
Evan Cheng2bb40352011-08-24 18:08:43 +000014#include "llvm/Support/TargetSelect.h"
Eugene Zelenkof981ec42016-05-19 01:08:04 +000015#include "llvm/Target/TargetMachine.h"
David Blaikiea27771b2018-04-24 00:48:59 +000016#include "llvm/Transforms/InstCombine/InstCombine.h"
Chandler Carruth605e30e2012-12-04 10:16:57 +000017#include "llvm/Transforms/Scalar.h"
Chandler Carruthec5872b2016-03-11 12:10:15 +000018#include "llvm/Transforms/Scalar/GVN.h"
Eugene Zelenkoae7ac952016-11-18 21:57:58 +000019#include <algorithm>
Eugene Zelenkof981ec42016-05-19 01:08:04 +000020#include <cassert>
Will Dietz981af002013-10-12 00:55:57 +000021#include <cctype>
Eugene Zelenkof981ec42016-05-19 01:08:04 +000022#include <cstdint>
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000023#include <cstdio>
Eugene Zelenkof981ec42016-05-19 01:08:04 +000024#include <cstdlib>
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000025#include <map>
Eugene Zelenkof981ec42016-05-19 01:08:04 +000026#include <memory>
Chandler Carruth605e30e2012-12-04 10:16:57 +000027#include <string>
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000028#include <vector>
Lang Hames2d789c32015-08-26 03:07:41 +000029
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000030using namespace llvm;
Lang Hames2d789c32015-08-26 03:07:41 +000031using namespace llvm::orc;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000032
33//===----------------------------------------------------------------------===//
34// Lexer
35//===----------------------------------------------------------------------===//
36
/// Token codes produced by the lexer.
///
/// A character the lexer does not recognise is returned as its own value in
/// the range [0-255]; every recognised token kind uses one of the negative
/// codes below, so the two sets never overlap.
enum Token {
  // End of input.
  tok_eof = -1,

  // Keywords that introduce top-level commands.
  tok_def = -2,
  tok_extern = -3,

  // Primary-expression tokens.
  tok_identifier = -4,
  tok_number = -5
};
50
// Values that accompany the token code returned by the lexer.
// IdentifierStr holds the spelling when the token is tok_identifier;
// NumVal holds the parsed value when the token is tok_number.
static std::string IdentifierStr;
static double NumVal;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000053
54/// gettok - Return the next token from standard input.
55static int gettok() {
56 static int LastChar = ' ';
57
58 // Skip any whitespace.
59 while (isspace(LastChar))
60 LastChar = getchar();
61
62 if (isalpha(LastChar)) { // identifier: [a-zA-Z][a-zA-Z0-9]*
63 IdentifierStr = LastChar;
64 while (isalnum((LastChar = getchar())))
65 IdentifierStr += LastChar;
66
Eric Christopherc0239362014-12-08 18:12:28 +000067 if (IdentifierStr == "def")
68 return tok_def;
69 if (IdentifierStr == "extern")
70 return tok_extern;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000071 return tok_identifier;
72 }
73
Eric Christopherc0239362014-12-08 18:12:28 +000074 if (isdigit(LastChar) || LastChar == '.') { // Number: [0-9.]+
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000075 std::string NumStr;
76 do {
77 NumStr += LastChar;
78 LastChar = getchar();
79 } while (isdigit(LastChar) || LastChar == '.');
80
Hans Wennborgcc9deb42015-09-29 18:02:48 +000081 NumVal = strtod(NumStr.c_str(), nullptr);
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000082 return tok_number;
83 }
84
85 if (LastChar == '#') {
86 // Comment until end of line.
Eric Christopherc0239362014-12-08 18:12:28 +000087 do
88 LastChar = getchar();
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000089 while (LastChar != EOF && LastChar != '\n' && LastChar != '\r');
Eric Christopherc0239362014-12-08 18:12:28 +000090
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000091 if (LastChar != EOF)
92 return gettok();
93 }
Eric Christopherc0239362014-12-08 18:12:28 +000094
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +000095 // Check for end of file. Don't eat the EOF.
96 if (LastChar == EOF)
97 return tok_eof;
98
99 // Otherwise, just return the character as its ascii value.
100 int ThisChar = LastChar;
101 LastChar = getchar();
102 return ThisChar;
103}
104
105//===----------------------------------------------------------------------===//
106// Abstract Syntax Tree (aka Parse Tree)
107//===----------------------------------------------------------------------===//
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000108
Juergen Ributzka05c5a932013-11-19 03:08:35 +0000109namespace {
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000110
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000111/// ExprAST - Base class for all expression nodes.
112class ExprAST {
113public:
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000114 virtual ~ExprAST() = default;
115
Lang Hames2d789c32015-08-26 03:07:41 +0000116 virtual Value *codegen() = 0;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000117};
118
119/// NumberExprAST - Expression class for numeric literals like "1.0".
120class NumberExprAST : public ExprAST {
121 double Val;
Lang Hames59b0da82015-08-19 18:15:58 +0000122
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000123public:
Lang Hames09bf4c12015-08-18 18:11:06 +0000124 NumberExprAST(double Val) : Val(Val) {}
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000125
Lang Hames2d789c32015-08-26 03:07:41 +0000126 Value *codegen() override;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000127};
128
129/// VariableExprAST - Expression class for referencing a variable, like "a".
130class VariableExprAST : public ExprAST {
131 std::string Name;
Lang Hames59b0da82015-08-19 18:15:58 +0000132
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000133public:
Lang Hames09bf4c12015-08-18 18:11:06 +0000134 VariableExprAST(const std::string &Name) : Name(Name) {}
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000135
Lang Hames2d789c32015-08-26 03:07:41 +0000136 Value *codegen() override;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000137};
138
139/// BinaryExprAST - Expression class for a binary operator.
140class BinaryExprAST : public ExprAST {
141 char Op;
Lang Hames09bf4c12015-08-18 18:11:06 +0000142 std::unique_ptr<ExprAST> LHS, RHS;
Lang Hames59b0da82015-08-19 18:15:58 +0000143
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000144public:
Lang Hames09bf4c12015-08-18 18:11:06 +0000145 BinaryExprAST(char Op, std::unique_ptr<ExprAST> LHS,
146 std::unique_ptr<ExprAST> RHS)
147 : Op(Op), LHS(std::move(LHS)), RHS(std::move(RHS)) {}
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000148
Lang Hames2d789c32015-08-26 03:07:41 +0000149 Value *codegen() override;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000150};
151
152/// CallExprAST - Expression class for function calls.
153class CallExprAST : public ExprAST {
154 std::string Callee;
Lang Hames09bf4c12015-08-18 18:11:06 +0000155 std::vector<std::unique_ptr<ExprAST>> Args;
Lang Hames59b0da82015-08-19 18:15:58 +0000156
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000157public:
Lang Hames09bf4c12015-08-18 18:11:06 +0000158 CallExprAST(const std::string &Callee,
159 std::vector<std::unique_ptr<ExprAST>> Args)
160 : Callee(Callee), Args(std::move(Args)) {}
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000161
Lang Hames2d789c32015-08-26 03:07:41 +0000162 Value *codegen() override;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000163};
164
165/// PrototypeAST - This class represents the "prototype" for a function,
166/// which captures its name, and its argument names (thus implicitly the number
167/// of arguments the function takes).
168class PrototypeAST {
169 std::string Name;
170 std::vector<std::string> Args;
Lang Hames59b0da82015-08-19 18:15:58 +0000171
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000172public:
Lang Hames59b0da82015-08-19 18:15:58 +0000173 PrototypeAST(const std::string &Name, std::vector<std::string> Args)
174 : Name(Name), Args(std::move(Args)) {}
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000175
Lang Hames2d789c32015-08-26 03:07:41 +0000176 Function *codegen();
177 const std::string &getName() const { return Name; }
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000178};
179
180/// FunctionAST - This class represents a function definition itself.
181class FunctionAST {
Lang Hames09bf4c12015-08-18 18:11:06 +0000182 std::unique_ptr<PrototypeAST> Proto;
183 std::unique_ptr<ExprAST> Body;
Lang Hames59b0da82015-08-19 18:15:58 +0000184
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000185public:
Lang Hames09bf4c12015-08-18 18:11:06 +0000186 FunctionAST(std::unique_ptr<PrototypeAST> Proto,
187 std::unique_ptr<ExprAST> Body)
Lang Hames59b0da82015-08-19 18:15:58 +0000188 : Proto(std::move(Proto)), Body(std::move(Body)) {}
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000189
Lang Hames2d789c32015-08-26 03:07:41 +0000190 Function *codegen();
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000191};
Eugene Zelenkoae7ac952016-11-18 21:57:58 +0000192
Juergen Ributzka05c5a932013-11-19 03:08:35 +0000193} // end anonymous namespace
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000194
195//===----------------------------------------------------------------------===//
196// Parser
197//===----------------------------------------------------------------------===//
198
199/// CurTok/getNextToken - Provide a simple token buffer. CurTok is the current
200/// token the parser is looking at. getNextToken reads another token from the
201/// lexer and updates CurTok with its results.
202static int CurTok;
Eric Christopherc0239362014-12-08 18:12:28 +0000203static int getNextToken() { return CurTok = gettok(); }
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000204
/// BinopPrecedence - Maps each defined binary operator character to its
/// precedence.
static std::map<char, int> BinopPrecedence;
208
209/// GetTokPrecedence - Get the precedence of the pending binary operator token.
210static int GetTokPrecedence() {
211 if (!isascii(CurTok))
212 return -1;
Eric Christopherc0239362014-12-08 18:12:28 +0000213
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000214 // Make sure it's a declared binop.
215 int TokPrec = BinopPrecedence[CurTok];
Eric Christopherc0239362014-12-08 18:12:28 +0000216 if (TokPrec <= 0)
217 return -1;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000218 return TokPrec;
219}
220
Lang Hames5d045a92016-03-25 17:41:26 +0000221/// LogError* - These are little helper functions for error handling.
222std::unique_ptr<ExprAST> LogError(const char *Str) {
Eric Christopherc0239362014-12-08 18:12:28 +0000223 fprintf(stderr, "Error: %s\n", Str);
Lang Hames09bf4c12015-08-18 18:11:06 +0000224 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000225}
Hans Wennborgcc9deb42015-09-29 18:02:48 +0000226
Lang Hames5d045a92016-03-25 17:41:26 +0000227std::unique_ptr<PrototypeAST> LogErrorP(const char *Str) {
228 LogError(Str);
Lang Hames09bf4c12015-08-18 18:11:06 +0000229 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000230}
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000231
Lang Hames09bf4c12015-08-18 18:11:06 +0000232static std::unique_ptr<ExprAST> ParseExpression();
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000233
Lang Hames59b0da82015-08-19 18:15:58 +0000234/// numberexpr ::= number
235static std::unique_ptr<ExprAST> ParseNumberExpr() {
236 auto Result = llvm::make_unique<NumberExprAST>(NumVal);
237 getNextToken(); // consume the number
238 return std::move(Result);
239}
240
241/// parenexpr ::= '(' expression ')'
242static std::unique_ptr<ExprAST> ParseParenExpr() {
243 getNextToken(); // eat (.
244 auto V = ParseExpression();
245 if (!V)
246 return nullptr;
247
248 if (CurTok != ')')
Lang Hames5d045a92016-03-25 17:41:26 +0000249 return LogError("expected ')'");
Lang Hames59b0da82015-08-19 18:15:58 +0000250 getNextToken(); // eat ).
251 return V;
252}
253
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000254/// identifierexpr
255/// ::= identifier
256/// ::= identifier '(' expression* ')'
Lang Hames09bf4c12015-08-18 18:11:06 +0000257static std::unique_ptr<ExprAST> ParseIdentifierExpr() {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000258 std::string IdName = IdentifierStr;
Eric Christopherc0239362014-12-08 18:12:28 +0000259
260 getNextToken(); // eat identifier.
261
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000262 if (CurTok != '(') // Simple variable ref.
Lang Hames09bf4c12015-08-18 18:11:06 +0000263 return llvm::make_unique<VariableExprAST>(IdName);
Eric Christopherc0239362014-12-08 18:12:28 +0000264
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000265 // Call.
Eric Christopherc0239362014-12-08 18:12:28 +0000266 getNextToken(); // eat (
Lang Hames09bf4c12015-08-18 18:11:06 +0000267 std::vector<std::unique_ptr<ExprAST>> Args;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000268 if (CurTok != ')') {
Eugene Zelenkof981ec42016-05-19 01:08:04 +0000269 while (true) {
Lang Hames09bf4c12015-08-18 18:11:06 +0000270 if (auto Arg = ParseExpression())
271 Args.push_back(std::move(Arg));
272 else
273 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000274
Eric Christopherc0239362014-12-08 18:12:28 +0000275 if (CurTok == ')')
276 break;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000277
278 if (CurTok != ',')
Lang Hames5d045a92016-03-25 17:41:26 +0000279 return LogError("Expected ')' or ',' in argument list");
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000280 getNextToken();
281 }
282 }
283
284 // Eat the ')'.
285 getNextToken();
Eric Christopherc0239362014-12-08 18:12:28 +0000286
Lang Hames09bf4c12015-08-18 18:11:06 +0000287 return llvm::make_unique<CallExprAST>(IdName, std::move(Args));
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000288}
289
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000290/// primary
291/// ::= identifierexpr
292/// ::= numberexpr
293/// ::= parenexpr
Lang Hames09bf4c12015-08-18 18:11:06 +0000294static std::unique_ptr<ExprAST> ParsePrimary() {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000295 switch (CurTok) {
Eric Christopherc0239362014-12-08 18:12:28 +0000296 default:
Lang Hames5d045a92016-03-25 17:41:26 +0000297 return LogError("unknown token when expecting an expression");
Eric Christopherc0239362014-12-08 18:12:28 +0000298 case tok_identifier:
299 return ParseIdentifierExpr();
300 case tok_number:
301 return ParseNumberExpr();
302 case '(':
303 return ParseParenExpr();
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000304 }
305}
306
307/// binoprhs
308/// ::= ('+' primary)*
Lang Hames09bf4c12015-08-18 18:11:06 +0000309static std::unique_ptr<ExprAST> ParseBinOpRHS(int ExprPrec,
310 std::unique_ptr<ExprAST> LHS) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000311 // If this is a binop, find its precedence.
Eugene Zelenkof981ec42016-05-19 01:08:04 +0000312 while (true) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000313 int TokPrec = GetTokPrecedence();
Eric Christopherc0239362014-12-08 18:12:28 +0000314
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000315 // If this is a binop that binds at least as tightly as the current binop,
316 // consume it, otherwise we are done.
317 if (TokPrec < ExprPrec)
318 return LHS;
Eric Christopherc0239362014-12-08 18:12:28 +0000319
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000320 // Okay, we know this is a binop.
321 int BinOp = CurTok;
Eric Christopherc0239362014-12-08 18:12:28 +0000322 getNextToken(); // eat binop
323
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000324 // Parse the primary expression after the binary operator.
Lang Hames09bf4c12015-08-18 18:11:06 +0000325 auto RHS = ParsePrimary();
Eric Christopherc0239362014-12-08 18:12:28 +0000326 if (!RHS)
Lang Hames09bf4c12015-08-18 18:11:06 +0000327 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000328
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000329 // If BinOp binds less tightly with RHS than the operator after RHS, let
330 // the pending operator take RHS as its LHS.
331 int NextPrec = GetTokPrecedence();
332 if (TokPrec < NextPrec) {
Lang Hames09bf4c12015-08-18 18:11:06 +0000333 RHS = ParseBinOpRHS(TokPrec + 1, std::move(RHS));
334 if (!RHS)
335 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000336 }
Eric Christopherc0239362014-12-08 18:12:28 +0000337
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000338 // Merge LHS/RHS.
Lang Hames59b0da82015-08-19 18:15:58 +0000339 LHS =
340 llvm::make_unique<BinaryExprAST>(BinOp, std::move(LHS), std::move(RHS));
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000341 }
342}
343
344/// expression
345/// ::= primary binoprhs
346///
Lang Hames09bf4c12015-08-18 18:11:06 +0000347static std::unique_ptr<ExprAST> ParseExpression() {
348 auto LHS = ParsePrimary();
Eric Christopherc0239362014-12-08 18:12:28 +0000349 if (!LHS)
Lang Hames09bf4c12015-08-18 18:11:06 +0000350 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000351
Lang Hames09bf4c12015-08-18 18:11:06 +0000352 return ParseBinOpRHS(0, std::move(LHS));
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000353}
354
355/// prototype
356/// ::= id '(' id* ')'
Lang Hames09bf4c12015-08-18 18:11:06 +0000357static std::unique_ptr<PrototypeAST> ParsePrototype() {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000358 if (CurTok != tok_identifier)
Lang Hames5d045a92016-03-25 17:41:26 +0000359 return LogErrorP("Expected function name in prototype");
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000360
361 std::string FnName = IdentifierStr;
362 getNextToken();
Eric Christopherc0239362014-12-08 18:12:28 +0000363
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000364 if (CurTok != '(')
Lang Hames5d045a92016-03-25 17:41:26 +0000365 return LogErrorP("Expected '(' in prototype");
Eric Christopherc0239362014-12-08 18:12:28 +0000366
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000367 std::vector<std::string> ArgNames;
368 while (getNextToken() == tok_identifier)
369 ArgNames.push_back(IdentifierStr);
370 if (CurTok != ')')
Lang Hames5d045a92016-03-25 17:41:26 +0000371 return LogErrorP("Expected ')' in prototype");
Eric Christopherc0239362014-12-08 18:12:28 +0000372
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000373 // success.
Eric Christopherc0239362014-12-08 18:12:28 +0000374 getNextToken(); // eat ')'.
375
Lang Hames09bf4c12015-08-18 18:11:06 +0000376 return llvm::make_unique<PrototypeAST>(FnName, std::move(ArgNames));
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000377}
378
379/// definition ::= 'def' prototype expression
Lang Hames09bf4c12015-08-18 18:11:06 +0000380static std::unique_ptr<FunctionAST> ParseDefinition() {
Eric Christopherc0239362014-12-08 18:12:28 +0000381 getNextToken(); // eat def.
Lang Hames09bf4c12015-08-18 18:11:06 +0000382 auto Proto = ParsePrototype();
383 if (!Proto)
384 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000385
Lang Hames09bf4c12015-08-18 18:11:06 +0000386 if (auto E = ParseExpression())
387 return llvm::make_unique<FunctionAST>(std::move(Proto), std::move(E));
388 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000389}
390
391/// toplevelexpr ::= expression
Lang Hames09bf4c12015-08-18 18:11:06 +0000392static std::unique_ptr<FunctionAST> ParseTopLevelExpr() {
393 if (auto E = ParseExpression()) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000394 // Make an anonymous proto.
Lang Hames2d789c32015-08-26 03:07:41 +0000395 auto Proto = llvm::make_unique<PrototypeAST>("__anon_expr",
396 std::vector<std::string>());
Lang Hames09bf4c12015-08-18 18:11:06 +0000397 return llvm::make_unique<FunctionAST>(std::move(Proto), std::move(E));
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000398 }
Lang Hames09bf4c12015-08-18 18:11:06 +0000399 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000400}
401
402/// external ::= 'extern' prototype
Lang Hames09bf4c12015-08-18 18:11:06 +0000403static std::unique_ptr<PrototypeAST> ParseExtern() {
Eric Christopherc0239362014-12-08 18:12:28 +0000404 getNextToken(); // eat extern.
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000405 return ParsePrototype();
406}
407
408//===----------------------------------------------------------------------===//
409// Code Generation
410//===----------------------------------------------------------------------===//
411
Mehdi Amini03b42e42016-04-14 21:59:01 +0000412static LLVMContext TheContext;
413static IRBuilder<> Builder(TheContext);
Lang Hames24796802016-05-22 22:48:36 +0000414static std::unique_ptr<Module> TheModule;
Eric Christopherc0239362014-12-08 18:12:28 +0000415static std::map<std::string, Value *> NamedValues;
Lang Hames2d789c32015-08-26 03:07:41 +0000416static std::unique_ptr<legacy::FunctionPassManager> TheFPM;
417static std::unique_ptr<KaleidoscopeJIT> TheJIT;
418static std::map<std::string, std::unique_ptr<PrototypeAST>> FunctionProtos;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000419
Lang Hames5d045a92016-03-25 17:41:26 +0000420Value *LogErrorV(const char *Str) {
421 LogError(Str);
Lang Hames09bf4c12015-08-18 18:11:06 +0000422 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000423}
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000424
Lang Hames2d789c32015-08-26 03:07:41 +0000425Function *getFunction(std::string Name) {
426 // First, see if the function has already been added to the current module.
427 if (auto *F = TheModule->getFunction(Name))
428 return F;
429
430 // If not, check whether we can codegen the declaration from some existing
431 // prototype.
432 auto FI = FunctionProtos.find(Name);
433 if (FI != FunctionProtos.end())
434 return FI->second->codegen();
435
436 // If no existing prototype exists, return null.
437 return nullptr;
438}
439
440Value *NumberExprAST::codegen() {
Mehdi Amini03b42e42016-04-14 21:59:01 +0000441 return ConstantFP::get(TheContext, APFloat(Val));
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000442}
443
Lang Hames2d789c32015-08-26 03:07:41 +0000444Value *VariableExprAST::codegen() {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000445 // Look this variable up in the function.
446 Value *V = NamedValues[Name];
Lang Hames596aec92015-08-19 18:32:58 +0000447 if (!V)
Lang Hames5d045a92016-03-25 17:41:26 +0000448 return LogErrorV("Unknown variable name");
Lang Hames596aec92015-08-19 18:32:58 +0000449 return V;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000450}
451
Lang Hames2d789c32015-08-26 03:07:41 +0000452Value *BinaryExprAST::codegen() {
453 Value *L = LHS->codegen();
454 Value *R = RHS->codegen();
Lang Hames09bf4c12015-08-18 18:11:06 +0000455 if (!L || !R)
456 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000457
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000458 switch (Op) {
Eric Christopherc0239362014-12-08 18:12:28 +0000459 case '+':
460 return Builder.CreateFAdd(L, R, "addtmp");
461 case '-':
462 return Builder.CreateFSub(L, R, "subtmp");
463 case '*':
464 return Builder.CreateFMul(L, R, "multmp");
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000465 case '<':
466 L = Builder.CreateFCmpULT(L, R, "cmptmp");
467 // Convert bool 0/1 to double 0.0 or 1.0
Mehdi Amini03b42e42016-04-14 21:59:01 +0000468 return Builder.CreateUIToFP(L, Type::getDoubleTy(TheContext), "booltmp");
Eric Christopherc0239362014-12-08 18:12:28 +0000469 default:
Lang Hames5d045a92016-03-25 17:41:26 +0000470 return LogErrorV("invalid binary operator");
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000471 }
472}
473
Lang Hames2d789c32015-08-26 03:07:41 +0000474Value *CallExprAST::codegen() {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000475 // Look up the name in the global module table.
Lang Hames2d789c32015-08-26 03:07:41 +0000476 Function *CalleeF = getFunction(Callee);
Lang Hames09bf4c12015-08-18 18:11:06 +0000477 if (!CalleeF)
Lang Hames5d045a92016-03-25 17:41:26 +0000478 return LogErrorV("Unknown function referenced");
Eric Christopherc0239362014-12-08 18:12:28 +0000479
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000480 // If argument mismatch error.
481 if (CalleeF->arg_size() != Args.size())
Lang Hames5d045a92016-03-25 17:41:26 +0000482 return LogErrorV("Incorrect # arguments passed");
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000483
Eric Christopherc0239362014-12-08 18:12:28 +0000484 std::vector<Value *> ArgsV;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000485 for (unsigned i = 0, e = Args.size(); i != e; ++i) {
Lang Hames2d789c32015-08-26 03:07:41 +0000486 ArgsV.push_back(Args[i]->codegen());
Lang Hames09bf4c12015-08-18 18:11:06 +0000487 if (!ArgsV.back())
488 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000489 }
Eric Christopherc0239362014-12-08 18:12:28 +0000490
Francois Pichetc5d10502011-07-15 10:59:52 +0000491 return Builder.CreateCall(CalleeF, ArgsV, "calltmp");
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000492}
493
Lang Hames2d789c32015-08-26 03:07:41 +0000494Function *PrototypeAST::codegen() {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000495 // Make the function type: double(double,double) etc.
Mehdi Amini03b42e42016-04-14 21:59:01 +0000496 std::vector<Type *> Doubles(Args.size(), Type::getDoubleTy(TheContext));
Eric Christopherc0239362014-12-08 18:12:28 +0000497 FunctionType *FT =
Mehdi Amini03b42e42016-04-14 21:59:01 +0000498 FunctionType::get(Type::getDoubleTy(TheContext), Doubles, false);
Eric Christopherc0239362014-12-08 18:12:28 +0000499
Lang Hames2d789c32015-08-26 03:07:41 +0000500 Function *F =
501 Function::Create(FT, Function::ExternalLinkage, Name, TheModule.get());
Eric Christopherc0239362014-12-08 18:12:28 +0000502
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000503 // Set names for all arguments.
504 unsigned Idx = 0;
Lang Hames2d789c32015-08-26 03:07:41 +0000505 for (auto &Arg : F->args())
506 Arg.setName(Args[Idx++]);
Eric Christopherc0239362014-12-08 18:12:28 +0000507
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000508 return F;
509}
510
Lang Hames2d789c32015-08-26 03:07:41 +0000511Function *FunctionAST::codegen() {
512 // Transfer ownership of the prototype to the FunctionProtos map, but keep a
513 // reference to it for use below.
514 auto &P = *Proto;
515 FunctionProtos[Proto->getName()] = std::move(Proto);
516 Function *TheFunction = getFunction(P.getName());
Lang Hames09bf4c12015-08-18 18:11:06 +0000517 if (!TheFunction)
518 return nullptr;
Eric Christopherc0239362014-12-08 18:12:28 +0000519
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000520 // Create a new basic block to start insertion into.
Mehdi Amini03b42e42016-04-14 21:59:01 +0000521 BasicBlock *BB = BasicBlock::Create(TheContext, "entry", TheFunction);
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000522 Builder.SetInsertPoint(BB);
Eric Christopherc0239362014-12-08 18:12:28 +0000523
Lang Hames2d789c32015-08-26 03:07:41 +0000524 // Record the function arguments in the NamedValues map.
525 NamedValues.clear();
526 for (auto &Arg : TheFunction->args())
527 NamedValues[Arg.getName()] = &Arg;
528
529 if (Value *RetVal = Body->codegen()) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000530 // Finish off the function.
531 Builder.CreateRet(RetVal);
532
533 // Validate the generated code, checking for consistency.
534 verifyFunction(*TheFunction);
535
Lang Hames2d789c32015-08-26 03:07:41 +0000536 // Run the optimizer on the function.
537 TheFPM->run(*TheFunction);
538
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000539 return TheFunction;
540 }
Eric Christopherc0239362014-12-08 18:12:28 +0000541
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000542 // Error reading body, remove function.
543 TheFunction->eraseFromParent();
Lang Hames09bf4c12015-08-18 18:11:06 +0000544 return nullptr;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000545}
546
547//===----------------------------------------------------------------------===//
548// Top-Level parsing and JIT Driver
549//===----------------------------------------------------------------------===//
550
Lang Hames2d789c32015-08-26 03:07:41 +0000551static void InitializeModuleAndPassManager() {
552 // Open a new module.
Mehdi Amini03b42e42016-04-14 21:59:01 +0000553 TheModule = llvm::make_unique<Module>("my cool jit", TheContext);
Lang Hames2d789c32015-08-26 03:07:41 +0000554 TheModule->setDataLayout(TheJIT->getTargetMachine().createDataLayout());
555
556 // Create a new pass manager attached to it.
557 TheFPM = llvm::make_unique<legacy::FunctionPassManager>(TheModule.get());
558
Lang Hames2d789c32015-08-26 03:07:41 +0000559 // Do simple "peephole" optimizations and bit-twiddling optzns.
560 TheFPM->add(createInstructionCombiningPass());
561 // Reassociate expressions.
562 TheFPM->add(createReassociatePass());
563 // Eliminate Common SubExpressions.
564 TheFPM->add(createGVNPass());
565 // Simplify the control flow graph (deleting unreachable blocks, etc).
566 TheFPM->add(createCFGSimplificationPass());
567
568 TheFPM->doInitialization();
569}
570
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000571static void HandleDefinition() {
Lang Hames09bf4c12015-08-18 18:11:06 +0000572 if (auto FnAST = ParseDefinition()) {
Lang Hames2d789c32015-08-26 03:07:41 +0000573 if (auto *FnIR = FnAST->codegen()) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000574 fprintf(stderr, "Read function definition:");
Matthias Braun25bcaba2017-01-28 02:47:46 +0000575 FnIR->print(errs());
576 fprintf(stderr, "\n");
Lang Hames2d789c32015-08-26 03:07:41 +0000577 TheJIT->addModule(std::move(TheModule));
578 InitializeModuleAndPassManager();
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000579 }
580 } else {
581 // Skip token for error recovery.
582 getNextToken();
583 }
584}
585
586static void HandleExtern() {
Lang Hames09bf4c12015-08-18 18:11:06 +0000587 if (auto ProtoAST = ParseExtern()) {
Lang Hames2d789c32015-08-26 03:07:41 +0000588 if (auto *FnIR = ProtoAST->codegen()) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000589 fprintf(stderr, "Read extern: ");
Matthias Braun25bcaba2017-01-28 02:47:46 +0000590 FnIR->print(errs());
591 fprintf(stderr, "\n");
Lang Hames2d789c32015-08-26 03:07:41 +0000592 FunctionProtos[ProtoAST->getName()] = std::move(ProtoAST);
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000593 }
594 } else {
595 // Skip token for error recovery.
596 getNextToken();
597 }
598}
599
600static void HandleTopLevelExpression() {
601 // Evaluate a top-level expression into an anonymous function.
Lang Hames09bf4c12015-08-18 18:11:06 +0000602 if (auto FnAST = ParseTopLevelExpr()) {
Lang Hames2d789c32015-08-26 03:07:41 +0000603 if (FnAST->codegen()) {
Lang Hames2d789c32015-08-26 03:07:41 +0000604 // JIT the module containing the anonymous expression, keeping a handle so
605 // we can free it later.
606 auto H = TheJIT->addModule(std::move(TheModule));
607 InitializeModuleAndPassManager();
608
609 // Search the JIT for the __anon_expr symbol.
610 auto ExprSymbol = TheJIT->findSymbol("__anon_expr");
611 assert(ExprSymbol && "Function not found");
612
613 // Get the symbol's address and cast it to the right type (takes no
614 // arguments, returns a double) so we can call it as a native function.
Lang Hames4ce98662017-07-07 02:59:13 +0000615 double (*FP)() = (double (*)())(intptr_t)cantFail(ExprSymbol.getAddress());
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000616 fprintf(stderr, "Evaluated to %f\n", FP());
Lang Hames2d789c32015-08-26 03:07:41 +0000617
618 // Delete the anonymous expression module from the JIT.
619 TheJIT->removeModule(H);
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000620 }
621 } else {
622 // Skip token for error recovery.
623 getNextToken();
624 }
625}
626
627/// top ::= definition | external | expression | ';'
628static void MainLoop() {
Eugene Zelenkof981ec42016-05-19 01:08:04 +0000629 while (true) {
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000630 fprintf(stderr, "ready> ");
631 switch (CurTok) {
Eric Christopherc0239362014-12-08 18:12:28 +0000632 case tok_eof:
633 return;
Lang Hames59b0da82015-08-19 18:15:58 +0000634 case ';': // ignore top-level semicolons.
Eric Christopherc0239362014-12-08 18:12:28 +0000635 getNextToken();
Lang Hames59b0da82015-08-19 18:15:58 +0000636 break;
Eric Christopherc0239362014-12-08 18:12:28 +0000637 case tok_def:
638 HandleDefinition();
639 break;
640 case tok_extern:
641 HandleExtern();
642 break;
643 default:
644 HandleTopLevelExpression();
645 break;
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000646 }
647 }
648}
649
650//===----------------------------------------------------------------------===//
651// "Library" functions that can be "extern'd" from user code.
652//===----------------------------------------------------------------------===//
653
// DLLEXPORT expands to __declspec(dllexport) when _WIN32 is defined and to
// nothing otherwise.
#if defined(_WIN32)
#define DLLEXPORT __declspec(dllexport)
#else
#define DLLEXPORT
#endif
659
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000660/// putchard - putchar that takes a double and returns 0.
Mehdi Aminibb6805d2017-02-11 21:26:52 +0000661extern "C" DLLEXPORT double putchard(double X) {
Lang Hamesd76e0672015-08-27 20:31:44 +0000662 fputc((char)X, stderr);
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000663 return 0;
664}
665
Lang Hames59b0da82015-08-19 18:15:58 +0000666/// printd - printf that takes a double prints it as "%f\n", returning 0.
Mehdi Aminibb6805d2017-02-11 21:26:52 +0000667extern "C" DLLEXPORT double printd(double X) {
Lang Hamesd76e0672015-08-27 20:31:44 +0000668 fprintf(stderr, "%f\n", X);
Lang Hames59b0da82015-08-19 18:15:58 +0000669 return 0;
670}
671
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000672//===----------------------------------------------------------------------===//
673// Main driver code.
674//===----------------------------------------------------------------------===//
675
676int main() {
677 InitializeNativeTarget();
Eric Christopher1b74b652014-12-08 18:00:38 +0000678 InitializeNativeTargetAsmPrinter();
679 InitializeNativeTargetAsmParser();
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000680
681 // Install standard binary operators.
682 // 1 is lowest precedence.
683 BinopPrecedence['<'] = 10;
684 BinopPrecedence['+'] = 20;
685 BinopPrecedence['-'] = 20;
Eric Christopherc0239362014-12-08 18:12:28 +0000686 BinopPrecedence['*'] = 40; // highest.
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000687
688 // Prime the first token.
689 fprintf(stderr, "ready> ");
690 getNextToken();
691
Lang Hames2d789c32015-08-26 03:07:41 +0000692 TheJIT = llvm::make_unique<KaleidoscopeJIT>();
693
694 InitializeModuleAndPassManager();
695
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000696 // Run the main "interpreter loop" now.
697 MainLoop();
698
Erick Tryzelaar21e83ea2009-09-22 21:15:19 +0000699 return 0;
700}