blob: d8c54b50b854902cd78f7e3b35a6c8e6468f22c0 [file] [log] [blame]
Chris Lattner909ef092007-09-12 18:24:00 +00001//===-- BrainF.cpp - BrainF compiler example ----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerbcf65db2007-12-29 20:37:57 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattner909ef092007-09-12 18:24:00 +00007//
8//===--------------------------------------------------------------------===//
9//
10// This class compiles the BrainF language into LLVM assembly.
11//
12// The BrainF language has 8 commands:
13// Command Equivalent C Action
14// ------- ------------ ------
15// , *h=getchar(); Read a character from stdin, 255 on EOF
16// . putchar(*h); Write a character to stdout
17// - --*h; Decrement tape
18// + ++*h; Increment tape
19// < --h; Move head left
20// > ++h; Move head right
21// [ while(*h) { Start loop
22// ] } End loop
23//
24//===--------------------------------------------------------------------===//
25
26#include "BrainF.h"
Chandler Carruth605e30e2012-12-04 10:16:57 +000027#include "llvm/ADT/STLExtras.h"
Chandler Carruth005f27a2013-01-02 11:56:33 +000028#include "llvm/IR/Constants.h"
29#include "llvm/IR/Instructions.h"
30#include "llvm/IR/Intrinsics.h"
Chris Lattner8e8eae62008-08-23 22:00:15 +000031#include <iostream>
Hans Wennborgcc9deb42015-09-29 18:02:48 +000032
Chris Lattner909ef092007-09-12 18:24:00 +000033using namespace llvm;
34
35//Set the constants for naming
36const char *BrainF::tapereg = "tape";
37const char *BrainF::headreg = "head";
38const char *BrainF::label = "brainf";
39const char *BrainF::testreg = "test";
40
Owen Anderson6773d382009-07-01 16:58:40 +000041Module *BrainF::parse(std::istream *in1, int mem, CompileFlags cf,
Owen Anderson2a154432009-07-01 23:13:44 +000042 LLVMContext& Context) {
Chris Lattner909ef092007-09-12 18:24:00 +000043 in = in1;
44 memtotal = mem;
45 comflag = cf;
46
Owen Anderson6773d382009-07-01 16:58:40 +000047 header(Context);
Hans Wennborgcc9deb42015-09-29 18:02:48 +000048 readloop(nullptr, nullptr, nullptr, Context);
Chris Lattner909ef092007-09-12 18:24:00 +000049 delete builder;
50 return module;
51}
52
Owen Anderson2a154432009-07-01 23:13:44 +000053void BrainF::header(LLVMContext& C) {
Owen Anderson6773d382009-07-01 16:58:40 +000054 module = new Module("BrainF", C);
Chris Lattner909ef092007-09-12 18:24:00 +000055
56 //Function prototypes
57
Chris Lattner0b6dce42010-08-10 21:45:38 +000058 //declare void @llvm.memset.p0i8.i32(i8 *, i8, i32, i32, i1)
Francois Pichetce206002011-07-12 22:04:11 +000059 Type *Tys[] = { Type::getInt8PtrTy(C), Type::getInt32Ty(C) };
Chris Lattnerdd708342008-11-21 16:42:48 +000060 Function *memset_func = Intrinsic::getDeclaration(module, Intrinsic::memset,
Benjamin Kramere6e19332011-07-14 17:45:39 +000061 Tys);
Chris Lattner909ef092007-09-12 18:24:00 +000062
63 //declare i32 @getchar()
64 getchar_func = cast<Function>(module->
Owen Anderson55f1c092009-08-13 21:58:54 +000065 getOrInsertFunction("getchar", IntegerType::getInt32Ty(C), NULL));
Chris Lattner909ef092007-09-12 18:24:00 +000066
67 //declare i32 @putchar(i32)
68 putchar_func = cast<Function>(module->
Owen Anderson55f1c092009-08-13 21:58:54 +000069 getOrInsertFunction("putchar", IntegerType::getInt32Ty(C),
70 IntegerType::getInt32Ty(C), NULL));
Chris Lattner909ef092007-09-12 18:24:00 +000071
Chris Lattner909ef092007-09-12 18:24:00 +000072 //Function header
73
74 //define void @brainf()
75 brainf_func = cast<Function>(module->
Owen Anderson55f1c092009-08-13 21:58:54 +000076 getOrInsertFunction("brainf", Type::getVoidTy(C), NULL));
Chris Lattner909ef092007-09-12 18:24:00 +000077
Owen Anderson55f1c092009-08-13 21:58:54 +000078 builder = new IRBuilder<>(BasicBlock::Create(C, label, brainf_func));
Chris Lattner909ef092007-09-12 18:24:00 +000079
80 //%arr = malloc i8, i32 %d
Owen Andersonedb4a702009-07-24 23:12:02 +000081 ConstantInt *val_mem = ConstantInt::get(C, APInt(32, memtotal));
Victor Hernandezc7d6a832009-10-17 00:00:19 +000082 BasicBlock* BB = builder->GetInsertBlock();
Chris Lattner805d0942011-07-18 04:52:58 +000083 Type* IntPtrTy = IntegerType::getInt32Ty(C);
84 Type* Int8Ty = IntegerType::getInt8Ty(C);
Victor Hernandezf3db9152009-11-07 00:16:28 +000085 Constant* allocsize = ConstantExpr::getSizeOf(Int8Ty);
86 allocsize = ConstantExpr::getTruncOrBitCast(allocsize, IntPtrTy);
87 ptr_arr = CallInst::CreateMalloc(BB, IntPtrTy, Int8Ty, allocsize, val_mem,
Hans Wennborgcc9deb42015-09-29 18:02:48 +000088 nullptr, "arr");
Victor Hernandezc7d6a832009-10-17 00:00:19 +000089 BB->getInstList().push_back(cast<Instruction>(ptr_arr));
Chris Lattner909ef092007-09-12 18:24:00 +000090
Chris Lattner0b6dce42010-08-10 21:45:38 +000091 //call void @llvm.memset.p0i8.i32(i8 *%arr, i8 0, i32 %d, i32 1, i1 0)
Chris Lattner909ef092007-09-12 18:24:00 +000092 {
93 Value *memset_params[] = {
94 ptr_arr,
Owen Andersonedb4a702009-07-24 23:12:02 +000095 ConstantInt::get(C, APInt(8, 0)),
Chris Lattner909ef092007-09-12 18:24:00 +000096 val_mem,
Chris Lattner0b6dce42010-08-10 21:45:38 +000097 ConstantInt::get(C, APInt(32, 1)),
98 ConstantInt::get(C, APInt(1, 0))
Chris Lattner909ef092007-09-12 18:24:00 +000099 };
100
101 CallInst *memset_call = builder->
Francois Pichetc5d10502011-07-15 10:59:52 +0000102 CreateCall(memset_func, memset_params);
Chris Lattner909ef092007-09-12 18:24:00 +0000103 memset_call->setTailCall(false);
104 }
105
106 //%arrmax = getelementptr i8 *%arr, i32 %d
107 if (comflag & flag_arraybounds) {
108 ptr_arrmax = builder->
Owen Andersonedb4a702009-07-24 23:12:02 +0000109 CreateGEP(ptr_arr, ConstantInt::get(C, APInt(32, memtotal)), "arrmax");
Chris Lattner909ef092007-09-12 18:24:00 +0000110 }
111
112 //%head.%d = getelementptr i8 *%arr, i32 %d
113 curhead = builder->CreateGEP(ptr_arr,
Owen Andersonedb4a702009-07-24 23:12:02 +0000114 ConstantInt::get(C, APInt(32, memtotal/2)),
Chris Lattner909ef092007-09-12 18:24:00 +0000115 headreg);
116
Chris Lattner909ef092007-09-12 18:24:00 +0000117 //Function footer
118
119 //brainf.end:
Owen Anderson55f1c092009-08-13 21:58:54 +0000120 endbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattner909ef092007-09-12 18:24:00 +0000121
Victor Hernandezde5ad422009-10-26 23:43:48 +0000122 //call free(i8 *%arr)
123 endbb->getInstList().push_back(CallInst::CreateFree(ptr_arr, endbb));
Chris Lattner909ef092007-09-12 18:24:00 +0000124
125 //ret void
Owen Anderson55f1c092009-08-13 21:58:54 +0000126 ReturnInst::Create(C, endbb);
Chris Lattner909ef092007-09-12 18:24:00 +0000127
Chris Lattner909ef092007-09-12 18:24:00 +0000128 //Error block for array out of bounds
129 if (comflag & flag_arraybounds)
130 {
131 //@aberrormsg = internal constant [%d x i8] c"\00"
Owen Andersonb6b25302009-07-14 23:09:55 +0000132 Constant *msg_0 =
Francois Pichet4ce6e6e2012-01-31 09:35:01 +0000133 ConstantDataArray::getString(C, "Error: The head has left the tape.",
134 true);
Chris Lattner909ef092007-09-12 18:24:00 +0000135
136 GlobalVariable *aberrormsg = new GlobalVariable(
Owen Andersonb17f3292009-07-08 19:03:57 +0000137 *module,
Chris Lattner909ef092007-09-12 18:24:00 +0000138 msg_0->getType(),
139 true,
140 GlobalValue::InternalLinkage,
141 msg_0,
Owen Andersonb17f3292009-07-08 19:03:57 +0000142 "aberrormsg");
Chris Lattner909ef092007-09-12 18:24:00 +0000143
144 //declare i32 @puts(i8 *)
145 Function *puts_func = cast<Function>(module->
Owen Anderson55f1c092009-08-13 21:58:54 +0000146 getOrInsertFunction("puts", IntegerType::getInt32Ty(C),
147 PointerType::getUnqual(IntegerType::getInt8Ty(C)), NULL));
Chris Lattner909ef092007-09-12 18:24:00 +0000148
149 //brainf.aberror:
Owen Anderson55f1c092009-08-13 21:58:54 +0000150 aberrorbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattner909ef092007-09-12 18:24:00 +0000151
152 //call i32 @puts(i8 *getelementptr([%d x i8] *@aberrormsg, i32 0, i32 0))
153 {
Owen Anderson55f1c092009-08-13 21:58:54 +0000154 Constant *zero_32 = Constant::getNullValue(IntegerType::getInt32Ty(C));
Chris Lattner909ef092007-09-12 18:24:00 +0000155
156 Constant *gep_params[] = {
157 zero_32,
158 zero_32
159 };
160
161 Constant *msgptr = ConstantExpr::
NAKAMURA Takumi696f2752015-04-02 22:44:00 +0000162 getGetElementPtr(aberrormsg->getValueType(), aberrormsg, gep_params);
Chris Lattner909ef092007-09-12 18:24:00 +0000163
164 Value *puts_params[] = {
165 msgptr
166 };
167
168 CallInst *puts_call =
Gabor Greife9ecc682008-04-06 20:25:17 +0000169 CallInst::Create(puts_func,
Francois Pichetc5d10502011-07-15 10:59:52 +0000170 puts_params,
Gabor Greife9ecc682008-04-06 20:25:17 +0000171 "", aberrorbb);
Chris Lattner909ef092007-09-12 18:24:00 +0000172 puts_call->setTailCall(false);
173 }
174
175 //br label %brainf.end
Gabor Greife9ecc682008-04-06 20:25:17 +0000176 BranchInst::Create(endbb, aberrorbb);
Chris Lattner909ef092007-09-12 18:24:00 +0000177 }
178}
179
Owen Andersonb6b25302009-07-14 23:09:55 +0000180void BrainF::readloop(PHINode *phi, BasicBlock *oldbb, BasicBlock *testbb,
181 LLVMContext &C) {
Chris Lattner909ef092007-09-12 18:24:00 +0000182 Symbol cursym = SYM_NONE;
183 int curvalue = 0;
184 Symbol nextsym = SYM_NONE;
185 int nextvalue = 0;
186 char c;
187 int loop;
188 int direction;
189
190 while(cursym != SYM_EOF && cursym != SYM_ENDLOOP) {
191 // Write out commands
192 switch(cursym) {
193 case SYM_NONE:
194 // Do nothing
195 break;
196
197 case SYM_READ:
198 {
199 //%tape.%d = call i32 @getchar()
NAKAMURA Takumi5b9bc2f2015-05-19 06:50:19 +0000200 CallInst *getchar_call =
201 builder->CreateCall(getchar_func, {}, tapereg);
Chris Lattner909ef092007-09-12 18:24:00 +0000202 getchar_call->setTailCall(false);
203 Value *tape_0 = getchar_call;
204
205 //%tape.%d = trunc i32 %tape.%d to i8
Duncan Sandsa07136e2008-04-13 06:22:09 +0000206 Value *tape_1 = builder->
Owen Anderson55f1c092009-08-13 21:58:54 +0000207 CreateTrunc(tape_0, IntegerType::getInt8Ty(C), tapereg);
Chris Lattner909ef092007-09-12 18:24:00 +0000208
209 //store i8 %tape.%d, i8 *%head.%d
210 builder->CreateStore(tape_1, curhead);
211 }
212 break;
213
214 case SYM_WRITE:
215 {
216 //%tape.%d = load i8 *%head.%d
217 LoadInst *tape_0 = builder->CreateLoad(curhead, tapereg);
218
219 //%tape.%d = sext i8 %tape.%d to i32
Duncan Sandsa07136e2008-04-13 06:22:09 +0000220 Value *tape_1 = builder->
Owen Anderson55f1c092009-08-13 21:58:54 +0000221 CreateSExt(tape_0, IntegerType::getInt32Ty(C), tapereg);
Chris Lattner909ef092007-09-12 18:24:00 +0000222
223 //call i32 @putchar(i32 %tape.%d)
224 Value *putchar_params[] = {
225 tape_1
226 };
227 CallInst *putchar_call = builder->
228 CreateCall(putchar_func,
Francois Pichetc5d10502011-07-15 10:59:52 +0000229 putchar_params);
Chris Lattner909ef092007-09-12 18:24:00 +0000230 putchar_call->setTailCall(false);
231 }
232 break;
233
234 case SYM_MOVE:
235 {
236 //%head.%d = getelementptr i8 *%head.%d, i32 %d
237 curhead = builder->
Owen Andersonedb4a702009-07-24 23:12:02 +0000238 CreateGEP(curhead, ConstantInt::get(C, APInt(32, curvalue)),
Chris Lattner909ef092007-09-12 18:24:00 +0000239 headreg);
240
241 //Error block for array out of bounds
242 if (comflag & flag_arraybounds)
243 {
244 //%test.%d = icmp uge i8 *%head.%d, %arrmax
Duncan Sandsa07136e2008-04-13 06:22:09 +0000245 Value *test_0 = builder->
Chris Lattner909ef092007-09-12 18:24:00 +0000246 CreateICmpUGE(curhead, ptr_arrmax, testreg);
247
248 //%test.%d = icmp ult i8 *%head.%d, %arr
Duncan Sandsa07136e2008-04-13 06:22:09 +0000249 Value *test_1 = builder->
Chris Lattner909ef092007-09-12 18:24:00 +0000250 CreateICmpULT(curhead, ptr_arr, testreg);
251
252 //%test.%d = or i1 %test.%d, %test.%d
Duncan Sandsa07136e2008-04-13 06:22:09 +0000253 Value *test_2 = builder->
Chris Lattner909ef092007-09-12 18:24:00 +0000254 CreateOr(test_0, test_1, testreg);
255
256 //br i1 %test.%d, label %main.%d, label %main.%d
Owen Anderson55f1c092009-08-13 21:58:54 +0000257 BasicBlock *nextbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattner909ef092007-09-12 18:24:00 +0000258 builder->CreateCondBr(test_2, aberrorbb, nextbb);
259
260 //main.%d:
261 builder->SetInsertPoint(nextbb);
262 }
263 }
264 break;
265
266 case SYM_CHANGE:
267 {
268 //%tape.%d = load i8 *%head.%d
269 LoadInst *tape_0 = builder->CreateLoad(curhead, tapereg);
270
271 //%tape.%d = add i8 %tape.%d, %d
Duncan Sandsa07136e2008-04-13 06:22:09 +0000272 Value *tape_1 = builder->
Owen Andersonedb4a702009-07-24 23:12:02 +0000273 CreateAdd(tape_0, ConstantInt::get(C, APInt(8, curvalue)), tapereg);
Chris Lattner909ef092007-09-12 18:24:00 +0000274
275 //store i8 %tape.%d, i8 *%head.%d\n"
276 builder->CreateStore(tape_1, curhead);
277 }
278 break;
279
280 case SYM_LOOP:
281 {
282 //br label %main.%d
Owen Anderson55f1c092009-08-13 21:58:54 +0000283 BasicBlock *testbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattner909ef092007-09-12 18:24:00 +0000284 builder->CreateBr(testbb);
285
286 //main.%d:
287 BasicBlock *bb_0 = builder->GetInsertBlock();
Owen Anderson55f1c092009-08-13 21:58:54 +0000288 BasicBlock *bb_1 = BasicBlock::Create(C, label, brainf_func);
Chris Lattner909ef092007-09-12 18:24:00 +0000289 builder->SetInsertPoint(bb_1);
290
Gabor Greif697e94c2008-05-15 10:04:30 +0000291 // Make part of PHI instruction now, wait until end of loop to finish
292 PHINode *phi_0 =
Owen Anderson55f1c092009-08-13 21:58:54 +0000293 PHINode::Create(PointerType::getUnqual(IntegerType::getInt8Ty(C)),
Jay Foad52131342011-03-30 11:28:46 +0000294 2, headreg, testbb);
Chris Lattner909ef092007-09-12 18:24:00 +0000295 phi_0->addIncoming(curhead, bb_0);
296 curhead = phi_0;
297
Owen Andersonb6b25302009-07-14 23:09:55 +0000298 readloop(phi_0, bb_1, testbb, C);
Chris Lattner909ef092007-09-12 18:24:00 +0000299 }
300 break;
301
302 default:
Chris Lattner8e8eae62008-08-23 22:00:15 +0000303 std::cerr << "Error: Unknown symbol.\n";
Chris Lattner909ef092007-09-12 18:24:00 +0000304 abort();
305 break;
306 }
307
308 cursym = nextsym;
309 curvalue = nextvalue;
310 nextsym = SYM_NONE;
311
312 // Reading stdin loop
313 loop = (cursym == SYM_NONE)
314 || (cursym == SYM_MOVE)
315 || (cursym == SYM_CHANGE);
316 while(loop) {
317 *in>>c;
318 if (in->eof()) {
319 if (cursym == SYM_NONE) {
320 cursym = SYM_EOF;
321 } else {
322 nextsym = SYM_EOF;
323 }
324 loop = 0;
325 } else {
326 direction = 1;
327 switch(c) {
328 case '-':
329 direction = -1;
330 // Fall through
331
332 case '+':
333 if (cursym == SYM_CHANGE) {
334 curvalue += direction;
335 // loop = 1
336 } else {
337 if (cursym == SYM_NONE) {
338 cursym = SYM_CHANGE;
339 curvalue = direction;
340 // loop = 1
341 } else {
342 nextsym = SYM_CHANGE;
343 nextvalue = direction;
344 loop = 0;
345 }
346 }
347 break;
348
349 case '<':
350 direction = -1;
351 // Fall through
352
353 case '>':
354 if (cursym == SYM_MOVE) {
355 curvalue += direction;
356 // loop = 1
357 } else {
358 if (cursym == SYM_NONE) {
359 cursym = SYM_MOVE;
360 curvalue = direction;
361 // loop = 1
362 } else {
363 nextsym = SYM_MOVE;
364 nextvalue = direction;
365 loop = 0;
366 }
367 }
368 break;
369
370 case ',':
371 if (cursym == SYM_NONE) {
372 cursym = SYM_READ;
373 } else {
374 nextsym = SYM_READ;
375 }
376 loop = 0;
377 break;
378
379 case '.':
380 if (cursym == SYM_NONE) {
381 cursym = SYM_WRITE;
382 } else {
383 nextsym = SYM_WRITE;
384 }
385 loop = 0;
386 break;
387
388 case '[':
389 if (cursym == SYM_NONE) {
390 cursym = SYM_LOOP;
391 } else {
392 nextsym = SYM_LOOP;
393 }
394 loop = 0;
395 break;
396
397 case ']':
398 if (cursym == SYM_NONE) {
399 cursym = SYM_ENDLOOP;
400 } else {
401 nextsym = SYM_ENDLOOP;
402 }
403 loop = 0;
404 break;
405
406 // Ignore other characters
407 default:
408 break;
409 }
410 }
411 }
412 }
413
414 if (cursym == SYM_ENDLOOP) {
415 if (!phi) {
Chris Lattner8e8eae62008-08-23 22:00:15 +0000416 std::cerr << "Error: Extra ']'\n";
Chris Lattner909ef092007-09-12 18:24:00 +0000417 abort();
418 }
419
420 // Write loop test
421 {
422 //br label %main.%d
423 builder->CreateBr(testbb);
424
425 //main.%d:
426
427 //%head.%d = phi i8 *[%head.%d, %main.%d], [%head.%d, %main.%d]
428 //Finish phi made at beginning of loop
429 phi->addIncoming(curhead, builder->GetInsertBlock());
430 Value *head_0 = phi;
431
432 //%tape.%d = load i8 *%head.%d
433 LoadInst *tape_0 = new LoadInst(head_0, tapereg, testbb);
434
435 //%test.%d = icmp eq i8 %tape.%d, 0
Owen Anderson1e5f00e2009-07-09 23:48:35 +0000436 ICmpInst *test_0 = new ICmpInst(*testbb, ICmpInst::ICMP_EQ, tape_0,
Owen Andersonedb4a702009-07-24 23:12:02 +0000437 ConstantInt::get(C, APInt(8, 0)), testreg);
Chris Lattner909ef092007-09-12 18:24:00 +0000438
439 //br i1 %test.%d, label %main.%d, label %main.%d
Owen Anderson55f1c092009-08-13 21:58:54 +0000440 BasicBlock *bb_0 = BasicBlock::Create(C, label, brainf_func);
Gabor Greife9ecc682008-04-06 20:25:17 +0000441 BranchInst::Create(bb_0, oldbb, test_0, testbb);
Chris Lattner909ef092007-09-12 18:24:00 +0000442
443 //main.%d:
444 builder->SetInsertPoint(bb_0);
445
446 //%head.%d = phi i8 *[%head.%d, %main.%d]
447 PHINode *phi_1 = builder->
Jay Foad52131342011-03-30 11:28:46 +0000448 CreatePHI(PointerType::getUnqual(IntegerType::getInt8Ty(C)), 1,
449 headreg);
Chris Lattner909ef092007-09-12 18:24:00 +0000450 phi_1->addIncoming(head_0, testbb);
451 curhead = phi_1;
452 }
453
454 return;
455 }
456
457 //End of the program, so go to return block
458 builder->CreateBr(endbb);
459
460 if (phi) {
Chris Lattner8e8eae62008-08-23 22:00:15 +0000461 std::cerr << "Error: Missing ']'\n";
Chris Lattner909ef092007-09-12 18:24:00 +0000462 abort();
463 }
464}