blob: b002d1f496d2240da2e668e285c705424debc62b [file] [log] [blame]
Chris Lattnerbef8e0b2007-09-12 18:24:00 +00001//===-- BrainF.cpp - BrainF compiler example ----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerfc001bb2007-12-29 20:37:57 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattnerbef8e0b2007-09-12 18:24:00 +00007//
8//===--------------------------------------------------------------------===//
9//
10// This class compiles the BrainF language into LLVM assembly.
11//
12// The BrainF language has 8 commands:
13// Command Equivalent C Action
14// ------- ------------ ------
15// , *h=getchar(); Read a character from stdin, 255 on EOF
16// . putchar(*h); Write a character to stdout
17// - --*h; Decrement tape
18// + ++*h; Increment tape
19// < --h; Move head left
20// > ++h; Move head right
21// [ while(*h) { Start loop
22// ] } End loop
23//
24//===--------------------------------------------------------------------===//
25
26#include "BrainF.h"
27#include "llvm/Constants.h"
Victor Hernandez13ad5aa2009-10-17 00:00:19 +000028#include "llvm/Instructions.h"
Duncan Sandse2c43042008-04-07 13:45:04 +000029#include "llvm/Intrinsics.h"
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000030#include "llvm/ADT/STLExtras.h"
Chris Lattneref5dc362008-08-23 22:00:15 +000031#include <iostream>
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000032using namespace llvm;
33
34//Set the constants for naming
35const char *BrainF::tapereg = "tape";
36const char *BrainF::headreg = "head";
37const char *BrainF::label = "brainf";
38const char *BrainF::testreg = "test";
39
Owen Anderson8b477ed2009-07-01 16:58:40 +000040Module *BrainF::parse(std::istream *in1, int mem, CompileFlags cf,
Owen Anderson4434ed42009-07-01 23:13:44 +000041 LLVMContext& Context) {
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000042 in = in1;
43 memtotal = mem;
44 comflag = cf;
45
Owen Anderson8b477ed2009-07-01 16:58:40 +000046 header(Context);
Owen Anderson9adc0ab2009-07-14 23:09:55 +000047 readloop(0, 0, 0, Context);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000048 delete builder;
49 return module;
50}
51
Owen Anderson4434ed42009-07-01 23:13:44 +000052void BrainF::header(LLVMContext& C) {
Owen Anderson8b477ed2009-07-01 16:58:40 +000053 module = new Module("BrainF", C);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000054
55 //Function prototypes
56
Chris Lattner9908fec2010-08-10 21:45:38 +000057 //declare void @llvm.memset.p0i8.i32(i8 *, i8, i32, i32, i1)
Francois Pichete8b323a2011-07-12 22:04:11 +000058 Type *Tys[] = { Type::getInt8PtrTy(C), Type::getInt32Ty(C) };
Chris Lattner824b9582008-11-21 16:42:48 +000059 Function *memset_func = Intrinsic::getDeclaration(module, Intrinsic::memset,
Benjamin Kramereb9a85f2011-07-14 17:45:39 +000060 Tys);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000061
62 //declare i32 @getchar()
63 getchar_func = cast<Function>(module->
Owen Anderson1d0be152009-08-13 21:58:54 +000064 getOrInsertFunction("getchar", IntegerType::getInt32Ty(C), NULL));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000065
66 //declare i32 @putchar(i32)
67 putchar_func = cast<Function>(module->
Owen Anderson1d0be152009-08-13 21:58:54 +000068 getOrInsertFunction("putchar", IntegerType::getInt32Ty(C),
69 IntegerType::getInt32Ty(C), NULL));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000070
71
72 //Function header
73
74 //define void @brainf()
75 brainf_func = cast<Function>(module->
Owen Anderson1d0be152009-08-13 21:58:54 +000076 getOrInsertFunction("brainf", Type::getVoidTy(C), NULL));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000077
Owen Anderson1d0be152009-08-13 21:58:54 +000078 builder = new IRBuilder<>(BasicBlock::Create(C, label, brainf_func));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000079
80 //%arr = malloc i8, i32 %d
Owen Andersoneed707b2009-07-24 23:12:02 +000081 ConstantInt *val_mem = ConstantInt::get(C, APInt(32, memtotal));
Victor Hernandez13ad5aa2009-10-17 00:00:19 +000082 BasicBlock* BB = builder->GetInsertBlock();
Chris Lattner4b3d5462011-07-18 04:52:58 +000083 Type* IntPtrTy = IntegerType::getInt32Ty(C);
84 Type* Int8Ty = IntegerType::getInt8Ty(C);
Victor Hernandez9d0b7042009-11-07 00:16:28 +000085 Constant* allocsize = ConstantExpr::getSizeOf(Int8Ty);
86 allocsize = ConstantExpr::getTruncOrBitCast(allocsize, IntPtrTy);
87 ptr_arr = CallInst::CreateMalloc(BB, IntPtrTy, Int8Ty, allocsize, val_mem,
88 NULL, "arr");
Victor Hernandez13ad5aa2009-10-17 00:00:19 +000089 BB->getInstList().push_back(cast<Instruction>(ptr_arr));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000090
Chris Lattner9908fec2010-08-10 21:45:38 +000091 //call void @llvm.memset.p0i8.i32(i8 *%arr, i8 0, i32 %d, i32 1, i1 0)
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000092 {
93 Value *memset_params[] = {
94 ptr_arr,
Owen Andersoneed707b2009-07-24 23:12:02 +000095 ConstantInt::get(C, APInt(8, 0)),
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000096 val_mem,
Chris Lattner9908fec2010-08-10 21:45:38 +000097 ConstantInt::get(C, APInt(32, 1)),
98 ConstantInt::get(C, APInt(1, 0))
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000099 };
100
101 CallInst *memset_call = builder->
Francois Pichet0bd9d3a2011-07-15 10:59:52 +0000102 CreateCall(memset_func, memset_params);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000103 memset_call->setTailCall(false);
104 }
105
106 //%arrmax = getelementptr i8 *%arr, i32 %d
107 if (comflag & flag_arraybounds) {
108 ptr_arrmax = builder->
Owen Andersoneed707b2009-07-24 23:12:02 +0000109 CreateGEP(ptr_arr, ConstantInt::get(C, APInt(32, memtotal)), "arrmax");
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000110 }
111
112 //%head.%d = getelementptr i8 *%arr, i32 %d
113 curhead = builder->CreateGEP(ptr_arr,
Owen Andersoneed707b2009-07-24 23:12:02 +0000114 ConstantInt::get(C, APInt(32, memtotal/2)),
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000115 headreg);
116
117
118
119 //Function footer
120
121 //brainf.end:
Owen Anderson1d0be152009-08-13 21:58:54 +0000122 endbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000123
Victor Hernandez046e78c2009-10-26 23:43:48 +0000124 //call free(i8 *%arr)
125 endbb->getInstList().push_back(CallInst::CreateFree(ptr_arr, endbb));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000126
127 //ret void
Owen Anderson1d0be152009-08-13 21:58:54 +0000128 ReturnInst::Create(C, endbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000129
130
131
132 //Error block for array out of bounds
133 if (comflag & flag_arraybounds)
134 {
135 //@aberrormsg = internal constant [%d x i8] c"\00"
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000136 Constant *msg_0 =
Francois Picheta0935772012-01-31 09:35:01 +0000137 ConstantDataArray::getString(C, "Error: The head has left the tape.",
138 true);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000139
140 GlobalVariable *aberrormsg = new GlobalVariable(
Owen Andersone9b11b42009-07-08 19:03:57 +0000141 *module,
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000142 msg_0->getType(),
143 true,
144 GlobalValue::InternalLinkage,
145 msg_0,
Owen Andersone9b11b42009-07-08 19:03:57 +0000146 "aberrormsg");
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000147
148 //declare i32 @puts(i8 *)
149 Function *puts_func = cast<Function>(module->
Owen Anderson1d0be152009-08-13 21:58:54 +0000150 getOrInsertFunction("puts", IntegerType::getInt32Ty(C),
151 PointerType::getUnqual(IntegerType::getInt8Ty(C)), NULL));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000152
153 //brainf.aberror:
Owen Anderson1d0be152009-08-13 21:58:54 +0000154 aberrorbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000155
156 //call i32 @puts(i8 *getelementptr([%d x i8] *@aberrormsg, i32 0, i32 0))
157 {
Owen Anderson1d0be152009-08-13 21:58:54 +0000158 Constant *zero_32 = Constant::getNullValue(IntegerType::getInt32Ty(C));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000159
160 Constant *gep_params[] = {
161 zero_32,
162 zero_32
163 };
164
165 Constant *msgptr = ConstantExpr::
Jay Foaddab3d292011-07-21 14:31:17 +0000166 getGetElementPtr(aberrormsg, gep_params);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000167
168 Value *puts_params[] = {
169 msgptr
170 };
171
172 CallInst *puts_call =
Gabor Greif051a9502008-04-06 20:25:17 +0000173 CallInst::Create(puts_func,
Francois Pichet0bd9d3a2011-07-15 10:59:52 +0000174 puts_params,
Gabor Greif051a9502008-04-06 20:25:17 +0000175 "", aberrorbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000176 puts_call->setTailCall(false);
177 }
178
179 //br label %brainf.end
Gabor Greif051a9502008-04-06 20:25:17 +0000180 BranchInst::Create(endbb, aberrorbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000181 }
182}
183
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000184void BrainF::readloop(PHINode *phi, BasicBlock *oldbb, BasicBlock *testbb,
185 LLVMContext &C) {
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000186 Symbol cursym = SYM_NONE;
187 int curvalue = 0;
188 Symbol nextsym = SYM_NONE;
189 int nextvalue = 0;
190 char c;
191 int loop;
192 int direction;
193
194 while(cursym != SYM_EOF && cursym != SYM_ENDLOOP) {
195 // Write out commands
196 switch(cursym) {
197 case SYM_NONE:
198 // Do nothing
199 break;
200
201 case SYM_READ:
202 {
203 //%tape.%d = call i32 @getchar()
204 CallInst *getchar_call = builder->CreateCall(getchar_func, tapereg);
205 getchar_call->setTailCall(false);
206 Value *tape_0 = getchar_call;
207
208 //%tape.%d = trunc i32 %tape.%d to i8
Duncan Sands89f6d882008-04-13 06:22:09 +0000209 Value *tape_1 = builder->
Owen Anderson1d0be152009-08-13 21:58:54 +0000210 CreateTrunc(tape_0, IntegerType::getInt8Ty(C), tapereg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000211
212 //store i8 %tape.%d, i8 *%head.%d
213 builder->CreateStore(tape_1, curhead);
214 }
215 break;
216
217 case SYM_WRITE:
218 {
219 //%tape.%d = load i8 *%head.%d
220 LoadInst *tape_0 = builder->CreateLoad(curhead, tapereg);
221
222 //%tape.%d = sext i8 %tape.%d to i32
Duncan Sands89f6d882008-04-13 06:22:09 +0000223 Value *tape_1 = builder->
Owen Anderson1d0be152009-08-13 21:58:54 +0000224 CreateSExt(tape_0, IntegerType::getInt32Ty(C), tapereg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000225
226 //call i32 @putchar(i32 %tape.%d)
227 Value *putchar_params[] = {
228 tape_1
229 };
230 CallInst *putchar_call = builder->
231 CreateCall(putchar_func,
Francois Pichet0bd9d3a2011-07-15 10:59:52 +0000232 putchar_params);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000233 putchar_call->setTailCall(false);
234 }
235 break;
236
237 case SYM_MOVE:
238 {
239 //%head.%d = getelementptr i8 *%head.%d, i32 %d
240 curhead = builder->
Owen Andersoneed707b2009-07-24 23:12:02 +0000241 CreateGEP(curhead, ConstantInt::get(C, APInt(32, curvalue)),
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000242 headreg);
243
244 //Error block for array out of bounds
245 if (comflag & flag_arraybounds)
246 {
247 //%test.%d = icmp uge i8 *%head.%d, %arrmax
Duncan Sands89f6d882008-04-13 06:22:09 +0000248 Value *test_0 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000249 CreateICmpUGE(curhead, ptr_arrmax, testreg);
250
251 //%test.%d = icmp ult i8 *%head.%d, %arr
Duncan Sands89f6d882008-04-13 06:22:09 +0000252 Value *test_1 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000253 CreateICmpULT(curhead, ptr_arr, testreg);
254
255 //%test.%d = or i1 %test.%d, %test.%d
Duncan Sands89f6d882008-04-13 06:22:09 +0000256 Value *test_2 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000257 CreateOr(test_0, test_1, testreg);
258
259 //br i1 %test.%d, label %main.%d, label %main.%d
Owen Anderson1d0be152009-08-13 21:58:54 +0000260 BasicBlock *nextbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000261 builder->CreateCondBr(test_2, aberrorbb, nextbb);
262
263 //main.%d:
264 builder->SetInsertPoint(nextbb);
265 }
266 }
267 break;
268
269 case SYM_CHANGE:
270 {
271 //%tape.%d = load i8 *%head.%d
272 LoadInst *tape_0 = builder->CreateLoad(curhead, tapereg);
273
274 //%tape.%d = add i8 %tape.%d, %d
Duncan Sands89f6d882008-04-13 06:22:09 +0000275 Value *tape_1 = builder->
Owen Andersoneed707b2009-07-24 23:12:02 +0000276 CreateAdd(tape_0, ConstantInt::get(C, APInt(8, curvalue)), tapereg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000277
278 //store i8 %tape.%d, i8 *%head.%d\n"
279 builder->CreateStore(tape_1, curhead);
280 }
281 break;
282
283 case SYM_LOOP:
284 {
285 //br label %main.%d
Owen Anderson1d0be152009-08-13 21:58:54 +0000286 BasicBlock *testbb = BasicBlock::Create(C, label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000287 builder->CreateBr(testbb);
288
289 //main.%d:
290 BasicBlock *bb_0 = builder->GetInsertBlock();
Owen Anderson1d0be152009-08-13 21:58:54 +0000291 BasicBlock *bb_1 = BasicBlock::Create(C, label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000292 builder->SetInsertPoint(bb_1);
293
Gabor Greifb1dbcd82008-05-15 10:04:30 +0000294 // Make part of PHI instruction now, wait until end of loop to finish
295 PHINode *phi_0 =
Owen Anderson1d0be152009-08-13 21:58:54 +0000296 PHINode::Create(PointerType::getUnqual(IntegerType::getInt8Ty(C)),
Jay Foad3ecfc862011-03-30 11:28:46 +0000297 2, headreg, testbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000298 phi_0->addIncoming(curhead, bb_0);
299 curhead = phi_0;
300
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000301 readloop(phi_0, bb_1, testbb, C);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000302 }
303 break;
304
305 default:
Chris Lattneref5dc362008-08-23 22:00:15 +0000306 std::cerr << "Error: Unknown symbol.\n";
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000307 abort();
308 break;
309 }
310
311 cursym = nextsym;
312 curvalue = nextvalue;
313 nextsym = SYM_NONE;
314
315 // Reading stdin loop
316 loop = (cursym == SYM_NONE)
317 || (cursym == SYM_MOVE)
318 || (cursym == SYM_CHANGE);
319 while(loop) {
320 *in>>c;
321 if (in->eof()) {
322 if (cursym == SYM_NONE) {
323 cursym = SYM_EOF;
324 } else {
325 nextsym = SYM_EOF;
326 }
327 loop = 0;
328 } else {
329 direction = 1;
330 switch(c) {
331 case '-':
332 direction = -1;
333 // Fall through
334
335 case '+':
336 if (cursym == SYM_CHANGE) {
337 curvalue += direction;
338 // loop = 1
339 } else {
340 if (cursym == SYM_NONE) {
341 cursym = SYM_CHANGE;
342 curvalue = direction;
343 // loop = 1
344 } else {
345 nextsym = SYM_CHANGE;
346 nextvalue = direction;
347 loop = 0;
348 }
349 }
350 break;
351
352 case '<':
353 direction = -1;
354 // Fall through
355
356 case '>':
357 if (cursym == SYM_MOVE) {
358 curvalue += direction;
359 // loop = 1
360 } else {
361 if (cursym == SYM_NONE) {
362 cursym = SYM_MOVE;
363 curvalue = direction;
364 // loop = 1
365 } else {
366 nextsym = SYM_MOVE;
367 nextvalue = direction;
368 loop = 0;
369 }
370 }
371 break;
372
373 case ',':
374 if (cursym == SYM_NONE) {
375 cursym = SYM_READ;
376 } else {
377 nextsym = SYM_READ;
378 }
379 loop = 0;
380 break;
381
382 case '.':
383 if (cursym == SYM_NONE) {
384 cursym = SYM_WRITE;
385 } else {
386 nextsym = SYM_WRITE;
387 }
388 loop = 0;
389 break;
390
391 case '[':
392 if (cursym == SYM_NONE) {
393 cursym = SYM_LOOP;
394 } else {
395 nextsym = SYM_LOOP;
396 }
397 loop = 0;
398 break;
399
400 case ']':
401 if (cursym == SYM_NONE) {
402 cursym = SYM_ENDLOOP;
403 } else {
404 nextsym = SYM_ENDLOOP;
405 }
406 loop = 0;
407 break;
408
409 // Ignore other characters
410 default:
411 break;
412 }
413 }
414 }
415 }
416
417 if (cursym == SYM_ENDLOOP) {
418 if (!phi) {
Chris Lattneref5dc362008-08-23 22:00:15 +0000419 std::cerr << "Error: Extra ']'\n";
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000420 abort();
421 }
422
423 // Write loop test
424 {
425 //br label %main.%d
426 builder->CreateBr(testbb);
427
428 //main.%d:
429
430 //%head.%d = phi i8 *[%head.%d, %main.%d], [%head.%d, %main.%d]
431 //Finish phi made at beginning of loop
432 phi->addIncoming(curhead, builder->GetInsertBlock());
433 Value *head_0 = phi;
434
435 //%tape.%d = load i8 *%head.%d
436 LoadInst *tape_0 = new LoadInst(head_0, tapereg, testbb);
437
438 //%test.%d = icmp eq i8 %tape.%d, 0
Owen Anderson333c4002009-07-09 23:48:35 +0000439 ICmpInst *test_0 = new ICmpInst(*testbb, ICmpInst::ICMP_EQ, tape_0,
Owen Andersoneed707b2009-07-24 23:12:02 +0000440 ConstantInt::get(C, APInt(8, 0)), testreg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000441
442 //br i1 %test.%d, label %main.%d, label %main.%d
Owen Anderson1d0be152009-08-13 21:58:54 +0000443 BasicBlock *bb_0 = BasicBlock::Create(C, label, brainf_func);
Gabor Greif051a9502008-04-06 20:25:17 +0000444 BranchInst::Create(bb_0, oldbb, test_0, testbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000445
446 //main.%d:
447 builder->SetInsertPoint(bb_0);
448
449 //%head.%d = phi i8 *[%head.%d, %main.%d]
450 PHINode *phi_1 = builder->
Jay Foad3ecfc862011-03-30 11:28:46 +0000451 CreatePHI(PointerType::getUnqual(IntegerType::getInt8Ty(C)), 1,
452 headreg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000453 phi_1->addIncoming(head_0, testbb);
454 curhead = phi_1;
455 }
456
457 return;
458 }
459
460 //End of the program, so go to return block
461 builder->CreateBr(endbb);
462
463 if (phi) {
Chris Lattneref5dc362008-08-23 22:00:15 +0000464 std::cerr << "Error: Missing ']'\n";
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000465 abort();
466 }
467}