blob: e47365bfa16b5639bbb1b67288ffed1a27582bb5 [file] [log] [blame]
Chris Lattnerbef8e0b2007-09-12 18:24:00 +00001//===-- BrainF.cpp - BrainF compiler example ----------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerfc001bb2007-12-29 20:37:57 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattnerbef8e0b2007-09-12 18:24:00 +00007//
8//===--------------------------------------------------------------------===//
9//
10// This class compiles the BrainF language into LLVM assembly.
11//
12// The BrainF language has 8 commands:
13// Command Equivalent C Action
14// ------- ------------ ------
15// , *h=getchar(); Read a character from stdin, 255 on EOF
16// . putchar(*h); Write a character to stdout
17// - --*h; Decrement tape
18// + ++*h; Increment tape
19// < --h; Move head left
20// > ++h; Move head right
21// [ while(*h) { Start loop
22// ] } End loop
23//
24//===--------------------------------------------------------------------===//
25
26#include "BrainF.h"
27#include "llvm/Constants.h"
Duncan Sandse2c43042008-04-07 13:45:04 +000028#include "llvm/Intrinsics.h"
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000029#include "llvm/ADT/STLExtras.h"
Chris Lattneref5dc362008-08-23 22:00:15 +000030#include <iostream>
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000031using namespace llvm;
32
33//Set the constants for naming
34const char *BrainF::tapereg = "tape";
35const char *BrainF::headreg = "head";
36const char *BrainF::label = "brainf";
37const char *BrainF::testreg = "test";
38
Owen Anderson8b477ed2009-07-01 16:58:40 +000039Module *BrainF::parse(std::istream *in1, int mem, CompileFlags cf,
Owen Anderson4434ed42009-07-01 23:13:44 +000040 LLVMContext& Context) {
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000041 in = in1;
42 memtotal = mem;
43 comflag = cf;
44
Owen Anderson8b477ed2009-07-01 16:58:40 +000045 header(Context);
Owen Anderson9adc0ab2009-07-14 23:09:55 +000046 readloop(0, 0, 0, Context);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000047 delete builder;
48 return module;
49}
50
Owen Anderson4434ed42009-07-01 23:13:44 +000051void BrainF::header(LLVMContext& C) {
Owen Anderson8b477ed2009-07-01 16:58:40 +000052 module = new Module("BrainF", C);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000053
54 //Function prototypes
55
56 //declare void @llvm.memset.i32(i8 *, i8, i32, i32)
Chris Lattner824b9582008-11-21 16:42:48 +000057 const Type *Tys[] = { Type::Int32Ty };
58 Function *memset_func = Intrinsic::getDeclaration(module, Intrinsic::memset,
59 Tys, 1);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000060
61 //declare i32 @getchar()
62 getchar_func = cast<Function>(module->
63 getOrInsertFunction("getchar", IntegerType::Int32Ty, NULL));
64
65 //declare i32 @putchar(i32)
66 putchar_func = cast<Function>(module->
67 getOrInsertFunction("putchar", IntegerType::Int32Ty,
68 IntegerType::Int32Ty, NULL));
69
70
71 //Function header
72
73 //define void @brainf()
74 brainf_func = cast<Function>(module->
75 getOrInsertFunction("brainf", Type::VoidTy, NULL));
76
Eric Christopher7a61d702008-08-08 19:39:37 +000077 builder = new IRBuilder<>(BasicBlock::Create(label, brainf_func));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000078
79 //%arr = malloc i8, i32 %d
Owen Andersoneed707b2009-07-24 23:12:02 +000080 ConstantInt *val_mem = ConstantInt::get(C, APInt(32, memtotal));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000081 ptr_arr = builder->CreateMalloc(IntegerType::Int8Ty, val_mem, "arr");
82
83 //call void @llvm.memset.i32(i8 *%arr, i8 0, i32 %d, i32 1)
84 {
85 Value *memset_params[] = {
86 ptr_arr,
Owen Andersoneed707b2009-07-24 23:12:02 +000087 ConstantInt::get(C, APInt(8, 0)),
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000088 val_mem,
Owen Andersoneed707b2009-07-24 23:12:02 +000089 ConstantInt::get(C, APInt(32, 1))
Chris Lattnerbef8e0b2007-09-12 18:24:00 +000090 };
91
92 CallInst *memset_call = builder->
93 CreateCall(memset_func, memset_params, array_endof(memset_params));
94 memset_call->setTailCall(false);
95 }
96
97 //%arrmax = getelementptr i8 *%arr, i32 %d
98 if (comflag & flag_arraybounds) {
99 ptr_arrmax = builder->
Owen Andersoneed707b2009-07-24 23:12:02 +0000100 CreateGEP(ptr_arr, ConstantInt::get(C, APInt(32, memtotal)), "arrmax");
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000101 }
102
103 //%head.%d = getelementptr i8 *%arr, i32 %d
104 curhead = builder->CreateGEP(ptr_arr,
Owen Andersoneed707b2009-07-24 23:12:02 +0000105 ConstantInt::get(C, APInt(32, memtotal/2)),
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000106 headreg);
107
108
109
110 //Function footer
111
112 //brainf.end:
Gabor Greif051a9502008-04-06 20:25:17 +0000113 endbb = BasicBlock::Create(label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000114
115 //free i8 *%arr
116 new FreeInst(ptr_arr, endbb);
117
118 //ret void
Gabor Greif051a9502008-04-06 20:25:17 +0000119 ReturnInst::Create(endbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000120
121
122
123 //Error block for array out of bounds
124 if (comflag & flag_arraybounds)
125 {
126 //@aberrormsg = internal constant [%d x i8] c"\00"
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000127 Constant *msg_0 =
Owen Anderson1fd70962009-07-28 18:32:17 +0000128 ConstantArray::get("Error: The head has left the tape.", true);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000129
130 GlobalVariable *aberrormsg = new GlobalVariable(
Owen Andersone9b11b42009-07-08 19:03:57 +0000131 *module,
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000132 msg_0->getType(),
133 true,
134 GlobalValue::InternalLinkage,
135 msg_0,
Owen Andersone9b11b42009-07-08 19:03:57 +0000136 "aberrormsg");
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000137
138 //declare i32 @puts(i8 *)
139 Function *puts_func = cast<Function>(module->
140 getOrInsertFunction("puts", IntegerType::Int32Ty,
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000141 C.getPointerTypeUnqual(IntegerType::Int8Ty), NULL));
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000142
143 //brainf.aberror:
Gabor Greif051a9502008-04-06 20:25:17 +0000144 aberrorbb = BasicBlock::Create(label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000145
146 //call i32 @puts(i8 *getelementptr([%d x i8] *@aberrormsg, i32 0, i32 0))
147 {
Owen Anderson0a5372e2009-07-13 04:09:18 +0000148 Constant *zero_32 = C.getNullValue(IntegerType::Int32Ty);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000149
150 Constant *gep_params[] = {
151 zero_32,
152 zero_32
153 };
154
155 Constant *msgptr = ConstantExpr::
156 getGetElementPtr(aberrormsg, gep_params,
157 array_lengthof(gep_params));
158
159 Value *puts_params[] = {
160 msgptr
161 };
162
163 CallInst *puts_call =
Gabor Greif051a9502008-04-06 20:25:17 +0000164 CallInst::Create(puts_func,
165 puts_params, array_endof(puts_params),
166 "", aberrorbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000167 puts_call->setTailCall(false);
168 }
169
170 //br label %brainf.end
Gabor Greif051a9502008-04-06 20:25:17 +0000171 BranchInst::Create(endbb, aberrorbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000172 }
173}
174
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000175void BrainF::readloop(PHINode *phi, BasicBlock *oldbb, BasicBlock *testbb,
176 LLVMContext &C) {
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000177 Symbol cursym = SYM_NONE;
178 int curvalue = 0;
179 Symbol nextsym = SYM_NONE;
180 int nextvalue = 0;
181 char c;
182 int loop;
183 int direction;
184
185 while(cursym != SYM_EOF && cursym != SYM_ENDLOOP) {
186 // Write out commands
187 switch(cursym) {
188 case SYM_NONE:
189 // Do nothing
190 break;
191
192 case SYM_READ:
193 {
194 //%tape.%d = call i32 @getchar()
195 CallInst *getchar_call = builder->CreateCall(getchar_func, tapereg);
196 getchar_call->setTailCall(false);
197 Value *tape_0 = getchar_call;
198
199 //%tape.%d = trunc i32 %tape.%d to i8
Duncan Sands89f6d882008-04-13 06:22:09 +0000200 Value *tape_1 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000201 CreateTrunc(tape_0, IntegerType::Int8Ty, tapereg);
202
203 //store i8 %tape.%d, i8 *%head.%d
204 builder->CreateStore(tape_1, curhead);
205 }
206 break;
207
208 case SYM_WRITE:
209 {
210 //%tape.%d = load i8 *%head.%d
211 LoadInst *tape_0 = builder->CreateLoad(curhead, tapereg);
212
213 //%tape.%d = sext i8 %tape.%d to i32
Duncan Sands89f6d882008-04-13 06:22:09 +0000214 Value *tape_1 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000215 CreateSExt(tape_0, IntegerType::Int32Ty, tapereg);
216
217 //call i32 @putchar(i32 %tape.%d)
218 Value *putchar_params[] = {
219 tape_1
220 };
221 CallInst *putchar_call = builder->
222 CreateCall(putchar_func,
223 putchar_params, array_endof(putchar_params));
224 putchar_call->setTailCall(false);
225 }
226 break;
227
228 case SYM_MOVE:
229 {
230 //%head.%d = getelementptr i8 *%head.%d, i32 %d
231 curhead = builder->
Owen Andersoneed707b2009-07-24 23:12:02 +0000232 CreateGEP(curhead, ConstantInt::get(C, APInt(32, curvalue)),
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000233 headreg);
234
235 //Error block for array out of bounds
236 if (comflag & flag_arraybounds)
237 {
238 //%test.%d = icmp uge i8 *%head.%d, %arrmax
Duncan Sands89f6d882008-04-13 06:22:09 +0000239 Value *test_0 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000240 CreateICmpUGE(curhead, ptr_arrmax, testreg);
241
242 //%test.%d = icmp ult i8 *%head.%d, %arr
Duncan Sands89f6d882008-04-13 06:22:09 +0000243 Value *test_1 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000244 CreateICmpULT(curhead, ptr_arr, testreg);
245
246 //%test.%d = or i1 %test.%d, %test.%d
Duncan Sands89f6d882008-04-13 06:22:09 +0000247 Value *test_2 = builder->
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000248 CreateOr(test_0, test_1, testreg);
249
250 //br i1 %test.%d, label %main.%d, label %main.%d
Gabor Greif051a9502008-04-06 20:25:17 +0000251 BasicBlock *nextbb = BasicBlock::Create(label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000252 builder->CreateCondBr(test_2, aberrorbb, nextbb);
253
254 //main.%d:
255 builder->SetInsertPoint(nextbb);
256 }
257 }
258 break;
259
260 case SYM_CHANGE:
261 {
262 //%tape.%d = load i8 *%head.%d
263 LoadInst *tape_0 = builder->CreateLoad(curhead, tapereg);
264
265 //%tape.%d = add i8 %tape.%d, %d
Duncan Sands89f6d882008-04-13 06:22:09 +0000266 Value *tape_1 = builder->
Owen Andersoneed707b2009-07-24 23:12:02 +0000267 CreateAdd(tape_0, ConstantInt::get(C, APInt(8, curvalue)), tapereg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000268
269 //store i8 %tape.%d, i8 *%head.%d\n"
270 builder->CreateStore(tape_1, curhead);
271 }
272 break;
273
274 case SYM_LOOP:
275 {
276 //br label %main.%d
Gabor Greif051a9502008-04-06 20:25:17 +0000277 BasicBlock *testbb = BasicBlock::Create(label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000278 builder->CreateBr(testbb);
279
280 //main.%d:
281 BasicBlock *bb_0 = builder->GetInsertBlock();
Gabor Greif051a9502008-04-06 20:25:17 +0000282 BasicBlock *bb_1 = BasicBlock::Create(label, brainf_func);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000283 builder->SetInsertPoint(bb_1);
284
Gabor Greifb1dbcd82008-05-15 10:04:30 +0000285 // Make part of PHI instruction now, wait until end of loop to finish
286 PHINode *phi_0 =
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000287 PHINode::Create(C.getPointerTypeUnqual(IntegerType::Int8Ty),
Gabor Greifb1dbcd82008-05-15 10:04:30 +0000288 headreg, testbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000289 phi_0->reserveOperandSpace(2);
290 phi_0->addIncoming(curhead, bb_0);
291 curhead = phi_0;
292
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000293 readloop(phi_0, bb_1, testbb, C);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000294 }
295 break;
296
297 default:
Chris Lattneref5dc362008-08-23 22:00:15 +0000298 std::cerr << "Error: Unknown symbol.\n";
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000299 abort();
300 break;
301 }
302
303 cursym = nextsym;
304 curvalue = nextvalue;
305 nextsym = SYM_NONE;
306
307 // Reading stdin loop
308 loop = (cursym == SYM_NONE)
309 || (cursym == SYM_MOVE)
310 || (cursym == SYM_CHANGE);
311 while(loop) {
312 *in>>c;
313 if (in->eof()) {
314 if (cursym == SYM_NONE) {
315 cursym = SYM_EOF;
316 } else {
317 nextsym = SYM_EOF;
318 }
319 loop = 0;
320 } else {
321 direction = 1;
322 switch(c) {
323 case '-':
324 direction = -1;
325 // Fall through
326
327 case '+':
328 if (cursym == SYM_CHANGE) {
329 curvalue += direction;
330 // loop = 1
331 } else {
332 if (cursym == SYM_NONE) {
333 cursym = SYM_CHANGE;
334 curvalue = direction;
335 // loop = 1
336 } else {
337 nextsym = SYM_CHANGE;
338 nextvalue = direction;
339 loop = 0;
340 }
341 }
342 break;
343
344 case '<':
345 direction = -1;
346 // Fall through
347
348 case '>':
349 if (cursym == SYM_MOVE) {
350 curvalue += direction;
351 // loop = 1
352 } else {
353 if (cursym == SYM_NONE) {
354 cursym = SYM_MOVE;
355 curvalue = direction;
356 // loop = 1
357 } else {
358 nextsym = SYM_MOVE;
359 nextvalue = direction;
360 loop = 0;
361 }
362 }
363 break;
364
365 case ',':
366 if (cursym == SYM_NONE) {
367 cursym = SYM_READ;
368 } else {
369 nextsym = SYM_READ;
370 }
371 loop = 0;
372 break;
373
374 case '.':
375 if (cursym == SYM_NONE) {
376 cursym = SYM_WRITE;
377 } else {
378 nextsym = SYM_WRITE;
379 }
380 loop = 0;
381 break;
382
383 case '[':
384 if (cursym == SYM_NONE) {
385 cursym = SYM_LOOP;
386 } else {
387 nextsym = SYM_LOOP;
388 }
389 loop = 0;
390 break;
391
392 case ']':
393 if (cursym == SYM_NONE) {
394 cursym = SYM_ENDLOOP;
395 } else {
396 nextsym = SYM_ENDLOOP;
397 }
398 loop = 0;
399 break;
400
401 // Ignore other characters
402 default:
403 break;
404 }
405 }
406 }
407 }
408
409 if (cursym == SYM_ENDLOOP) {
410 if (!phi) {
Chris Lattneref5dc362008-08-23 22:00:15 +0000411 std::cerr << "Error: Extra ']'\n";
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000412 abort();
413 }
414
415 // Write loop test
416 {
417 //br label %main.%d
418 builder->CreateBr(testbb);
419
420 //main.%d:
421
422 //%head.%d = phi i8 *[%head.%d, %main.%d], [%head.%d, %main.%d]
423 //Finish phi made at beginning of loop
424 phi->addIncoming(curhead, builder->GetInsertBlock());
425 Value *head_0 = phi;
426
427 //%tape.%d = load i8 *%head.%d
428 LoadInst *tape_0 = new LoadInst(head_0, tapereg, testbb);
429
430 //%test.%d = icmp eq i8 %tape.%d, 0
Owen Anderson333c4002009-07-09 23:48:35 +0000431 ICmpInst *test_0 = new ICmpInst(*testbb, ICmpInst::ICMP_EQ, tape_0,
Owen Andersoneed707b2009-07-24 23:12:02 +0000432 ConstantInt::get(C, APInt(8, 0)), testreg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000433
434 //br i1 %test.%d, label %main.%d, label %main.%d
Gabor Greif051a9502008-04-06 20:25:17 +0000435 BasicBlock *bb_0 = BasicBlock::Create(label, brainf_func);
436 BranchInst::Create(bb_0, oldbb, test_0, testbb);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000437
438 //main.%d:
439 builder->SetInsertPoint(bb_0);
440
441 //%head.%d = phi i8 *[%head.%d, %main.%d]
442 PHINode *phi_1 = builder->
Owen Anderson9adc0ab2009-07-14 23:09:55 +0000443 CreatePHI(C.getPointerTypeUnqual(IntegerType::Int8Ty), headreg);
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000444 phi_1->reserveOperandSpace(1);
445 phi_1->addIncoming(head_0, testbb);
446 curhead = phi_1;
447 }
448
449 return;
450 }
451
452 //End of the program, so go to return block
453 builder->CreateBr(endbb);
454
455 if (phi) {
Chris Lattneref5dc362008-08-23 22:00:15 +0000456 std::cerr << "Error: Missing ']'\n";
Chris Lattnerbef8e0b2007-09-12 18:24:00 +0000457 abort();
458 }
459}