blob: a3a70d18717b798d0559c92fbc648c1685709d72 [file] [log] [blame]
Jack Palevichae54f1f2009-05-08 14:54:15 -07001/*
Jack Paleviche7b59062009-05-19 17:12:17 -07002 * Android "Almost" C Compiler.
3 * This is a compiler for a small subset of the C language, intended for use
4 * in scripting environments where speed and memory footprint are important.
5 *
6 * This code is based upon the "unobfuscated" version of the
Jack Palevich1cdef202009-05-22 12:06:27 -07007 * Obfuscated Tiny C compiler, see the file LICENSE for details.
Jack Paleviche7b59062009-05-19 17:12:17 -07008 *
9 */
10
Jack Palevich77ae76e2009-05-10 19:59:24 -070011#include <ctype.h>
12#include <dlfcn.h>
Jack Palevichac0e95e2009-05-29 13:53:44 -070013#include <setjmp.h>
Jack Paleviche27bf3e2009-05-10 14:09:03 -070014#include <stdarg.h>
Jack Palevich8b0624c2009-05-20 12:12:06 -070015#include <stdint.h>
Jack Palevichae54f1f2009-05-08 14:54:15 -070016#include <stdio.h>
Jack Palevichf6b5a532009-05-10 19:16:42 -070017#include <stdlib.h>
18#include <string.h>
Jack Palevich2d11dfb2009-06-08 14:34:26 -070019#include <cutils/hashmap.h>
Jack Palevichae54f1f2009-05-08 14:54:15 -070020
Jack Palevich546b2242009-05-13 15:10:04 -070021#if defined(__arm__)
22#include <unistd.h>
23#endif
24
Jack Paleviche7b59062009-05-19 17:12:17 -070025#if defined(__arm__)
26#define DEFAULT_ARM_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -070027#define PROVIDE_ARM_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -070028#elif defined(__i386__)
29#define DEFAULT_X86_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -070030#define PROVIDE_X86_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -070031#elif defined(__x86_64__)
32#define DEFAULT_X64_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -070033#define PROVIDE_X64_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -070034#endif
35
Jack Paleviche7b59062009-05-19 17:12:17 -070036
37#ifdef PROVIDE_ARM_CODEGEN
Jack Palevicha6535612009-05-13 16:24:17 -070038#include "disassem.h"
Jack Paleviche7b59062009-05-19 17:12:17 -070039#endif
Jack Palevicha6535612009-05-13 16:24:17 -070040
Jack Palevich1cdef202009-05-22 12:06:27 -070041#include <acc/acc.h>
42
Jack Palevich09555c72009-05-27 12:25:55 -070043#define LOG_API(...) do {} while(0)
44// #define LOG_API(...) fprintf (stderr, __VA_ARGS__)
Jack Palevich09555c72009-05-27 12:25:55 -070045// #define ENABLE_ARM_DISASSEMBLY
46
Jack Palevichbbf8ab52009-05-11 11:54:30 -070047namespace acc {
48
/**
 * Abstract destination for diagnostics.
 *
 * Callers report problems through the printf-style error(); implementations
 * receive the format string and the packaged argument list in verror().
 */
class ErrorSink {
public:
    // Polymorphic base: the destructor is virtual so that destroying an
    // implementation through an ErrorSink* runs the derived destructor.
    virtual ~ErrorSink() {}

    /* Report an error.
     * fmt - printf-style format string.
     * ... - arguments consumed by fmt.
     * The arguments are bundled into a va_list and handed to verror().
     */
    void error(const char *fmt, ...) {
        va_list ap;
        va_start(ap, fmt);
        verror(fmt, ap);
        va_end(ap);
    }

    /* Receive an error report. Implemented by the concrete sink.
     * fmt - printf-style format string.
     * ap  - arguments consumed by fmt.
     */
    virtual void verror(const char* fmt, va_list ap) = 0;
};
60
61class Compiler : public ErrorSink {
Jack Palevich21a15a22009-05-11 14:49:29 -070062 class CodeBuf {
Jack Palevich653f42d2009-05-28 17:15:32 -070063 char* ind; // Output code pointer
Jack Palevich21a15a22009-05-11 14:49:29 -070064 char* pProgramBase;
Jack Palevichac0e95e2009-05-29 13:53:44 -070065 ErrorSink* mErrorSink;
66 int mSize;
Jack Palevichf0cbc922009-05-08 16:35:13 -070067
Jack Palevich21a15a22009-05-11 14:49:29 -070068 void release() {
69 if (pProgramBase != 0) {
70 free(pProgramBase);
71 pProgramBase = 0;
Jack Palevichae54f1f2009-05-08 14:54:15 -070072 }
Jack Palevich21a15a22009-05-11 14:49:29 -070073 }
74
Jack Palevichac0e95e2009-05-29 13:53:44 -070075 void check(int n) {
76 int newSize = ind - pProgramBase + n;
77 if (newSize > mSize) {
78 if (mErrorSink) {
79 mErrorSink->error("Code too large: %d bytes", newSize);
80 }
81 }
82 }
83
Jack Palevich21a15a22009-05-11 14:49:29 -070084 public:
85 CodeBuf() {
86 pProgramBase = 0;
87 ind = 0;
Jack Palevichac0e95e2009-05-29 13:53:44 -070088 mErrorSink = 0;
89 mSize = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -070090 }
91
92 ~CodeBuf() {
93 release();
94 }
95
96 void init(int size) {
97 release();
Jack Palevichac0e95e2009-05-29 13:53:44 -070098 mSize = size;
Jack Palevich21a15a22009-05-11 14:49:29 -070099 pProgramBase = (char*) calloc(1, size);
100 ind = pProgramBase;
101 }
102
Jack Palevichac0e95e2009-05-29 13:53:44 -0700103 void setErrorSink(ErrorSink* pErrorSink) {
104 mErrorSink = pErrorSink;
105 }
106
Jack Palevich546b2242009-05-13 15:10:04 -0700107 int o4(int n) {
Jack Palevichac0e95e2009-05-29 13:53:44 -0700108 check(4);
Jack Palevich8b0624c2009-05-20 12:12:06 -0700109 intptr_t result = (intptr_t) ind;
Jack Palevich546b2242009-05-13 15:10:04 -0700110 * (int*) ind = n;
111 ind += 4;
112 return result;
113 }
114
Jack Palevich21a15a22009-05-11 14:49:29 -0700115 /*
116 * Output a byte. Handles all values, 0..ff.
117 */
118 void ob(int n) {
Jack Palevichac0e95e2009-05-29 13:53:44 -0700119 check(1);
Jack Palevich21a15a22009-05-11 14:49:29 -0700120 *ind++ = n;
121 }
122
Jack Palevich21a15a22009-05-11 14:49:29 -0700123 inline void* getBase() {
124 return (void*) pProgramBase;
125 }
126
Jack Palevich8b0624c2009-05-20 12:12:06 -0700127 intptr_t getSize() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700128 return ind - pProgramBase;
129 }
130
Jack Palevich8b0624c2009-05-20 12:12:06 -0700131 intptr_t getPC() {
132 return (intptr_t) ind;
Jack Palevich21a15a22009-05-11 14:49:29 -0700133 }
134 };
135
Jack Palevich1cdef202009-05-22 12:06:27 -0700136 /**
137 * A code generator creates an in-memory program, generating the code on
138 * the fly. There is one code generator implementation for each supported
139 * architecture.
140 *
141 * The code generator implements the following abstract machine:
142 * R0 - the main accumulator.
143 * R1 - the secondary accumulator.
144 * FP - a frame pointer for accessing function arguments and local
145 * variables.
146 * SP - a stack pointer for storing intermediate results while evaluating
147 * expressions. The stack pointer grows downwards.
148 *
149 * The function calling convention is that all arguments are placed on the
150 * stack such that the first argument has the lowest address.
151 * After the call, the result is in R0. The caller is responsible for
152 * removing the arguments from the stack.
153 * The R0 and R1 registers are not saved across function calls. The
154 * FP and SP registers are saved.
155 */
156
Jack Palevich21a15a22009-05-11 14:49:29 -0700157 class CodeGenerator {
158 public:
Jack Palevichac0e95e2009-05-29 13:53:44 -0700159 CodeGenerator() {
160 mErrorSink = 0;
161 pCodeBuf = 0;
162 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700163 virtual ~CodeGenerator() {}
164
Jack Palevich22305132009-05-13 10:58:45 -0700165 virtual void init(CodeBuf* pCodeBuf) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700166 this->pCodeBuf = pCodeBuf;
Jack Palevichac0e95e2009-05-29 13:53:44 -0700167 pCodeBuf->setErrorSink(mErrorSink);
168 }
169
170 void setErrorSink(ErrorSink* pErrorSink) {
171 mErrorSink = pErrorSink;
172 if (pCodeBuf) {
173 pCodeBuf->setErrorSink(mErrorSink);
174 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700175 }
176
Jack Palevich1cdef202009-05-22 12:06:27 -0700177 /* Emit a function prolog.
178 * argCount is the number of arguments.
179 * Save the old value of the FP.
180 * Set the new value of the FP.
181 * Convert from the native platform calling convention to
182 * our stack-based calling convention. This may require
183 * pushing arguments from registers to the stack.
184 * Allocate "N" bytes of stack space. N isn't known yet, so
185 * just emit the instructions for adjusting the stack, and return
186 * the address to patch up. The patching will be done in
187 * functionExit().
188 * returns address to patch with local variable size.
Jack Palevich22305132009-05-13 10:58:45 -0700189 */
Jack Palevich546b2242009-05-13 15:10:04 -0700190 virtual int functionEntry(int argCount) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700191
Jack Palevich1cdef202009-05-22 12:06:27 -0700192 /* Emit a function epilog.
193 * Restore the old SP and FP register values.
194 * Return to the calling function.
195 * argCount - the number of arguments to the function.
196 * localVariableAddress - returned from functionEntry()
197 * localVariableSize - the size in bytes of the local variables.
198 */
199 virtual void functionExit(int argCount, int localVariableAddress,
200 int localVariableSize) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700201
Jack Palevich1cdef202009-05-22 12:06:27 -0700202 /* load immediate value to R0 */
Jack Palevich546b2242009-05-13 15:10:04 -0700203 virtual void li(int t) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700204
Jack Palevich1cdef202009-05-22 12:06:27 -0700205 /* Jump to a target, and return the address of the word that
206 * holds the target data, in case it needs to be fixed up later.
207 */
Jack Palevich22305132009-05-13 10:58:45 -0700208 virtual int gjmp(int t) = 0;
209
Jack Palevich1cdef202009-05-22 12:06:27 -0700210 /* Test R0 and jump to a target if the test succeeds.
211 * l = 0: je, l == 1: jne
212 * Return the address of the word that holds the targed data, in
213 * case it needs to be fixed up later.
214 */
Jack Palevich22305132009-05-13 10:58:45 -0700215 virtual int gtst(bool l, int t) = 0;
216
Jack Palevich1cdef202009-05-22 12:06:27 -0700217 /* Compare R1 against R0, and store the boolean result in R0.
218 * op specifies the comparison.
219 */
Jack Palevich22305132009-05-13 10:58:45 -0700220 virtual void gcmp(int op) = 0;
221
Jack Palevich1cdef202009-05-22 12:06:27 -0700222 /* Perform the arithmetic op specified by op. R1 is the
223 * left argument, R0 is the right argument.
224 */
Jack Palevich546b2242009-05-13 15:10:04 -0700225 virtual void genOp(int op) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700226
Jack Palevich1cdef202009-05-22 12:06:27 -0700227 /* Set R1 to 0.
228 */
229 virtual void clearR1() = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700230
Jack Palevich1cdef202009-05-22 12:06:27 -0700231 /* Push R0 onto the stack.
232 */
233 virtual void pushR0() = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700234
Jack Palevich1cdef202009-05-22 12:06:27 -0700235 /* Pop R1 off of the stack.
236 */
237 virtual void popR1() = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700238
Jack Palevich1cdef202009-05-22 12:06:27 -0700239 /* Store R0 to the address stored in R1.
240 * isInt is true if a whole 4-byte integer value
241 * should be stored, otherwise a 1-byte character
242 * value should be stored.
243 */
244 virtual void storeR0ToR1(bool isInt) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700245
Jack Palevich1cdef202009-05-22 12:06:27 -0700246 /* Load R0 from the address stored in R0.
247 * isInt is true if a whole 4-byte integer value
248 * should be loaded, otherwise a 1-byte character
249 * value should be loaded.
250 */
251 virtual void loadR0FromR0(bool isInt) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700252
Jack Palevich1cdef202009-05-22 12:06:27 -0700253 /* Load the absolute address of a variable to R0.
254 * If ea <= LOCAL, then this is a local variable, or an
255 * argument, addressed relative to FP.
256 * else it is an absolute global address.
257 */
258 virtual void leaR0(int ea) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700259
Jack Palevich1cdef202009-05-22 12:06:27 -0700260 /* Store R0 to a variable.
261 * If ea <= LOCAL, then this is a local variable, or an
262 * argument, addressed relative to FP.
263 * else it is an absolute global address.
264 */
265 virtual void storeR0(int ea) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700266
Jack Palevich1cdef202009-05-22 12:06:27 -0700267 /* load R0 from a variable.
268 * If ea <= LOCAL, then this is a local variable, or an
269 * argument, addressed relative to FP.
270 * else it is an absolute global address.
271 * If isIncDec is true, then the stored variable's value
272 * should be post-incremented or post-decremented, based
273 * on the value of op.
274 */
275 virtual void loadR0(int ea, bool isIncDec, int op) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700276
Jack Palevich1cdef202009-05-22 12:06:27 -0700277 /* Emit code to adjust the stack for a function call. Return the
278 * label for the address of the instruction that adjusts the
279 * stack size. This will be passed as argument "a" to
280 * endFunctionCallArguments.
281 */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700282 virtual int beginFunctionCallArguments() = 0;
283
Jack Palevich1cdef202009-05-22 12:06:27 -0700284 /* Emit code to store R0 to the stack at byte offset l.
285 */
286 virtual void storeR0ToArg(int l) = 0;
Jack Palevich7810bc92009-05-15 14:31:47 -0700287
Jack Palevich1cdef202009-05-22 12:06:27 -0700288 /* Patch the function call preamble.
289 * a is the address returned from beginFunctionCallArguments
290 * l is the number of bytes the arguments took on the stack.
291 * Typically you would also emit code to convert the argument
292 * list into whatever the native function calling convention is.
293 * On ARM for example you would pop the first 5 arguments into
294 * R0..R4
295 */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700296 virtual void endFunctionCallArguments(int a, int l) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700297
Jack Palevich1cdef202009-05-22 12:06:27 -0700298 /* Emit a call to an unknown function. The argument "symbol" needs to
299 * be stored in the location where the address should go. It forms
300 * a chain. The address will be patched later.
301 * Return the address of the word that has to be patched.
302 */
Jack Palevich22305132009-05-13 10:58:45 -0700303 virtual int callForward(int symbol) = 0;
304
Jack Palevich1cdef202009-05-22 12:06:27 -0700305 /* Call a function using PC-relative addressing. t is the PC-relative
306 * address of the function. It has already been adjusted for the
307 * architectural jump offset, so just store it as-is.
308 */
Jack Palevich22305132009-05-13 10:58:45 -0700309 virtual void callRelative(int t) = 0;
310
Jack Palevich1cdef202009-05-22 12:06:27 -0700311 /* Call a function pointer. L is the number of bytes the arguments
312 * take on the stack. The address of the function is stored at
313 * location SP + l.
314 */
Jack Palevich22305132009-05-13 10:58:45 -0700315 virtual void callIndirect(int l) = 0;
316
Jack Palevich1cdef202009-05-22 12:06:27 -0700317 /* Adjust SP after returning from a function call. l is the
318 * number of bytes of arguments stored on the stack. isIndirect
319 * is true if this was an indirect call. (In which case the
320 * address of the function is stored at location SP + l.)
321 */
Jack Palevich7810bc92009-05-15 14:31:47 -0700322 virtual void adjustStackAfterCall(int l, bool isIndirect) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700323
Jack Palevich1cdef202009-05-22 12:06:27 -0700324 /* Print a disassembly of the assembled code to out. Return
325 * non-zero if there is an error.
326 */
Jack Palevicha6535612009-05-13 16:24:17 -0700327 virtual int disassemble(FILE* out) = 0;
328
Jack Palevich1cdef202009-05-22 12:06:27 -0700329 /* Generate a symbol at the current PC. t is the head of a
330 * linked list of addresses to patch.
331 */
Jack Paleviche7b59062009-05-19 17:12:17 -0700332 virtual void gsym(int t) = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -0700333
Jack Palevich1cdef202009-05-22 12:06:27 -0700334 /*
335 * Do any cleanup work required at the end of a compile.
336 * For example, an instruction cache might need to be
337 * invalidated.
338 * Return non-zero if there is an error.
339 */
340 virtual int finishCompile() = 0;
Jack Palevich546b2242009-05-13 15:10:04 -0700341
Jack Palevicha6535612009-05-13 16:24:17 -0700342 /**
343 * Adjust relative branches by this amount.
344 */
345 virtual int jumpOffset() = 0;
346
Jack Palevich21a15a22009-05-11 14:49:29 -0700347 protected:
Jack Palevich21a15a22009-05-11 14:49:29 -0700348 /*
349 * Output a byte. Handles all values, 0..ff.
350 */
351 void ob(int n) {
352 pCodeBuf->ob(n);
353 }
354
Jack Palevich8b0624c2009-05-20 12:12:06 -0700355 intptr_t o4(int data) {
Jack Paleviche7b59062009-05-19 17:12:17 -0700356 return pCodeBuf->o4(data);
Jack Palevich21a15a22009-05-11 14:49:29 -0700357 }
358
Jack Palevich8b0624c2009-05-20 12:12:06 -0700359 intptr_t getBase() {
360 return (intptr_t) pCodeBuf->getBase();
Jack Palevicha6535612009-05-13 16:24:17 -0700361 }
362
Jack Palevich8b0624c2009-05-20 12:12:06 -0700363 intptr_t getPC() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700364 return pCodeBuf->getPC();
365 }
Jack Palevich1cdef202009-05-22 12:06:27 -0700366
367 intptr_t getSize() {
368 return pCodeBuf->getSize();
369 }
Jack Palevichac0e95e2009-05-29 13:53:44 -0700370
371 void error(const char* fmt,...) {
372 va_list ap;
373 va_start(ap, fmt);
374 mErrorSink->verror(fmt, ap);
375 va_end(ap);
376 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700377 private:
378 CodeBuf* pCodeBuf;
Jack Palevichac0e95e2009-05-29 13:53:44 -0700379 ErrorSink* mErrorSink;
Jack Palevich21a15a22009-05-11 14:49:29 -0700380 };
381
Jack Paleviche7b59062009-05-19 17:12:17 -0700382#ifdef PROVIDE_ARM_CODEGEN
383
Jack Palevich22305132009-05-13 10:58:45 -0700384 class ARMCodeGenerator : public CodeGenerator {
385 public:
386 ARMCodeGenerator() {}
387 virtual ~ARMCodeGenerator() {}
388
389 /* returns address to patch with local variable size
390 */
Jack Palevich546b2242009-05-13 15:10:04 -0700391 virtual int functionEntry(int argCount) {
Jack Palevichb7c81e92009-06-04 19:56:13 -0700392 LOG_API("functionEntry(%d);\n", argCount);
Jack Palevich69796b62009-05-14 15:42:26 -0700393 // sp -> arg4 arg5 ...
394 // Push our register-based arguments back on the stack
395 if (argCount > 0) {
396 int regArgCount = argCount <= 4 ? argCount : 4;
397 o4(0xE92D0000 | ((1 << argCount) - 1)); // stmfd sp!, {}
398 }
399 // sp -> arg0 arg1 ...
400 o4(0xE92D4800); // stmfd sp!, {fp, lr}
401 // sp, fp -> oldfp, retadr, arg0 arg1 ....
402 o4(0xE1A0B00D); // mov fp, sp
403 return o4(0xE24DD000); // sub sp, sp, # <local variables>
Jack Palevich22305132009-05-13 10:58:45 -0700404 }
405
Jack Palevich546b2242009-05-13 15:10:04 -0700406 virtual void functionExit(int argCount, int localVariableAddress, int localVariableSize) {
Jack Palevich09555c72009-05-27 12:25:55 -0700407 LOG_API("functionExit(%d, %d, %d);\n", argCount, localVariableAddress, localVariableSize);
Jack Palevich69796b62009-05-14 15:42:26 -0700408 // Patch local variable allocation code:
409 if (localVariableSize < 0 || localVariableSize > 255) {
Jack Palevich8de461d2009-05-14 17:21:45 -0700410 error("localVariables out of range: %d", localVariableSize);
Jack Palevich546b2242009-05-13 15:10:04 -0700411 }
Jack Palevich69796b62009-05-14 15:42:26 -0700412 *(char*) (localVariableAddress) = localVariableSize;
413
414 // sp -> locals .... fp -> oldfp, retadr, arg0, arg1, ...
415 o4(0xE1A0E00B); // mov lr, fp
416 o4(0xE59BB000); // ldr fp, [fp]
417 o4(0xE28ED004); // add sp, lr, #4
418 // sp -> retadr, arg0, ...
419 o4(0xE8BD4000); // ldmfd sp!, {lr}
420 // sp -> arg0 ....
421 if (argCount > 0) {
422 // We store the PC into the lr so we can adjust the sp before
Jack Palevich8de461d2009-05-14 17:21:45 -0700423 // returning. We need to pull off the registers we pushed
Jack Palevich69796b62009-05-14 15:42:26 -0700424 // earlier. We don't need to actually store them anywhere,
425 // just adjust the stack.
426 int regArgCount = argCount <= 4 ? argCount : 4;
427 o4(0xE28DD000 | (regArgCount << 2)); // add sp, sp, #argCount << 2
428 }
429 o4(0xE12FFF1E); // bx lr
Jack Palevich22305132009-05-13 10:58:45 -0700430 }
431
432 /* load immediate value */
Jack Palevich546b2242009-05-13 15:10:04 -0700433 virtual void li(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700434 LOG_API("li(%d);\n", t);
Jack Palevicha6535612009-05-13 16:24:17 -0700435 if (t >= 0 && t < 255) {
Jack Palevich69796b62009-05-14 15:42:26 -0700436 o4(0xE3A00000 + t); // mov r0, #0
Jack Palevicha6535612009-05-13 16:24:17 -0700437 } else if (t >= -256 && t < 0) {
438 // mvn means move constant ^ ~0
Jack Palevich69796b62009-05-14 15:42:26 -0700439 o4(0xE3E00001 - t); // mvn r0, #0
Jack Palevicha6535612009-05-13 16:24:17 -0700440 } else {
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700441 o4(0xE51F0000); // ldr r0, .L3
442 o4(0xEA000000); // b .L99
443 o4(t); // .L3: .word 0
444 // .L99:
Jack Palevicha6535612009-05-13 16:24:17 -0700445 }
Jack Palevich22305132009-05-13 10:58:45 -0700446 }
447
448 virtual int gjmp(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700449 LOG_API("gjmp(%d);\n", t);
Jack Palevich8de461d2009-05-14 17:21:45 -0700450 return o4(0xEA000000 | encodeAddress(t)); // b .L33
Jack Palevich22305132009-05-13 10:58:45 -0700451 }
452
453 /* l = 0: je, l == 1: jne */
454 virtual int gtst(bool l, int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700455 LOG_API("gtst(%d, %d);\n", l, t);
Jack Palevich8de461d2009-05-14 17:21:45 -0700456 o4(0xE3500000); // cmp r0,#0
457 int branch = l ? 0x1A000000 : 0x0A000000; // bne : beq
458 return o4(branch | encodeAddress(t));
Jack Palevich22305132009-05-13 10:58:45 -0700459 }
460
461 virtual void gcmp(int op) {
Jack Palevich09555c72009-05-27 12:25:55 -0700462 LOG_API("gcmp(%d);\n", op);
Jack Palevich8de461d2009-05-14 17:21:45 -0700463 o4(0xE1510000); // cmp r1, r1
464 switch(op) {
465 case OP_EQUALS:
466 o4(0x03A00001); // moveq r0,#1
467 o4(0x13A00000); // movne r0,#0
468 break;
469 case OP_NOT_EQUALS:
470 o4(0x03A00000); // moveq r0,#0
471 o4(0x13A00001); // movne r0,#1
472 break;
473 case OP_LESS_EQUAL:
474 o4(0xD3A00001); // movle r0,#1
475 o4(0xC3A00000); // movgt r0,#0
476 break;
477 case OP_GREATER:
478 o4(0xD3A00000); // movle r0,#0
479 o4(0xC3A00001); // movgt r0,#1
480 break;
481 case OP_GREATER_EQUAL:
482 o4(0xA3A00001); // movge r0,#1
483 o4(0xB3A00000); // movlt r0,#0
484 break;
485 case OP_LESS:
486 o4(0xA3A00000); // movge r0,#0
487 o4(0xB3A00001); // movlt r0,#1
488 break;
489 default:
490 error("Unknown comparison op %d", op);
491 break;
492 }
Jack Palevich22305132009-05-13 10:58:45 -0700493 }
494
Jack Palevich546b2242009-05-13 15:10:04 -0700495 virtual void genOp(int op) {
Jack Palevich09555c72009-05-27 12:25:55 -0700496 LOG_API("genOp(%d);\n", op);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700497 switch(op) {
498 case OP_MUL:
499 o4(0x0E0000091); // mul r0,r1,r0
500 break;
Jack Palevich3d474a72009-05-15 15:12:38 -0700501 case OP_DIV:
502 callRuntime(runtime_DIV);
503 break;
504 case OP_MOD:
505 callRuntime(runtime_MOD);
506 break;
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700507 case OP_PLUS:
508 o4(0xE0810000); // add r0,r1,r0
509 break;
510 case OP_MINUS:
511 o4(0xE0410000); // sub r0,r1,r0
512 break;
513 case OP_SHIFT_LEFT:
514 o4(0xE1A00011); // lsl r0,r1,r0
515 break;
516 case OP_SHIFT_RIGHT:
517 o4(0xE1A00051); // asr r0,r1,r0
518 break;
519 case OP_BIT_AND:
520 o4(0xE0010000); // and r0,r1,r0
521 break;
522 case OP_BIT_XOR:
523 o4(0xE0210000); // eor r0,r1,r0
524 break;
525 case OP_BIT_OR:
526 o4(0xE1810000); // orr r0,r1,r0
527 break;
528 case OP_BIT_NOT:
529 o4(0xE1E00000); // mvn r0, r0
530 break;
531 default:
Jack Palevich69796b62009-05-14 15:42:26 -0700532 error("Unimplemented op %d\n", op);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700533 break;
534 }
Jack Palevich22305132009-05-13 10:58:45 -0700535#if 0
536 o(decodeOp(op));
537 if (op == OP_MOD)
538 o(0x92); /* xchg %edx, %eax */
539#endif
540 }
541
Jack Palevich1cdef202009-05-22 12:06:27 -0700542 virtual void clearR1() {
Jack Palevich09555c72009-05-27 12:25:55 -0700543 LOG_API("clearR1();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700544 o4(0xE3A01000); // mov r1, #0
Jack Palevich22305132009-05-13 10:58:45 -0700545 }
546
Jack Palevich1cdef202009-05-22 12:06:27 -0700547 virtual void pushR0() {
Jack Palevich09555c72009-05-27 12:25:55 -0700548 LOG_API("pushR0();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700549 o4(0xE92D0001); // stmfd sp!,{r0}
Jack Palevich22305132009-05-13 10:58:45 -0700550 }
551
Jack Palevich1cdef202009-05-22 12:06:27 -0700552 virtual void popR1() {
Jack Palevich09555c72009-05-27 12:25:55 -0700553 LOG_API("popR1();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700554 o4(0xE8BD0002); // ldmfd sp!,{r1}
Jack Palevich22305132009-05-13 10:58:45 -0700555 }
556
Jack Palevich1cdef202009-05-22 12:06:27 -0700557 virtual void storeR0ToR1(bool isInt) {
Jack Palevich09555c72009-05-27 12:25:55 -0700558 LOG_API("storeR0ToR1(%d);\n", isInt);
Jack Palevichbd894902009-05-14 19:35:31 -0700559 if (isInt) {
560 o4(0xE5810000); // str r0, [r1]
561 } else {
562 o4(0xE5C10000); // strb r0, [r1]
563 }
Jack Palevich22305132009-05-13 10:58:45 -0700564 }
565
Jack Palevich1cdef202009-05-22 12:06:27 -0700566 virtual void loadR0FromR0(bool isInt) {
Jack Palevich09555c72009-05-27 12:25:55 -0700567 LOG_API("loadR0FromR0(%d);\n", isInt);
Jack Palevich22305132009-05-13 10:58:45 -0700568 if (isInt)
Jack Palevich69796b62009-05-14 15:42:26 -0700569 o4(0xE5900000); // ldr r0, [r0]
Jack Palevich22305132009-05-13 10:58:45 -0700570 else
Jack Palevich69796b62009-05-14 15:42:26 -0700571 o4(0xE5D00000); // ldrb r0, [r0]
Jack Palevich22305132009-05-13 10:58:45 -0700572 }
573
Jack Palevich1cdef202009-05-22 12:06:27 -0700574 virtual void leaR0(int ea) {
Jack Palevich09555c72009-05-27 12:25:55 -0700575 LOG_API("leaR0(%d);\n", ea);
Jack Palevich4d93f302009-05-15 13:30:00 -0700576 if (ea < LOCAL) {
577 // Local, fp relative
578 if (ea < -1023 || ea > 1023 || ((ea & 3) != 0)) {
579 error("Offset out of range: %08x", ea);
580 }
581 if (ea < 0) {
582 o4(0xE24B0F00 | (0xff & ((-ea) >> 2))); // sub r0, fp, #ea
583 } else {
584 o4(0xE28B0F00 | (0xff & (ea >> 2))); // add r0, fp, #ea
585 }
Jack Palevichbd894902009-05-14 19:35:31 -0700586 } else {
Jack Palevich4d93f302009-05-15 13:30:00 -0700587 // Global, absolute.
588 o4(0xE59F0000); // ldr r0, .L1
589 o4(0xEA000000); // b .L99
590 o4(ea); // .L1: .word 0
591 // .L99:
Jack Palevichbd894902009-05-14 19:35:31 -0700592 }
Jack Palevich22305132009-05-13 10:58:45 -0700593 }
594
Jack Palevich1cdef202009-05-22 12:06:27 -0700595 virtual void storeR0(int ea) {
Jack Palevich09555c72009-05-27 12:25:55 -0700596 LOG_API("storeR0(%d);\n", ea);
Jack Palevich4d93f302009-05-15 13:30:00 -0700597 if (ea < LOCAL) {
598 // Local, fp relative
599 if (ea < -4095 || ea > 4095) {
600 error("Offset out of range: %08x", ea);
601 }
602 if (ea < 0) {
603 o4(0xE50B0000 | (0xfff & (-ea))); // str r0, [fp,#-ea]
604 } else {
605 o4(0xE58B0000 | (0xfff & ea)); // str r0, [fp,#ea]
606 }
607 } else{
608 // Global, absolute
609 o4(0xE59F1000); // ldr r1, .L1
610 o4(0xEA000000); // b .L99
611 o4(ea); // .L1: .word 0
612 o4(0xE5810000); // .L99: str r0, [r1]
Jack Palevich69796b62009-05-14 15:42:26 -0700613 }
Jack Palevich22305132009-05-13 10:58:45 -0700614 }
615
Jack Palevich1cdef202009-05-22 12:06:27 -0700616 virtual void loadR0(int ea, bool isIncDec, int op) {
Jack Palevich09555c72009-05-27 12:25:55 -0700617 LOG_API("loadR0(%d, %d, %d);\n", ea, isIncDec, op);
Jack Palevich4d93f302009-05-15 13:30:00 -0700618 if (ea < LOCAL) {
619 // Local, fp relative
620 if (ea < -4095 || ea > 4095) {
621 error("Offset out of range: %08x", ea);
622 }
623 if (ea < 0) {
624 o4(0xE51B0000 | (0xfff & (-ea))); // ldr r0, [fp,#-ea]
625 } else {
626 o4(0xE59B0000 | (0xfff & ea)); // ldr r0, [fp,#ea]
627 }
Jack Palevich69796b62009-05-14 15:42:26 -0700628 } else {
Jack Palevich4d93f302009-05-15 13:30:00 -0700629 // Global, absolute
630 o4(0xE59F2000); // ldr r2, .L1
631 o4(0xEA000000); // b .L99
632 o4(ea); // .L1: .word ea
633 o4(0xE5920000); // .L99: ldr r0, [r2]
Jack Palevich69796b62009-05-14 15:42:26 -0700634 }
Jack Palevich22305132009-05-13 10:58:45 -0700635
Jack Palevich4d93f302009-05-15 13:30:00 -0700636 if (isIncDec) {
637 switch (op) {
638 case OP_INCREMENT:
639 o4(0xE2801001); // add r1, r0, #1
640 break;
641 case OP_DECREMENT:
642 o4(0xE2401001); // sub r1, r0, #1
643 break;
644 default:
645 error("unknown opcode: %d", op);
646 }
647 if (ea < LOCAL) {
648 // Local, fp relative
649 // Don't need range check, was already checked above
650 if (ea < 0) {
651 o4(0xE50B1000 | (0xfff & (-ea))); // str r1, [fp,#-ea]
652 } else {
653 o4(0xE58B1000 | (0xfff & ea)); // str r1, [fp,#ea]
654 }
655 } else{
656 // Global, absolute
657 // r2 is already set up from before.
658 o4(0xE5821000); // str r1, [r2]
659 }
Jack Palevichbd894902009-05-14 19:35:31 -0700660 }
Jack Palevich22305132009-05-13 10:58:45 -0700661 }
662
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700663 virtual int beginFunctionCallArguments() {
Jack Palevich09555c72009-05-27 12:25:55 -0700664 LOG_API("beginFunctionCallArguments();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700665 return o4(0xE24DDF00); // Placeholder
666 }
667
Jack Palevich1cdef202009-05-22 12:06:27 -0700668 virtual void storeR0ToArg(int l) {
Jack Palevich09555c72009-05-27 12:25:55 -0700669 LOG_API("storeR0ToArg(%d);\n", l);
Jack Palevich7810bc92009-05-15 14:31:47 -0700670 if (l < 0 || l > 4096-4) {
671 error("l out of range for stack offset: 0x%08x", l);
672 }
673 o4(0xE58D0000 + l); // str r0, [sp, #4]
674 }
675
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700676 virtual void endFunctionCallArguments(int a, int l) {
Jack Palevich09555c72009-05-27 12:25:55 -0700677 LOG_API("endFunctionCallArguments(0x%08x, %d);\n", a, l);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700678 if (l < 0 || l > 0x3FC) {
679 error("L out of range for stack adjustment: 0x%08x", l);
680 }
681 * (int*) a = 0xE24DDF00 | (l >> 2); // sub sp, sp, #0 << 2
682 int argCount = l >> 2;
683 if (argCount > 0) {
684 int regArgCount = argCount > 4 ? 4 : argCount;
685 o4(0xE8BD0000 | ((1 << regArgCount) - 1)); // ldmfd sp!,{}
686 }
Jack Palevich22305132009-05-13 10:58:45 -0700687 }
688
Jack Palevich22305132009-05-13 10:58:45 -0700689 virtual int callForward(int symbol) {
Jack Palevich09555c72009-05-27 12:25:55 -0700690 LOG_API("callForward(%d);\n", symbol);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700691 // Forward calls are always short (local)
692 return o4(0xEB000000 | encodeAddress(symbol));
Jack Palevich22305132009-05-13 10:58:45 -0700693 }
694
695 virtual void callRelative(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700696 LOG_API("callRelative(%d);\n", t);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700697 int abs = t + getPC() + jumpOffset();
Jack Palevichac0e95e2009-05-29 13:53:44 -0700698 LOG_API("abs=%d (0x%08x)\n", abs, abs);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700699 if (t >= - (1 << 25) && t < (1 << 25)) {
700 o4(0xEB000000 | encodeAddress(t));
701 } else {
702 // Long call.
703 o4(0xE59FC000); // ldr r12, .L1
704 o4(0xEA000000); // b .L99
Jack Palevichbd894902009-05-14 19:35:31 -0700705 o4(t - 12); // .L1: .word 0
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700706 o4(0xE08CC00F); // .L99: add r12,pc
707 o4(0xE12FFF3C); // blx r12
708 }
Jack Palevich22305132009-05-13 10:58:45 -0700709 }
710
711 virtual void callIndirect(int l) {
Jack Palevich09555c72009-05-27 12:25:55 -0700712 LOG_API("callIndirect(%d);\n", l);
Jack Palevich7810bc92009-05-15 14:31:47 -0700713 int argCount = l >> 2;
714 int poppedArgs = argCount > 4 ? 4 : argCount;
715 int adjustedL = l - (poppedArgs << 2);
716 if (adjustedL < 0 || adjustedL > 4096-4) {
717 error("l out of range for stack offset: 0x%08x", l);
718 }
719 o4(0xE59DC000 | (0xfff & adjustedL)); // ldr r12, [sp,#adjustedL]
720 o4(0xE12FFF3C); // blx r12
Jack Palevich22305132009-05-13 10:58:45 -0700721 }
722
Jack Palevich7810bc92009-05-15 14:31:47 -0700723 virtual void adjustStackAfterCall(int l, bool isIndirect) {
Jack Palevich09555c72009-05-27 12:25:55 -0700724 LOG_API("adjustStackAfterCall(%d, %d);\n", l, isIndirect);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700725 int argCount = l >> 2;
Jack Palevich7810bc92009-05-15 14:31:47 -0700726 int stackArgs = argCount > 4 ? argCount - 4 : 0;
727 int stackUse = stackArgs + (isIndirect ? 1 : 0);
728 if (stackUse) {
729 if (stackUse < 0 || stackUse > 255) {
730 error("L out of range for stack adjustment: 0x%08x", l);
731 }
732 o4(0xE28DDF00 | stackUse); // add sp, sp, #stackUse << 2
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700733 }
Jack Palevich22305132009-05-13 10:58:45 -0700734 }
735
Jack Palevicha6535612009-05-13 16:24:17 -0700736 virtual int jumpOffset() {
Jack Palevichbd894902009-05-14 19:35:31 -0700737 return 8;
Jack Palevicha6535612009-05-13 16:24:17 -0700738 }
739
740 /* output a symbol and patch all calls to it */
741 virtual void gsym(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700742 LOG_API("gsym(0x%x)\n", t);
Jack Palevicha6535612009-05-13 16:24:17 -0700743 int n;
744 int base = getBase();
745 int pc = getPC();
Jack Palevich09555c72009-05-27 12:25:55 -0700746 LOG_API("pc = 0x%x\n", pc);
Jack Palevicha6535612009-05-13 16:24:17 -0700747 while (t) {
748 int data = * (int*) t;
749 int decodedOffset = ((BRANCH_REL_ADDRESS_MASK & data) << 2);
750 if (decodedOffset == 0) {
751 n = 0;
752 } else {
753 n = base + decodedOffset; /* next value */
754 }
755 *(int *) t = (data & ~BRANCH_REL_ADDRESS_MASK)
756 | encodeRelAddress(pc - t - 8);
757 t = n;
758 }
759 }
760
Jack Palevich1cdef202009-05-22 12:06:27 -0700761 virtual int finishCompile() {
762#if defined(__arm__)
763 const long base = long(getBase());
764 const long curr = long(getPC());
765 int err = cacheflush(base, curr, 0);
766 return err;
767#else
768 return 0;
769#endif
770 }
771
Jack Palevicha6535612009-05-13 16:24:17 -0700772 virtual int disassemble(FILE* out) {
Jack Palevich09555c72009-05-27 12:25:55 -0700773#ifdef ENABLE_ARM_DISASSEMBLY
774 disasmOut = out;
Jack Palevicha6535612009-05-13 16:24:17 -0700775 disasm_interface_t di;
776 di.di_readword = disassemble_readword;
777 di.di_printaddr = disassemble_printaddr;
778 di.di_printf = disassemble_printf;
779
780 int base = getBase();
781 int pc = getPC();
782 for(int i = base; i < pc; i += 4) {
783 fprintf(out, "%08x: %08x ", i, *(int*) i);
784 ::disasm(&di, i, 0);
785 }
Jack Palevich09555c72009-05-27 12:25:55 -0700786#endif
Jack Palevicha6535612009-05-13 16:24:17 -0700787 return 0;
788 }
Jack Palevich7810bc92009-05-15 14:31:47 -0700789
Jack Palevich22305132009-05-13 10:58:45 -0700790 private:
Jack Palevicha6535612009-05-13 16:24:17 -0700791 static FILE* disasmOut;
792
/** Disassembler callback: return the word stored at the given address. */
static u_int
disassemble_readword(u_int address)
{
    const u_int* pWord = (const u_int*) address;
    return *pWord;
}
798
799 static void
800 disassemble_printaddr(u_int address)
801 {
802 fprintf(disasmOut, "0x%08x", address);
803 }
804
805 static void
806 disassemble_printf(const char *fmt, ...) {
807 va_list ap;
808 va_start(ap, fmt);
809 vfprintf(disasmOut, fmt, ap);
810 va_end(ap);
811 }
812
813 static const int BRANCH_REL_ADDRESS_MASK = 0x00ffffff;
814
815 /** Encode a relative address that might also be
816 * a label.
817 */
818 int encodeAddress(int value) {
819 int base = getBase();
820 if (value >= base && value <= getPC() ) {
821 // This is a label, encode it relative to the base.
822 value = value - base;
823 }
824 return encodeRelAddress(value);
825 }
826
827 int encodeRelAddress(int value) {
828 return BRANCH_REL_ADDRESS_MASK & (value >> 2);
829 }
Jack Palevich22305132009-05-13 10:58:45 -0700830
Jack Palevich3d474a72009-05-15 15:12:38 -0700831 typedef int (*int2FnPtr)(int a, int b);
832 void callRuntime(int2FnPtr fn) {
833 o4(0xE59F2000); // ldr r2, .L1
834 o4(0xEA000000); // b .L99
835 o4((int) fn); //.L1: .word fn
836 o4(0xE12FFF32); //.L99: blx r2
837 }
838
/** Runtime helper for division: returns b divided by a (operands swapped). */
static int runtime_DIV(int a, int b) {
    const int quotient = b / a;
    return quotient;
}
842
/** Runtime helper for modulo: returns b modulo a (operands swapped). */
static int runtime_MOD(int a, int b) {
    const int remainder = b % a;
    return remainder;
}
Jack Palevich22305132009-05-13 10:58:45 -0700846 };
847
Jack Palevich09555c72009-05-27 12:25:55 -0700848#endif // PROVIDE_ARM_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -0700849
850#ifdef PROVIDE_X86_CODEGEN
851
Jack Palevich21a15a22009-05-11 14:49:29 -0700852 class X86CodeGenerator : public CodeGenerator {
853 public:
854 X86CodeGenerator() {}
855 virtual ~X86CodeGenerator() {}
856
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700857 /* returns address to patch with local variable size
858 */
Jack Palevich546b2242009-05-13 15:10:04 -0700859 virtual int functionEntry(int argCount) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700860 o(0xe58955); /* push %ebp, mov %esp, %ebp */
861 return oad(0xec81, 0); /* sub $xxx, %esp */
862 }
863
Jack Palevich546b2242009-05-13 15:10:04 -0700864 virtual void functionExit(int argCount, int localVariableAddress, int localVariableSize) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700865 o(0xc3c9); /* leave, ret */
Jack Palevich546b2242009-05-13 15:10:04 -0700866 *(int *) localVariableAddress = localVariableSize; /* save local variables */
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700867 }
868
Jack Palevich21a15a22009-05-11 14:49:29 -0700869 /* load immediate value */
Jack Palevich546b2242009-05-13 15:10:04 -0700870 virtual void li(int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700871 oad(0xb8, t); /* mov $xx, %eax */
872 }
873
Jack Palevich22305132009-05-13 10:58:45 -0700874 virtual int gjmp(int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700875 return psym(0xe9, t);
876 }
877
878 /* l = 0: je, l == 1: jne */
Jack Palevich22305132009-05-13 10:58:45 -0700879 virtual int gtst(bool l, int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700880 o(0x0fc085); /* test %eax, %eax, je/jne xxx */
881 return psym(0x84 + l, t);
882 }
883
Jack Palevich22305132009-05-13 10:58:45 -0700884 virtual void gcmp(int op) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700885 int t = decodeOp(op);
Jack Palevich21a15a22009-05-11 14:49:29 -0700886 o(0xc139); /* cmp %eax,%ecx */
887 li(0);
888 o(0x0f); /* setxx %al */
889 o(t + 0x90);
890 o(0xc0);
891 }
892
Jack Palevich546b2242009-05-13 15:10:04 -0700893 virtual void genOp(int op) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700894 o(decodeOp(op));
895 if (op == OP_MOD)
896 o(0x92); /* xchg %edx, %eax */
897 }
898
Jack Palevich1cdef202009-05-22 12:06:27 -0700899 virtual void clearR1() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700900 oad(0xb9, 0); /* movl $0, %ecx */
901 }
902
Jack Palevich1cdef202009-05-22 12:06:27 -0700903 virtual void pushR0() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700904 o(0x50); /* push %eax */
905 }
906
Jack Palevich1cdef202009-05-22 12:06:27 -0700907 virtual void popR1() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700908 o(0x59); /* pop %ecx */
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700909 }
910
Jack Palevich1cdef202009-05-22 12:06:27 -0700911 virtual void storeR0ToR1(bool isInt) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700912 o(0x0188 + isInt); /* movl %eax/%al, (%ecx) */
913 }
914
Jack Palevich1cdef202009-05-22 12:06:27 -0700915 virtual void loadR0FromR0(bool isInt) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700916 if (isInt)
917 o(0x8b); /* mov (%eax), %eax */
918 else
919 o(0xbe0f); /* movsbl (%eax), %eax */
920 ob(0); /* add zero in code */
921 }
922
Jack Palevich1cdef202009-05-22 12:06:27 -0700923 virtual void leaR0(int ea) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700924 gmov(10, ea); /* leal EA, %eax */
925 }
926
Jack Palevich1cdef202009-05-22 12:06:27 -0700927 virtual void storeR0(int ea) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700928 gmov(6, ea); /* mov %eax, EA */
929 }
930
Jack Palevich1cdef202009-05-22 12:06:27 -0700931 virtual void loadR0(int ea, bool isIncDec, int op) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700932 gmov(8, ea); /* mov EA, %eax */
Jack Palevich4d93f302009-05-15 13:30:00 -0700933 if (isIncDec) {
934 /* Implement post-increment or post decrement.
935 */
936 gmov(0, ea); /* 83 ADD */
937 o(decodeOp(op));
938 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700939 }
940
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700941 virtual int beginFunctionCallArguments() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700942 return oad(0xec81, 0); /* sub $xxx, %esp */
943 }
944
Jack Palevich1cdef202009-05-22 12:06:27 -0700945 virtual void storeR0ToArg(int l) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700946 oad(0x248489, l); /* movl %eax, xxx(%esp) */
947 }
948
Jack Palevich7810bc92009-05-15 14:31:47 -0700949 virtual void endFunctionCallArguments(int a, int l) {
950 * (int*) a = l;
951 }
952
Jack Palevich22305132009-05-13 10:58:45 -0700953 virtual int callForward(int symbol) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700954 return psym(0xe8, symbol); /* call xxx */
955 }
956
Jack Palevich22305132009-05-13 10:58:45 -0700957 virtual void callRelative(int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700958 psym(0xe8, t); /* call xxx */
959 }
960
Jack Palevich22305132009-05-13 10:58:45 -0700961 virtual void callIndirect(int l) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700962 oad(0x2494ff, l); /* call *xxx(%esp) */
963 }
964
Jack Palevich7810bc92009-05-15 14:31:47 -0700965 virtual void adjustStackAfterCall(int l, bool isIndirect) {
966 if (isIndirect) {
967 l += 4;
968 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700969 oad(0xc481, l); /* add $xxx, %esp */
970 }
971
Jack Palevicha6535612009-05-13 16:24:17 -0700972 virtual int jumpOffset() {
973 return 5;
974 }
975
976 virtual int disassemble(FILE* out) {
Jack Palevich1cdef202009-05-22 12:06:27 -0700977 return 0;
Jack Palevicha6535612009-05-13 16:24:17 -0700978 }
979
Jack Paleviche7b59062009-05-19 17:12:17 -0700980 /* output a symbol and patch all calls to it */
981 virtual void gsym(int t) {
982 int n;
983 int pc = getPC();
984 while (t) {
985 n = *(int *) t; /* next value */
986 *(int *) t = pc - t - 4;
987 t = n;
988 }
989 }
990
Jack Palevich1cdef202009-05-22 12:06:27 -0700991 virtual int finishCompile() {
992 return 0;
993 }
994
Jack Palevich21a15a22009-05-11 14:49:29 -0700995 private:
Jack Paleviche7b59062009-05-19 17:12:17 -0700996
997 /** Output 1 to 4 bytes.
998 *
999 */
1000 void o(int n) {
1001 /* cannot use unsigned, so we must do a hack */
1002 while (n && n != -1) {
1003 ob(n & 0xff);
1004 n = n >> 8;
1005 }
1006 }
1007
1008 /* psym is used to put an instruction with a data field which is a
1009 reference to a symbol. It is in fact the same as oad ! */
1010 int psym(int n, int t) {
1011 return oad(n, t);
1012 }
1013
1014 /* instruction + address */
1015 int oad(int n, int t) {
1016 o(n);
1017 int result = getPC();
1018 o4(t);
1019 return result;
1020 }
1021
1022
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001023 static const int operatorHelper[];
1024
1025 int decodeOp(int op) {
1026 if (op < 0 || op > OP_COUNT) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07001027 error("Out-of-range operator: %d\n", op);
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001028 }
1029 return operatorHelper[op];
1030 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001031
Jack Palevich546b2242009-05-13 15:10:04 -07001032 void gmov(int l, int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001033 o(l + 0x83);
1034 oad((t < LOCAL) << 7 | 5, t);
1035 }
1036 };
1037
Jack Paleviche7b59062009-05-19 17:12:17 -07001038#endif // PROVIDE_X86_CODEGEN
1039
/**
 * Abstract character source that tracks the current line number.
 *
 * Subclasses supply characters through get(). The line counter starts at 1
 * and is advanced lazily: it is bumped when the first character *after* a
 * newline is requested, so getLine() still reports the line the newline
 * itself was on until then.
 */
class InputStream {
public:
    /** Return the next character from get(), updating the line counter. */
    int getChar() {
        if (mNewlinePending) {
            mLine += 1;
        }
        const int c = get();
        mNewlinePending = (c == '\n');
        return c;
    }

    /** Return the 1-based number of the line currently being read. */
    int getLine() {
        return mLine;
    }

protected:
    InputStream() {
        mLine = 1;
        mNewlinePending = false;
    }

private:
    /** Produce the next raw character. */
    virtual int get() = 0;

    int mLine;
    bool mNewlinePending;
};
1065
1066 class FileInputStream : public InputStream {
1067 public:
1068 FileInputStream(FILE* in) : f(in) {}
Jack Palevich1cdef202009-05-22 12:06:27 -07001069 private:
Jack Palevicheedf9d22009-06-04 16:23:40 -07001070 virtual int get() { return fgetc(f); }
Jack Palevich1cdef202009-05-22 12:06:27 -07001071 FILE* f;
1072 };
1073
1074 class TextInputStream : public InputStream {
1075 public:
1076 TextInputStream(const char* text, size_t textLength)
1077 : pText(text), mTextLength(textLength), mPosition(0) {
1078 }
Jack Palevicheedf9d22009-06-04 16:23:40 -07001079
1080 private:
Jack Palevich1cdef202009-05-22 12:06:27 -07001081 virtual int get() {
1082 return mPosition < mTextLength ? pText[mPosition++] : EOF;
1083 }
Jack Palevich1cdef202009-05-22 12:06:27 -07001084
Jack Palevich1cdef202009-05-22 12:06:27 -07001085 const char* pText;
1086 size_t mTextLength;
1087 size_t mPosition;
1088 };
1089
Jack Palevich653f42d2009-05-28 17:15:32 -07001090 int ch; // Current input character, or EOF
1091 intptr_t tok; // token
1092 intptr_t tokc; // token extra info
1093 int tokl; // token operator level
1094 intptr_t rsym; // return symbol
1095 intptr_t loc; // local variable index
1096 char* glo; // global variable index
1097 char* sym_stk;
1098 char* dstk; // Define stack
1099 char* dptr; // Macro state: Points to macro text during macro playback.
1100 int dch; // Macro state: Saves old value of ch during a macro playback.
1101 char* last_id;
Jack Palevichf1f39cc2009-05-29 18:03:15 -07001102 char* pGlobalBase;
Jack Palevich653f42d2009-05-28 17:15:32 -07001103 char* pVarsBase; // Value of variables
Jack Palevich1cdef202009-05-22 12:06:27 -07001104
1105 InputStream* file;
Jack Palevich21a15a22009-05-11 14:49:29 -07001106
1107 CodeBuf codeBuf;
Jack Palevich22305132009-05-13 10:58:45 -07001108 CodeGenerator* pGen;
Jack Palevich21a15a22009-05-11 14:49:29 -07001109
/**
 * Minimal growable byte string.
 *
 * The buffer (when present) is always NUL-terminated at index len().
 * mSize is the capacity in characters *excluding* that terminator, so the
 * allocation is mSize + 1 bytes. The buffer is owned and released with
 * free() unless it is handed off with orphan().
 *
 * NOTE: allocation failure in realloc() is not handled.
 */
class String {
public:
    String() {
        mpBase = 0;
        mUsed = 0;
        mSize = 0;
    }

    /**
     * Construct from len bytes at item.
     *
     * adopt == true:  take ownership of item as the buffer. The buffer is
     *                 assumed to hold exactly len characters, so the
     *                 capacity is recorded as len (not len + 1, which would
     *                 let a later append write one byte past it).
     * adopt == false: copy the bytes.
     */
    String(char* item, int len, bool adopt) {
        if (adopt) {
            mpBase = item;
            mUsed = len;
            mSize = len;
        } else {
            mpBase = 0;
            mUsed = 0;
            mSize = 0;
            appendBytes(item, len);
        }
    }

    ~String() {
        if (mpBase) {
            free(mpBase);
        }
    }

    /** Return the raw buffer; null for a string that never allocated. */
    inline char* getUnwrapped() {
        return mpBase;
    }

    /** Append a NUL-terminated C string. */
    void appendCStr(const char* s) {
        appendBytes(s, strlen(s));
    }

    /**
     * Append exactly n bytes from s. s does not need to be NUL-terminated:
     * only n bytes are read, and ensure() has already written the
     * terminator after the new end.
     */
    void appendBytes(const char* s, int n) {
        if (n < 0) {
            return;
        }
        char* dest = ensure(n);
        if (n > 0) {
            memcpy(dest, s, n);
        }
    }

    /** Append a single character (which may be '\0'). */
    void append(char c) {
        * ensure(1) = c;
    }

    /** Give up ownership of the buffer and reset to empty. */
    char* orphan() {
        char* result = mpBase;
        mpBase = 0;
        mUsed = 0;
        mSize = 0;
        return result;
    }

    /** Append printf-style formatted text. */
    void printf(const char* fmt,...) {
        va_list ap;
        va_start(ap, fmt);
        vprintf(fmt, ap);
        va_end(ap);
    }

    /**
     * Append vprintf-style formatted text. If vasprintf() fails nothing is
     * appended (its output pointer is undefined in that case, so it must
     * not be read or freed).
     */
    void vprintf(const char* fmt, va_list ap) {
        char* temp = 0;
        int numChars = vasprintf(&temp, fmt, ap);
        if (numChars < 0) {
            return;
        }
        appendBytes(temp, numChars);
        free(temp);
    }

    /** Number of characters stored, excluding the terminator. */
    inline size_t len() {
        return mUsed;
    }

private:
    /**
     * Make room for n more characters, write the terminator after the new
     * end, advance the length, and return a pointer to where the new
     * characters go. Also allocates when there is no buffer yet, so that
     * ensure(0) on an empty string does not write through a null pointer.
     */
    char* ensure(int n) {
        size_t newUsed = mUsed + n;
        if (newUsed > mSize || mpBase == 0) {
            size_t newSize = mSize * 2 + 10;
            if (newSize < newUsed) {
                newSize = newUsed;
            }
            mpBase = (char*) realloc(mpBase, newSize + 1);
            mSize = newSize;
        }
        mpBase[newUsed] = '\0';
        char* result = mpBase + mUsed;
        mUsed = newUsed;
        return result;
    }

    char* mpBase;
    size_t mUsed;
    size_t mSize;
};
1200
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001201 /**
1202 * Wrap an externally allocated string for use as a hash key.
1203 */
1204 class FakeString : public String {
1205 public:
1206 FakeString(char* string, size_t length) :
1207 String(string, length, true) {}
1208
1209 ~FakeString() {
1210 orphan();
1211 }
1212 };
1213
1214 template<class V> class StringTable {
1215 public:
1216 StringTable(size_t initialCapacity) {
1217 mpMap = hashmapCreate(initialCapacity, hashFn, equalsFn);
1218 }
1219
1220 ~StringTable() {
1221 clear();
1222 }
1223
1224 void clear() {
1225 hashmapForEach(mpMap, freeKeyValue, this);
1226 }
1227
1228 bool contains(String* pKey) {
1229 bool result = hashmapContainsKey(mpMap, pKey);
1230 return result;
1231 }
1232
1233 V* get(String* pKey) {
1234 V* result = (V*) hashmapGet(mpMap, pKey);
1235 return result;
1236 }
1237
1238 V* remove(String* pKey) {
1239 V* result = (V*) hashmapRemove(mpMap, pKey);
1240 return result;
1241 }
1242
1243 V* put(String* pKey, V* value) {
1244 V* result = (V*) hashmapPut(mpMap, pKey, value);
1245 if (result) {
1246 // The key was not adopted by the map, so delete it here.
1247 delete pKey;
1248 }
1249 return result;
1250 }
1251
1252 protected:
1253 static int hashFn(void* pKey) {
1254 String* pString = (String*) pKey;
1255 return hashmapHash(pString->getUnwrapped(), pString->len());
1256 }
1257
1258 static bool equalsFn(void* keyA, void* keyB) {
1259 String* pStringA = (String*) keyA;
1260 String* pStringB = (String*) keyB;
1261 return pStringA->len() == pStringB->len()
1262 && strcmp(pStringA->getUnwrapped(), pStringB->getUnwrapped())
1263 == 0;
1264 }
1265
1266 static bool freeKeyValue(void* key, void* value, void* context) {
1267 delete (String*) key;
1268 delete (V*) value;
1269 return true;
1270 }
1271
1272 Hashmap* mpMap;
1273 };
1274
1275 class MacroTable : public StringTable<String> {
1276 public:
1277 MacroTable() : StringTable<String>(10) {}
1278 };
1279
1280 template<class E> class Array {
1281 public:
1282 Array() {
1283 mpBase = 0;
1284 mUsed = 0;
1285 mSize = 0;
1286 }
1287
1288 ~Array() {
1289 if (mpBase) {
1290 free(mpBase);
1291 }
1292 }
1293
1294 E get(int i) {
1295 if (i < 0 || i > mUsed) {
1296 error("internal error: Index out of range");
1297 return E();
1298 }
1299 return mpBase[i];
1300 }
1301
1302 void set(int i, E val) {
1303 mpBase[i] = val;
1304 }
1305
1306 void pop() {
1307 if (mUsed > 0) {
1308 mUsed -= 1;
1309 }
1310 }
1311
1312 void push(E item) {
1313 * ensure(1) = item;
1314 }
1315
1316 size_t len() {
1317 return mUsed;
1318 }
1319
1320 private:
1321 E* ensure(int n) {
1322 size_t newUsed = mUsed + n;
1323 if (newUsed > mSize) {
1324 size_t newSize = mSize * 2 + 10;
1325 if (newSize < newUsed) {
1326 newSize = newUsed;
1327 }
1328 mpBase = (E*) realloc(mpBase, sizeof(E) * newSize);
1329 mSize = newSize;
1330 }
1331 E* result = mpBase + mUsed;
1332 mUsed = newUsed;
1333 return result;
1334 }
1335
1336 E* mpBase;
1337 size_t mUsed;
1338 size_t mSize;
1339 };
1340
1341 MacroTable mMacros;
1342
Jack Palevicheedf9d22009-06-04 16:23:40 -07001343 String mErrorBuf;
1344
Jack Palevichac0e95e2009-05-29 13:53:44 -07001345 jmp_buf mErrorRecoveryJumpBuf;
1346
Jack Palevicheedf9d22009-06-04 16:23:40 -07001347 String mPragmas;
1348 int mPragmaStringCount;
1349
Jack Palevich21a15a22009-05-11 14:49:29 -07001350 static const int ALLOC_SIZE = 99999;
1351
Jack Palevicheedf9d22009-06-04 16:23:40 -07001352 // Identifiers start at 0x100 and increase by # (chars + 1) * 8
Jack Palevich21a15a22009-05-11 14:49:29 -07001353 static const int TOK_IDENT = 0x100;
1354 static const int TOK_INT = 0x100;
Jack Palevichb7c81e92009-06-04 19:56:13 -07001355 static const int TOK_CHAR = TOK_INT + 4*8;
1356 static const int TOK_VOID = TOK_CHAR + 5*8;
1357 static const int TOK_IF = TOK_VOID + 5*8;
1358 static const int TOK_ELSE = TOK_IF + 3*8;
1359 static const int TOK_WHILE = TOK_ELSE + 5*8;
1360 static const int TOK_BREAK = TOK_WHILE + 6*8;
1361 static const int TOK_RETURN = TOK_BREAK + 6*8;
1362 static const int TOK_FOR = TOK_RETURN + 7*8;
1363 static const int TOK_PRAGMA = TOK_FOR + 4*8;
1364 static const int TOK_DEFINE = TOK_PRAGMA + 7*8;
1365 static const int TOK_MAIN = TOK_DEFINE + 7*8;
Jack Palevich21a15a22009-05-11 14:49:29 -07001366
1367 static const int TOK_DUMMY = 1;
1368 static const int TOK_NUM = 2;
1369
1370 static const int LOCAL = 0x200;
1371
1372 static const int SYM_FORWARD = 0;
1373 static const int SYM_DEFINE = 1;
1374
1375 /* tokens in string heap */
1376 static const int TAG_TOK = ' ';
Jack Palevich21a15a22009-05-11 14:49:29 -07001377
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001378 static const int OP_INCREMENT = 0;
1379 static const int OP_DECREMENT = 1;
1380 static const int OP_MUL = 2;
1381 static const int OP_DIV = 3;
1382 static const int OP_MOD = 4;
1383 static const int OP_PLUS = 5;
1384 static const int OP_MINUS = 6;
1385 static const int OP_SHIFT_LEFT = 7;
1386 static const int OP_SHIFT_RIGHT = 8;
1387 static const int OP_LESS_EQUAL = 9;
1388 static const int OP_GREATER_EQUAL = 10;
1389 static const int OP_LESS = 11;
1390 static const int OP_GREATER = 12;
1391 static const int OP_EQUALS = 13;
1392 static const int OP_NOT_EQUALS = 14;
1393 static const int OP_LOGICAL_AND = 15;
1394 static const int OP_LOGICAL_OR = 16;
1395 static const int OP_BIT_AND = 17;
1396 static const int OP_BIT_XOR = 18;
1397 static const int OP_BIT_OR = 19;
1398 static const int OP_BIT_NOT = 20;
1399 static const int OP_LOGICAL_NOT = 21;
1400 static const int OP_COUNT = 22;
1401
1402 /* Operators are searched from front, the two-character operators appear
1403 * before the single-character operators with the same first character.
1404 * @ is used to pad out single-character operators.
1405 */
1406 static const char* operatorChars;
1407 static const char operatorLevel[];
1408
Jack Palevich21a15a22009-05-11 14:49:29 -07001409 void pdef(int t) {
Jack Palevichf1f39cc2009-05-29 18:03:15 -07001410 if (dstk - sym_stk >= ALLOC_SIZE) {
1411 error("Symbol table exhausted");
1412 }
Jack Palevich653f42d2009-05-28 17:15:32 -07001413 *dstk++ = t;
Jack Palevich21a15a22009-05-11 14:49:29 -07001414 }
1415
1416 void inp() {
1417 if (dptr) {
Jack Palevich653f42d2009-05-28 17:15:32 -07001418 ch = *dptr++;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001419 if (ch == 0) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001420 dptr = 0;
1421 ch = dch;
1422 }
1423 } else
Jack Palevicheedf9d22009-06-04 16:23:40 -07001424 ch = file->getChar();
Jack Palevichb7c81e92009-06-04 19:56:13 -07001425#if 0
1426 printf("ch='%c' 0x%x\n", ch, ch);
1427#endif
Jack Palevich21a15a22009-05-11 14:49:29 -07001428 }
1429
1430 int isid() {
Jack Palevich546b2242009-05-13 15:10:04 -07001431 return isalnum(ch) | (ch == '_');
Jack Palevich21a15a22009-05-11 14:49:29 -07001432 }
1433
1434 /* read a character constant */
1435 void getq() {
1436 if (ch == '\\') {
1437 inp();
1438 if (ch == 'n')
1439 ch = '\n';
1440 }
1441 }
1442
1443 void next() {
1444 int l, a;
1445
Jack Palevich546b2242009-05-13 15:10:04 -07001446 while (isspace(ch) | (ch == '#')) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001447 if (ch == '#') {
1448 inp();
1449 next();
1450 if (tok == TOK_DEFINE) {
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001451 doDefine();
Jack Palevicheedf9d22009-06-04 16:23:40 -07001452 } else if (tok == TOK_PRAGMA) {
1453 doPragma();
1454 } else {
1455 error("Unsupported preprocessor directive \"%s\"", last_id);
Jack Palevich21a15a22009-05-11 14:49:29 -07001456 }
Jack Palevicheedf9d22009-06-04 16:23:40 -07001457
Jack Palevich21a15a22009-05-11 14:49:29 -07001458 }
1459 inp();
1460 }
1461 tokl = 0;
1462 tok = ch;
1463 /* encode identifiers & numbers */
1464 if (isid()) {
1465 pdef(TAG_TOK);
1466 last_id = dstk;
1467 while (isid()) {
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001468 pdef(ch);
1469 inp();
Jack Palevichae54f1f2009-05-08 14:54:15 -07001470 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001471 if (isdigit(tok)) {
Jack Palevich653f42d2009-05-28 17:15:32 -07001472 tokc = strtol(last_id, 0, 0);
Jack Palevich21a15a22009-05-11 14:49:29 -07001473 tok = TOK_NUM;
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001474 } else {
Jack Palevichf1f39cc2009-05-29 18:03:15 -07001475 if (dstk - sym_stk + 1 > ALLOC_SIZE) {
1476 error("symbol stack overflow");
1477 }
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001478 FakeString token(last_id, dstk-last_id);
1479 // Is this a macro?
1480 String* pValue = mMacros.get(&token);
1481 if (pValue) {
1482 // Yes, it is a macro
1483 dstk = last_id-1;
1484 dptr = pValue->getUnwrapped();
1485 dch = ch;
1486 inp();
1487 next();
1488 } else {
1489 * dstk = TAG_TOK; /* no need to mark end of string (we
1490 suppose data is initialized to zero by calloc) */
1491 tok = (intptr_t) (strstr(sym_stk, (last_id - 1))
1492 - sym_stk);
1493 * dstk = 0; /* mark real end of ident for dlsym() */
1494 tok = tok * 8 + TOK_IDENT;
1495 if (tok > TOK_DEFINE) {
1496 if (tok + 8 > ALLOC_SIZE) {
1497 error("Variable Table overflow.");
1498 }
1499 tok = (intptr_t) (pVarsBase + tok);
1500 /* printf("tok=%s %x\n", last_id, tok); */
Jack Palevich21a15a22009-05-11 14:49:29 -07001501 }
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001502 }
1503 }
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001504 } else {
Jack Palevich21a15a22009-05-11 14:49:29 -07001505 inp();
1506 if (tok == '\'') {
1507 tok = TOK_NUM;
1508 getq();
1509 tokc = ch;
1510 inp();
1511 inp();
Jack Palevich546b2242009-05-13 15:10:04 -07001512 } else if ((tok == '/') & (ch == '*')) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001513 inp();
1514 while (ch) {
1515 while (ch != '*')
1516 inp();
1517 inp();
1518 if (ch == '/')
1519 ch = 0;
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001520 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001521 inp();
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001522 next();
Jack Palevichbd894902009-05-14 19:35:31 -07001523 } else if ((tok == '/') & (ch == '/')) {
1524 inp();
1525 while (ch && (ch != '\n')) {
1526 inp();
1527 }
1528 inp();
1529 next();
Jack Palevich21a15a22009-05-11 14:49:29 -07001530 } else {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001531 const char* t = operatorChars;
1532 int opIndex = 0;
Jack Palevich546b2242009-05-13 15:10:04 -07001533 while ((l = *t++) != 0) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001534 a = *t++;
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001535 tokl = operatorLevel[opIndex];
1536 tokc = opIndex;
Jack Palevich546b2242009-05-13 15:10:04 -07001537 if ((l == tok) & ((a == ch) | (a == '@'))) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001538#if 0
1539 printf("%c%c -> tokl=%d tokc=0x%x\n",
1540 l, a, tokl, tokc);
1541#endif
1542 if (a == ch) {
1543 inp();
1544 tok = TOK_DUMMY; /* dummy token for double tokens */
1545 }
1546 break;
1547 }
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001548 opIndex++;
1549 }
1550 if (l == 0) {
1551 tokl = 0;
1552 tokc = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07001553 }
1554 }
1555 }
1556#if 0
1557 {
Jack Palevich653f42d2009-05-28 17:15:32 -07001558 char* p;
Jack Palevich21a15a22009-05-11 14:49:29 -07001559
1560 printf("tok=0x%x ", tok);
1561 if (tok >= TOK_IDENT) {
1562 printf("'");
1563 if (tok> TOK_DEFINE)
Jack Palevich653f42d2009-05-28 17:15:32 -07001564 p = sym_stk + 1 + ((char*) tok - pVarsBase - TOK_IDENT) / 8;
Jack Palevich21a15a22009-05-11 14:49:29 -07001565 else
1566 p = sym_stk + 1 + (tok - TOK_IDENT) / 8;
Jack Palevich653f42d2009-05-28 17:15:32 -07001567 while (*p != TAG_TOK && *p)
1568 printf("%c", *p++);
Jack Palevich21a15a22009-05-11 14:49:29 -07001569 printf("'\n");
1570 } else if (tok == TOK_NUM) {
1571 printf("%d\n", tokc);
1572 } else {
1573 printf("'%c'\n", tok);
1574 }
1575 }
1576#endif
1577 }
1578
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001579 void doDefine() {
1580 String* pName = new String();
1581 while (isspace(ch)) {
1582 inp();
1583 }
1584 while (isid()) {
1585 pName->append(ch);
1586 inp();
1587 }
1588 if (ch == '(') {
1589 delete pName;
1590 error("Defines with arguments not supported");
1591 }
1592 while (isspace(ch)) {
1593 inp();
1594 }
1595 String* pValue = new String();
1596 while (ch != '\n' && ch != EOF) {
1597 pValue->append(ch);
1598 inp();
1599 }
1600 delete mMacros.put(pName, pValue);
1601 }
1602
Jack Palevicheedf9d22009-06-04 16:23:40 -07001603 void doPragma() {
1604 // # pragma name(val)
1605 int state = 0;
1606 while(ch != EOF && ch != '\n' && state < 10) {
1607 switch(state) {
1608 case 0:
1609 if (isspace(ch)) {
1610 inp();
1611 } else {
1612 state++;
1613 }
1614 break;
1615 case 1:
1616 if (isalnum(ch)) {
1617 mPragmas.append(ch);
1618 inp();
1619 } else if (ch == '(') {
1620 mPragmas.append(0);
1621 inp();
1622 state++;
1623 } else {
1624 state = 11;
1625 }
1626 break;
1627 case 2:
1628 if (isalnum(ch)) {
1629 mPragmas.append(ch);
1630 inp();
1631 } else if (ch == ')') {
1632 mPragmas.append(0);
1633 inp();
1634 state = 10;
1635 } else {
1636 state = 11;
1637 }
1638 break;
1639 }
1640 }
1641 if(state != 10) {
1642 error("Unexpected pragma syntax");
1643 }
1644 mPragmaStringCount += 2;
1645 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001646
Jack Palevichac0e95e2009-05-29 13:53:44 -07001647 virtual void verror(const char* fmt, va_list ap) {
Jack Palevicheedf9d22009-06-04 16:23:40 -07001648 mErrorBuf.printf("%ld: ", file->getLine());
1649 mErrorBuf.vprintf(fmt, ap);
1650 mErrorBuf.printf("\n");
Jack Palevichac0e95e2009-05-29 13:53:44 -07001651 longjmp(mErrorRecoveryJumpBuf, 1);
Jack Palevich21a15a22009-05-11 14:49:29 -07001652 }
1653
Jack Palevich8b0624c2009-05-20 12:12:06 -07001654 void skip(intptr_t c) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001655 if (tok != c) {
1656 error("'%c' expected", c);
1657 }
1658 next();
1659 }
1660
Jack Palevich21a15a22009-05-11 14:49:29 -07001661 /* l is one if '=' parsing wanted (quick hack) */
Jack Palevich8b0624c2009-05-20 12:12:06 -07001662 void unary(intptr_t l) {
Jack Palevich653f42d2009-05-28 17:15:32 -07001663 intptr_t n, t, a;
1664 int c;
Jack Palevich546b2242009-05-13 15:10:04 -07001665 t = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07001666 n = 1; /* type of expression 0 = forward, 1 = value, other =
1667 lvalue */
1668 if (tok == '\"') {
Jack Palevich653f42d2009-05-28 17:15:32 -07001669 pGen->li((int) glo);
Jack Palevich21a15a22009-05-11 14:49:29 -07001670 while (ch != '\"') {
1671 getq();
Jack Palevichf1f39cc2009-05-29 18:03:15 -07001672 *allocGlobalSpace(1) = ch;
Jack Palevich21a15a22009-05-11 14:49:29 -07001673 inp();
1674 }
Jack Palevich653f42d2009-05-28 17:15:32 -07001675 *glo = 0;
Jack Palevichf1f39cc2009-05-29 18:03:15 -07001676 /* align heap */
1677 allocGlobalSpace((char*) (((intptr_t) glo + 4) & -4) - glo);
Jack Palevich21a15a22009-05-11 14:49:29 -07001678 inp();
1679 next();
1680 } else {
1681 c = tokl;
1682 a = tokc;
1683 t = tok;
1684 next();
1685 if (t == TOK_NUM) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001686 pGen->li(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07001687 } else if (c == 2) {
1688 /* -, +, !, ~ */
1689 unary(0);
Jack Palevich1cdef202009-05-22 12:06:27 -07001690 pGen->clearR1();
Jack Palevich21a15a22009-05-11 14:49:29 -07001691 if (t == '!')
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001692 pGen->gcmp(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07001693 else
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001694 pGen->genOp(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07001695 } else if (t == '(') {
1696 expr();
1697 skip(')');
1698 } else if (t == '*') {
1699 /* parse cast */
1700 skip('(');
1701 t = tok; /* get type */
1702 next(); /* skip int/char/void */
1703 next(); /* skip '*' or '(' */
1704 if (tok == '*') {
1705 /* function type */
1706 skip('*');
1707 skip(')');
1708 skip('(');
1709 skip(')');
1710 t = 0;
1711 }
1712 skip(')');
1713 unary(0);
1714 if (tok == '=') {
1715 next();
Jack Palevich1cdef202009-05-22 12:06:27 -07001716 pGen->pushR0();
Jack Palevich21a15a22009-05-11 14:49:29 -07001717 expr();
Jack Palevich1cdef202009-05-22 12:06:27 -07001718 pGen->popR1();
1719 pGen->storeR0ToR1(t == TOK_INT);
Jack Palevich21a15a22009-05-11 14:49:29 -07001720 } else if (t) {
Jack Palevich1cdef202009-05-22 12:06:27 -07001721 pGen->loadR0FromR0(t == TOK_INT);
Jack Palevich21a15a22009-05-11 14:49:29 -07001722 }
1723 } else if (t == '&') {
Jack Palevich1cdef202009-05-22 12:06:27 -07001724 pGen->leaR0(*(int *) tok);
Jack Palevich21a15a22009-05-11 14:49:29 -07001725 next();
1726 } else {
1727 n = *(int *) t;
1728 /* forward reference: try dlsym */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07001729 if (!n) {
Jack Palevich653f42d2009-05-28 17:15:32 -07001730 n = (intptr_t) dlsym(RTLD_DEFAULT, last_id);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07001731 }
Jack Palevich546b2242009-05-13 15:10:04 -07001732 if ((tok == '=') & l) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001733 /* assignment */
1734 next();
1735 expr();
Jack Palevich1cdef202009-05-22 12:06:27 -07001736 pGen->storeR0(n);
Jack Palevich21a15a22009-05-11 14:49:29 -07001737 } else if (tok != '(') {
1738 /* variable */
Jack Palevich1cdef202009-05-22 12:06:27 -07001739 pGen->loadR0(n, tokl == 11, tokc);
Jack Palevich21a15a22009-05-11 14:49:29 -07001740 if (tokl == 11) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001741 next();
1742 }
1743 }
1744 }
1745 }
1746
1747 /* function call */
1748 if (tok == '(') {
1749 if (n == 1)
Jack Palevich1cdef202009-05-22 12:06:27 -07001750 pGen->pushR0();
Jack Palevich21a15a22009-05-11 14:49:29 -07001751
1752 /* push args and invert order */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07001753 a = pGen->beginFunctionCallArguments();
Jack Palevich21a15a22009-05-11 14:49:29 -07001754 next();
1755 l = 0;
1756 while (tok != ')') {
1757 expr();
Jack Palevich1cdef202009-05-22 12:06:27 -07001758 pGen->storeR0ToArg(l);
Jack Palevichbbf8ab52009-05-11 11:54:30 -07001759 if (tok == ',')
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001760 next();
Jack Palevich21a15a22009-05-11 14:49:29 -07001761 l = l + 4;
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001762 }
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07001763 pGen->endFunctionCallArguments(a, l);
Jack Palevich21a15a22009-05-11 14:49:29 -07001764 next();
1765 if (!n) {
1766 /* forward reference */
1767 t = t + 4;
1768 *(int *) t = pGen->callForward(*(int *) t);
1769 } else if (n == 1) {
1770 pGen->callIndirect(l);
Jack Palevich21a15a22009-05-11 14:49:29 -07001771 } else {
Jack Palevich7810bc92009-05-15 14:31:47 -07001772 pGen->callRelative(n - codeBuf.getPC() - pGen->jumpOffset());
Jack Palevich21a15a22009-05-11 14:49:29 -07001773 }
Jack Palevich3d474a72009-05-15 15:12:38 -07001774 if (l | (n == 1))
Jack Palevich7810bc92009-05-15 14:31:47 -07001775 pGen->adjustStackAfterCall(l, n == 1);
Jack Palevich21a15a22009-05-11 14:49:29 -07001776 }
1777 }
1778
Jack Palevich653f42d2009-05-28 17:15:32 -07001779 void sum(int l) {
Jack Palevich8b0624c2009-05-20 12:12:06 -07001780 intptr_t t, n, a;
Jack Palevich546b2242009-05-13 15:10:04 -07001781 t = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07001782 if (l-- == 1)
1783 unary(1);
1784 else {
1785 sum(l);
1786 a = 0;
1787 while (l == tokl) {
1788 n = tok;
1789 t = tokc;
1790 next();
1791
1792 if (l > 8) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001793 a = pGen->gtst(t == OP_LOGICAL_OR, a); /* && and || output code generation */
Jack Palevich21a15a22009-05-11 14:49:29 -07001794 sum(l);
1795 } else {
Jack Palevich1cdef202009-05-22 12:06:27 -07001796 pGen->pushR0();
Jack Palevich21a15a22009-05-11 14:49:29 -07001797 sum(l);
Jack Palevich1cdef202009-05-22 12:06:27 -07001798 pGen->popR1();
Jack Palevich21a15a22009-05-11 14:49:29 -07001799
Jack Palevich546b2242009-05-13 15:10:04 -07001800 if ((l == 4) | (l == 5)) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001801 pGen->gcmp(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07001802 } else {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001803 pGen->genOp(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07001804 }
1805 }
1806 }
1807 /* && and || output code generation */
1808 if (a && l > 8) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001809 a = pGen->gtst(t == OP_LOGICAL_OR, a);
1810 pGen->li(t != OP_LOGICAL_OR);
Jack Palevicha6535612009-05-13 16:24:17 -07001811 pGen->gjmp(5); /* jmp $ + 5 (sizeof li, FIXME for ARM) */
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001812 pGen->gsym(a);
1813 pGen->li(t == OP_LOGICAL_OR);
Jack Palevich21a15a22009-05-11 14:49:29 -07001814 }
1815 }
1816 }
1817
1818 void expr() {
1819 sum(11);
1820 }
1821
1822 int test_expr() {
1823 expr();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001824 return pGen->gtst(0, 0);
Jack Palevich21a15a22009-05-11 14:49:29 -07001825 }
1826
Jack Palevich8b0624c2009-05-20 12:12:06 -07001827 void block(intptr_t l) {
1828 intptr_t a, n, t;
Jack Palevich21a15a22009-05-11 14:49:29 -07001829
1830 if (tok == TOK_IF) {
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001831 next();
1832 skip('(');
Jack Palevich21a15a22009-05-11 14:49:29 -07001833 a = test_expr();
1834 skip(')');
1835 block(l);
1836 if (tok == TOK_ELSE) {
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001837 next();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001838 n = pGen->gjmp(0); /* jmp */
1839 pGen->gsym(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07001840 block(l);
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001841 pGen->gsym(n); /* patch else jmp */
Jack Palevich21a15a22009-05-11 14:49:29 -07001842 } else {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001843 pGen->gsym(a); /* patch if test */
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001844 }
Jack Palevich546b2242009-05-13 15:10:04 -07001845 } else if ((tok == TOK_WHILE) | (tok == TOK_FOR)) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001846 t = tok;
1847 next();
1848 skip('(');
1849 if (t == TOK_WHILE) {
Jack Palevicha6535612009-05-13 16:24:17 -07001850 n = codeBuf.getPC(); // top of loop, target of "next" iteration
Jack Palevich21a15a22009-05-11 14:49:29 -07001851 a = test_expr();
1852 } else {
1853 if (tok != ';')
1854 expr();
1855 skip(';');
1856 n = codeBuf.getPC();
1857 a = 0;
1858 if (tok != ';')
1859 a = test_expr();
1860 skip(';');
1861 if (tok != ')') {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001862 t = pGen->gjmp(0);
Jack Palevich21a15a22009-05-11 14:49:29 -07001863 expr();
Jack Palevicha6535612009-05-13 16:24:17 -07001864 pGen->gjmp(n - codeBuf.getPC() - pGen->jumpOffset());
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001865 pGen->gsym(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07001866 n = t + 4;
1867 }
1868 }
1869 skip(')');
Jack Palevich8b0624c2009-05-20 12:12:06 -07001870 block((intptr_t) &a);
Jack Palevicha6535612009-05-13 16:24:17 -07001871 pGen->gjmp(n - codeBuf.getPC() - pGen->jumpOffset()); /* jmp */
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001872 pGen->gsym(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07001873 } else if (tok == '{') {
1874 next();
1875 /* declarations */
Jack Palevichb7c81e92009-06-04 19:56:13 -07001876 localDeclarations();
Jack Palevich21a15a22009-05-11 14:49:29 -07001877 while (tok != '}')
1878 block(l);
1879 next();
1880 } else {
1881 if (tok == TOK_RETURN) {
1882 next();
1883 if (tok != ';')
1884 expr();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001885 rsym = pGen->gjmp(rsym); /* jmp */
Jack Palevich21a15a22009-05-11 14:49:29 -07001886 } else if (tok == TOK_BREAK) {
1887 next();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001888 *(int *) l = pGen->gjmp(*(int *) l);
Jack Palevich21a15a22009-05-11 14:49:29 -07001889 } else if (tok != ';')
1890 expr();
1891 skip(';');
Jack Paleviche27bf3e2009-05-10 14:09:03 -07001892 }
1893 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001894
/*
 * A Type is an int with two bit fields: the low four bits hold the base
 * type, bits 4..7 hold the pointer indirection count.
 */
typedef int Type;

/* Base type codes (stored under TY_BASE_TYPE_MASK). */
static const Type TY_UNKNOWN = 0;
static const Type TY_INT = 1;
static const Type TY_CHAR = 2;
static const Type TY_VOID = 3;

/* Bit-field layout. */
static const int TY_BASE_TYPE_MASK = 0xf;
static const int TY_INDIRECTION_SHIFT = 4;
static const int TY_INDIRECTION_MASK = 0xf0;

/* Largest indirection count that fits in the four-bit field. */
static const int MAX_INDIRECTION_COUNT = 15;
Jack Palevich21a15a22009-05-11 14:49:29 -07001904
Jack Palevichb7c81e92009-06-04 19:56:13 -07001905 Type getBaseType(Type t) {
1906 return t & TY_BASE_TYPE_MASK;
1907 }
1908
1909 int getIndirectionCount(Type t) {
1910 return (TY_INDIRECTION_MASK & t) >> TY_INDIRECTION_SHIFT;
1911 }
1912
1913 void setIndirectionCount(Type& t, int count) {
1914 t = ((TY_INDIRECTION_MASK & (count << TY_INDIRECTION_SHIFT))
1915 | (t & ~TY_INDIRECTION_MASK));
1916 }
1917
1918 bool acceptType(Type& t) {
1919 t = TY_UNKNOWN;
1920 if (tok == TOK_INT) {
1921 t = TY_INT;
1922 } else if (tok == TOK_CHAR) {
1923 t = TY_CHAR;
1924 } else if (tok == TOK_VOID) {
1925 t = TY_VOID;
1926 } else {
1927 return false;
1928 }
1929 next();
1930 return true;
1931 }
1932
1933 Type acceptPointerDeclaration(Type& base) {
1934 Type t = base;
1935 int indirectionCount = 0;
1936 while (tok == '*' && indirectionCount <= MAX_INDIRECTION_COUNT) {
1937 next();
1938 indirectionCount++;
1939 }
1940 if (indirectionCount > MAX_INDIRECTION_COUNT) {
1941 error("Too many levels of pointer. Max %d", MAX_INDIRECTION_COUNT);
1942 }
1943 setIndirectionCount(t, indirectionCount);
1944 return t;
1945 }
1946
1947 void expectType(Type& t) {
1948 if (!acceptType(t)) {
1949 error("Expected a type.");
1950 }
1951 }
1952
1953 void checkSymbol() {
1954 if (tok <= TOK_DEFINE) {
1955 error("Expected a symbol");
1956 }
1957 }
1958
1959 void localDeclarations() {
1960 intptr_t a;
1961 Type base;
1962
1963 while (acceptType(base)) {
1964 while (tok != ';') {
1965 Type t = acceptPointerDeclaration(t);
1966 checkSymbol();
1967 loc = loc + 4;
1968 *(int *) tok = -loc;
1969
Jack Palevich21a15a22009-05-11 14:49:29 -07001970 next();
Jack Palevichb7c81e92009-06-04 19:56:13 -07001971 if (tok == ',')
1972 next();
1973 }
1974 skip(';');
1975 }
1976 }
1977
1978 void globalDeclarations() {
1979 while (tok != EOF) {
1980 Type base;
1981 expectType(base);
1982 Type t = acceptPointerDeclaration(t);
1983 checkSymbol();
1984 int name = tok;
1985 next();
1986 if (tok == ',' || tok == ';') {
1987 // it's a variable declaration
1988 for(;;) {
1989 *(int* *) name = (int*) allocGlobalSpace(4);
1990 if (tok != ',') {
1991 break;
Jack Palevich21a15a22009-05-11 14:49:29 -07001992 }
1993 next();
Jack Palevichb7c81e92009-06-04 19:56:13 -07001994 t = acceptPointerDeclaration(t);
1995 checkSymbol();
1996 name = tok;
1997 next();
Jack Palevich21a15a22009-05-11 14:49:29 -07001998 }
1999 skip(';');
2000 } else {
Jack Palevichb7c81e92009-06-04 19:56:13 -07002001 /* patch forward references (XXX: does not work for function
Jack Palevich21a15a22009-05-11 14:49:29 -07002002 pointers) */
Jack Palevichb7c81e92009-06-04 19:56:13 -07002003 pGen->gsym(*(int *) (name + 4));
Jack Palevich21a15a22009-05-11 14:49:29 -07002004 /* put function address */
Jack Palevichb7c81e92009-06-04 19:56:13 -07002005 *(int *) name = codeBuf.getPC();
Jack Palevich21a15a22009-05-11 14:49:29 -07002006 skip('(');
Jack Palevichb7c81e92009-06-04 19:56:13 -07002007 intptr_t a = 8;
Jack Palevich546b2242009-05-13 15:10:04 -07002008 int argCount = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002009 while (tok != ')') {
Jack Palevichb7c81e92009-06-04 19:56:13 -07002010 Type aType;
2011 expectType(aType);
2012 aType = acceptPointerDeclaration(aType);
2013 checkSymbol();
Jack Palevich21a15a22009-05-11 14:49:29 -07002014 /* read param name and compute offset */
2015 *(int *) tok = a;
2016 a = a + 4;
2017 next();
2018 if (tok == ',')
2019 next();
Jack Palevich546b2242009-05-13 15:10:04 -07002020 argCount++;
Jack Palevich21a15a22009-05-11 14:49:29 -07002021 }
Jack Palevichb7c81e92009-06-04 19:56:13 -07002022 skip(')'); /* skip ')' */
Jack Palevich21a15a22009-05-11 14:49:29 -07002023 rsym = loc = 0;
Jack Palevich546b2242009-05-13 15:10:04 -07002024 a = pGen->functionEntry(argCount);
Jack Palevich21a15a22009-05-11 14:49:29 -07002025 block(0);
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002026 pGen->gsym(rsym);
Jack Palevich546b2242009-05-13 15:10:04 -07002027 pGen->functionExit(argCount, a, loc);
Jack Palevich21a15a22009-05-11 14:49:29 -07002028 }
2029 }
2030 }
2031
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002032 char* allocGlobalSpace(int bytes) {
2033 if (glo - pGlobalBase + bytes > ALLOC_SIZE) {
2034 error("Global space exhausted");
2035 }
2036 char* result = glo;
2037 glo += bytes;
2038 return result;
2039 }
2040
Jack Palevich21a15a22009-05-11 14:49:29 -07002041 void cleanup() {
2042 if (sym_stk != 0) {
Jack Palevich653f42d2009-05-28 17:15:32 -07002043 free(sym_stk);
Jack Palevich21a15a22009-05-11 14:49:29 -07002044 sym_stk = 0;
2045 }
2046 if (pGlobalBase != 0) {
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002047 free(pGlobalBase);
Jack Palevich21a15a22009-05-11 14:49:29 -07002048 pGlobalBase = 0;
2049 }
2050 if (pVarsBase != 0) {
2051 free(pVarsBase);
2052 pVarsBase = 0;
2053 }
2054 if (pGen) {
2055 delete pGen;
2056 pGen = 0;
2057 }
Jack Palevich1cdef202009-05-22 12:06:27 -07002058 if (file) {
2059 delete file;
2060 file = 0;
2061 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002062 }
2063
2064 void clear() {
2065 tok = 0;
2066 tokc = 0;
2067 tokl = 0;
2068 ch = 0;
Jack Palevich653f42d2009-05-28 17:15:32 -07002069 pVarsBase = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002070 rsym = 0;
2071 loc = 0;
2072 glo = 0;
2073 sym_stk = 0;
2074 dstk = 0;
2075 dptr = 0;
2076 dch = 0;
2077 last_id = 0;
2078 file = 0;
2079 pGlobalBase = 0;
2080 pVarsBase = 0;
2081 pGen = 0;
Jack Palevicheedf9d22009-06-04 16:23:40 -07002082 mPragmaStringCount = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002083 }
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002084
Jack Palevich22305132009-05-13 10:58:45 -07002085 void setArchitecture(const char* architecture) {
2086 delete pGen;
2087 pGen = 0;
2088
2089 if (architecture != NULL) {
Jack Paleviche7b59062009-05-19 17:12:17 -07002090#ifdef PROVIDE_ARM_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -07002091 if (! pGen && strcmp(architecture, "arm") == 0) {
Jack Palevich22305132009-05-13 10:58:45 -07002092 pGen = new ARMCodeGenerator();
Jack Palevich8b0624c2009-05-20 12:12:06 -07002093 }
Jack Paleviche7b59062009-05-19 17:12:17 -07002094#endif
Jack Paleviche7b59062009-05-19 17:12:17 -07002095#ifdef PROVIDE_X86_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -07002096 if (! pGen && strcmp(architecture, "x86") == 0) {
Jack Palevich22305132009-05-13 10:58:45 -07002097 pGen = new X86CodeGenerator();
Jack Palevich8b0624c2009-05-20 12:12:06 -07002098 }
Jack Paleviche7b59062009-05-19 17:12:17 -07002099#endif
Jack Palevich8b0624c2009-05-20 12:12:06 -07002100 if (!pGen ) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07002101 error("Unknown architecture %s\n", architecture);
Jack Palevich22305132009-05-13 10:58:45 -07002102 }
2103 }
2104
2105 if (pGen == NULL) {
Jack Paleviche7b59062009-05-19 17:12:17 -07002106#if defined(DEFAULT_ARM_CODEGEN)
Jack Palevich22305132009-05-13 10:58:45 -07002107 pGen = new ARMCodeGenerator();
Jack Paleviche7b59062009-05-19 17:12:17 -07002108#elif defined(DEFAULT_X86_CODEGEN)
2109 pGen = new X86CodeGenerator();
2110#endif
2111 }
2112 if (pGen == NULL) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07002113 error("No code generator defined.");
Jack Palevich22305132009-05-13 10:58:45 -07002114 }
Jack Palevichac0e95e2009-05-29 13:53:44 -07002115 pGen->setErrorSink(this);
Jack Palevich22305132009-05-13 10:58:45 -07002116 }
2117
Jack Palevich77ae76e2009-05-10 19:59:24 -07002118public:
/* Compiler options; architecture defaults to null. */
struct args {
    args() : architecture(0) {
    }
    const char* architecture;
};
2125
Jack Paleviche7b59062009-05-19 17:12:17 -07002126 Compiler() {
Jack Palevich21a15a22009-05-11 14:49:29 -07002127 clear();
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002128 }
Jack Palevichbbf8ab52009-05-11 11:54:30 -07002129
Jack Paleviche7b59062009-05-19 17:12:17 -07002130 ~Compiler() {
Jack Palevich21a15a22009-05-11 14:49:29 -07002131 cleanup();
2132 }
2133
Jack Palevich1cdef202009-05-22 12:06:27 -07002134 int compile(const char* text, size_t textLength) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07002135 int result;
2136 if (! (result = setjmp(mErrorRecoveryJumpBuf))) {
2137 cleanup();
2138 clear();
2139 codeBuf.init(ALLOC_SIZE);
2140 setArchitecture(NULL);
2141 if (!pGen) {
2142 return -1;
2143 }
2144 pGen->init(&codeBuf);
2145 file = new TextInputStream(text, textLength);
2146 sym_stk = (char*) calloc(1, ALLOC_SIZE);
Jack Palevicheedf9d22009-06-04 16:23:40 -07002147 static const char* predefinedSymbols =
Jack Palevichb7c81e92009-06-04 19:56:13 -07002148 " int char void"
2149 " if else while break return for"
2150 " pragma define main ";
Jack Palevicheedf9d22009-06-04 16:23:40 -07002151 dstk = strcpy(sym_stk, predefinedSymbols)
2152 + strlen(predefinedSymbols);
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002153 pGlobalBase = (char*) calloc(1, ALLOC_SIZE);
2154 glo = pGlobalBase;
Jack Palevichac0e95e2009-05-29 13:53:44 -07002155 pVarsBase = (char*) calloc(1, ALLOC_SIZE);
2156 inp();
2157 next();
Jack Palevichb7c81e92009-06-04 19:56:13 -07002158 globalDeclarations();
Jack Palevichac0e95e2009-05-29 13:53:44 -07002159 pGen->finishCompile();
Jack Palevich8b0624c2009-05-20 12:12:06 -07002160 }
Jack Palevichac0e95e2009-05-29 13:53:44 -07002161 return result;
Jack Palevich21a15a22009-05-11 14:49:29 -07002162 }
2163
2164 int run(int argc, char** argv) {
2165 typedef int (*mainPtr)(int argc, char** argv);
Jack Palevich653f42d2009-05-28 17:15:32 -07002166 mainPtr aMain = (mainPtr) *(int*) (pVarsBase + TOK_MAIN);
Jack Palevich21a15a22009-05-11 14:49:29 -07002167 if (!aMain) {
2168 fprintf(stderr, "Could not find function \"main\".\n");
2169 return -1;
2170 }
2171 return aMain(argc, argv);
2172 }
2173
2174 int dump(FILE* out) {
2175 fwrite(codeBuf.getBase(), 1, codeBuf.getSize(), out);
2176 return 0;
2177 }
Jack Palevich77ae76e2009-05-10 19:59:24 -07002178
Jack Palevicha6535612009-05-13 16:24:17 -07002179 int disassemble(FILE* out) {
2180 return pGen->disassemble(out);
2181 }
2182
Jack Palevich1cdef202009-05-22 12:06:27 -07002183 /* Look through the symbol table to find a symbol.
2184 * If found, return its value.
2185 */
2186 void* lookup(const char* name) {
2187 if (!sym_stk) {
2188 return NULL;
2189 }
2190 size_t nameLen = strlen(name);
Jack Palevich653f42d2009-05-28 17:15:32 -07002191 char* pSym = sym_stk;
Jack Palevich1cdef202009-05-22 12:06:27 -07002192 char c;
2193 for(;;) {
2194 c = *pSym++;
2195 if (c == 0) {
2196 break;
2197 }
2198 if (c == TAG_TOK) {
2199 if (memcmp(pSym, name, nameLen) == 0
2200 && pSym[nameLen] == TAG_TOK) {
Jack Palevich653f42d2009-05-28 17:15:32 -07002201 int tok = pSym - 1 - sym_stk;
Jack Palevich1cdef202009-05-22 12:06:27 -07002202 tok = tok * 8 + TOK_IDENT;
2203 if (tok <= TOK_DEFINE) {
2204 return 0;
2205 } else {
Jack Palevich653f42d2009-05-28 17:15:32 -07002206 tok = (intptr_t) (pVarsBase + tok);
Jack Palevich1cdef202009-05-22 12:06:27 -07002207 return * (void**) tok;
2208 }
2209 }
2210 }
2211 }
2212 return NULL;
2213 }
2214
Jack Palevicheedf9d22009-06-04 16:23:40 -07002215 void getPragmas(ACCsizei* actualStringCount,
2216 ACCsizei maxStringCount, ACCchar** strings) {
2217 int stringCount = mPragmaStringCount;
2218 if (actualStringCount) {
2219 *actualStringCount = stringCount;
2220 }
2221 if (stringCount > maxStringCount) {
2222 stringCount = maxStringCount;
2223 }
2224 if (strings) {
2225 char* pPragmas = mPragmas.getUnwrapped();
2226 while (stringCount-- > 0) {
2227 *strings++ = pPragmas;
2228 pPragmas += strlen(pPragmas) + 1;
2229 }
2230 }
2231 }
2232
Jack Palevichac0e95e2009-05-29 13:53:44 -07002233 char* getErrorMessage() {
Jack Palevicheedf9d22009-06-04 16:23:40 -07002234 return mErrorBuf.getUnwrapped();
Jack Palevichac0e95e2009-05-29 13:53:44 -07002235 }
2236
Jack Palevich77ae76e2009-05-10 19:59:24 -07002237};
2238
Jack Paleviche7b59062009-05-19 17:12:17 -07002239const char* Compiler::operatorChars =
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002240 "++--*@/@%@+@-@<<>><=>=<@>@==!=&&||&@^@|@~@!@";
2241
Jack Paleviche7b59062009-05-19 17:12:17 -07002242const char Compiler::operatorLevel[] =
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002243 {11, 11, 1, 1, 1, 2, 2, 3, 3, 4, 4, 4, 4,
2244 5, 5, /* ==, != */
2245 9, 10, /* &&, || */
2246 6, 7, 8, /* & ^ | */
2247 2, 2 /* ~ ! */
2248 };
2249
#ifdef PROVIDE_ARM_CODEGEN
/* Storage for the ARM code generator's static disassembly output stream. */
FILE* Compiler::ARMCodeGenerator::disasmOut = 0;
#endif
Jack Palevicha6535612009-05-13 16:24:17 -07002253
#ifdef PROVIDE_X86_CODEGEN
/*
 * Per-operator constants for the x86 code generator, one entry per
 * operator in operatorChars order.
 * NOTE(review): the values look like packed x86 opcode bytes / condition
 * codes -- confirm against X86CodeGenerator's use of this table.
 */
const int Compiler::X86CodeGenerator::operatorHelper[] = {
    /* increment / decrement */
    0x1,        // ++
    0xff,       // --
    /* arithmetic */
    0xc1af0f,   // *
    0xf9f79991, // /
    0xf9f79991, // % (With manual assist to swap results)
    0xc801,     // +
    0xd8f7c829, // -
    /* shifts */
    0xe0d391,   // <<
    0xf8d391,   // >>
    /* comparisons */
    0xe,        // <=
    0xd,        // >=
    0xc,        // <
    0xf,        // >
    0x4,        // ==
    0x5,        // !=
    /* logical */
    0x0,        // &&
    0x1,        // ||
    /* bitwise */
    0xc821,     // &
    0xc831,     // ^
    0xc809,     // |
    /* unary */
    0xd0f7,     // ~
    0x4         // !
};
#endif
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002280
Jack Palevich1cdef202009-05-22 12:06:27 -07002281struct ACCscript {
2282 ACCscript() {
2283 text = 0;
2284 textLength = 0;
2285 accError = ACC_NO_ERROR;
2286 }
Jack Palevichbbf8ab52009-05-11 11:54:30 -07002287
Jack Palevich1cdef202009-05-22 12:06:27 -07002288 ~ACCscript() {
2289 delete text;
2290 }
Jack Palevich546b2242009-05-13 15:10:04 -07002291
Jack Palevich1cdef202009-05-22 12:06:27 -07002292 void setError(ACCenum error) {
2293 if (accError == ACC_NO_ERROR && error != ACC_NO_ERROR) {
2294 accError = error;
Jack Palevichbbf8ab52009-05-11 11:54:30 -07002295 }
2296 }
2297
Jack Palevich1cdef202009-05-22 12:06:27 -07002298 ACCenum getError() {
2299 ACCenum result = accError;
2300 accError = ACC_NO_ERROR;
Jack Palevich22305132009-05-13 10:58:45 -07002301 return result;
Jack Palevichbbf8ab52009-05-11 11:54:30 -07002302 }
2303
Jack Palevich1cdef202009-05-22 12:06:27 -07002304 Compiler compiler;
2305 char* text;
2306 int textLength;
2307 ACCenum accError;
2308};
2309
2310
2311extern "C"
2312ACCscript* accCreateScript() {
2313 return new ACCscript();
Jack Palevichbbf8ab52009-05-11 11:54:30 -07002314}
Jack Palevich1cdef202009-05-22 12:06:27 -07002315
2316extern "C"
2317ACCenum accGetError( ACCscript* script ) {
2318 return script->getError();
2319}
2320
2321extern "C"
2322void accDeleteScript(ACCscript* script) {
2323 delete script;
2324}
2325
2326extern "C"
2327void accScriptSource(ACCscript* script,
2328 ACCsizei count,
2329 const ACCchar ** string,
2330 const ACCint * length) {
2331 int totalLength = 0;
2332 for(int i = 0; i < count; i++) {
2333 int len = -1;
2334 const ACCchar* s = string[i];
2335 if (length) {
2336 len = length[i];
2337 }
2338 if (len < 0) {
2339 len = strlen(s);
2340 }
2341 totalLength += len;
2342 }
2343 delete script->text;
2344 char* text = new char[totalLength + 1];
2345 script->text = text;
2346 script->textLength = totalLength;
Jack Palevich09555c72009-05-27 12:25:55 -07002347 char* dest = text;
Jack Palevich1cdef202009-05-22 12:06:27 -07002348 for(int i = 0; i < count; i++) {
2349 int len = -1;
2350 const ACCchar* s = string[i];
2351 if (length) {
2352 len = length[i];
2353 }
2354 if (len < 0) {
2355 len = strlen(s);
2356 }
Jack Palevich09555c72009-05-27 12:25:55 -07002357 memcpy(dest, s, len);
2358 dest += len;
Jack Palevich1cdef202009-05-22 12:06:27 -07002359 }
2360 text[totalLength] = '\0';
2361}
2362
2363extern "C"
2364void accCompileScript(ACCscript* script) {
2365 int result = script->compiler.compile(script->text, script->textLength);
2366 if (result) {
2367 script->setError(ACC_INVALID_OPERATION);
2368 }
2369}
2370
2371extern "C"
2372void accGetScriptiv(ACCscript* script,
2373 ACCenum pname,
2374 ACCint * params) {
2375 switch (pname) {
2376 case ACC_INFO_LOG_LENGTH:
2377 *params = 0;
2378 break;
2379 }
2380}
2381
2382extern "C"
2383void accGetScriptInfoLog(ACCscript* script,
2384 ACCsizei maxLength,
2385 ACCsizei * length,
2386 ACCchar * infoLog) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07002387 char* message = script->compiler.getErrorMessage();
2388 int messageLength = strlen(message) + 1;
Jack Palevich1cdef202009-05-22 12:06:27 -07002389 if (length) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07002390 *length = messageLength;
Jack Palevich1cdef202009-05-22 12:06:27 -07002391 }
Jack Palevichac0e95e2009-05-29 13:53:44 -07002392 if (infoLog && maxLength > 0) {
2393 int trimmedLength = maxLength < messageLength ?
2394 maxLength : messageLength;
2395 memcpy(infoLog, message, trimmedLength);
2396 infoLog[trimmedLength] = 0;
Jack Palevich1cdef202009-05-22 12:06:27 -07002397 }
2398}
2399
2400extern "C"
2401void accGetScriptLabel(ACCscript* script, const ACCchar * name,
2402 ACCvoid ** address) {
2403 void* value = script->compiler.lookup(name);
2404 if (value) {
2405 *address = value;
2406 } else {
2407 script->setError(ACC_INVALID_VALUE);
2408 }
2409}
2410
Jack Palevicheedf9d22009-06-04 16:23:40 -07002411extern "C"
2412void accGetPragmas(ACCscript* script, ACCsizei* actualStringCount,
2413 ACCsizei maxStringCount, ACCchar** strings){
2414 script->compiler.getPragmas(actualStringCount, maxStringCount, strings);
2415}
2416
2417
Jack Palevich1cdef202009-05-22 12:06:27 -07002418} // namespace acc
2419