blob: 0d26a5cad350231faafdaa058c940596b8417bdf [file] [log] [blame]
Jack Palevichae54f1f2009-05-08 14:54:15 -07001/*
Jack Paleviche7b59062009-05-19 17:12:17 -07002 * Android "Almost" C Compiler.
3 * This is a compiler for a small subset of the C language, intended for use
4 * in scripting environments where speed and memory footprint are important.
5 *
6 * This code is based upon the "unobfuscated" version of the
Jack Palevich1cdef202009-05-22 12:06:27 -07007 * Obfuscated Tiny C compiler, see the file LICENSE for details.
Jack Paleviche7b59062009-05-19 17:12:17 -07008 *
9 */
10
Jack Palevich77ae76e2009-05-10 19:59:24 -070011#include <ctype.h>
12#include <dlfcn.h>
Jack Palevich8dc662e2009-06-09 22:53:47 +000013#include <errno.h>
Jack Paleviche27bf3e2009-05-10 14:09:03 -070014#include <stdarg.h>
Jack Palevich8b0624c2009-05-20 12:12:06 -070015#include <stdint.h>
Jack Palevichae54f1f2009-05-08 14:54:15 -070016#include <stdio.h>
Jack Palevichf6b5a532009-05-10 19:16:42 -070017#include <stdlib.h>
18#include <string.h>
Jack Palevich2d11dfb2009-06-08 14:34:26 -070019#include <cutils/hashmap.h>
Jack Palevichae54f1f2009-05-08 14:54:15 -070020
Jack Palevich8dc662e2009-06-09 22:53:47 +000021#if defined(__i386__)
22#include <sys/mman.h>
23#endif
24
Jack Palevich546b2242009-05-13 15:10:04 -070025#if defined(__arm__)
26#include <unistd.h>
27#endif
28
Jack Paleviche7b59062009-05-19 17:12:17 -070029#if defined(__arm__)
30#define DEFAULT_ARM_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -070031#define PROVIDE_ARM_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -070032#elif defined(__i386__)
33#define DEFAULT_X86_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -070034#define PROVIDE_X86_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -070035#elif defined(__x86_64__)
36#define DEFAULT_X64_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -070037#define PROVIDE_X64_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -070038#endif
39
Jack Paleviche7b59062009-05-19 17:12:17 -070040
41#ifdef PROVIDE_ARM_CODEGEN
Jack Palevicha6535612009-05-13 16:24:17 -070042#include "disassem.h"
Jack Paleviche7b59062009-05-19 17:12:17 -070043#endif
Jack Palevicha6535612009-05-13 16:24:17 -070044
Jack Palevich1cdef202009-05-22 12:06:27 -070045#include <acc/acc.h>
46
Jack Palevich09555c72009-05-27 12:25:55 -070047#define LOG_API(...) do {} while(0)
48// #define LOG_API(...) fprintf (stderr, __VA_ARGS__)
Jack Palevich09555c72009-05-27 12:25:55 -070049
-b master422972c2009-06-17 19:13:52 -070050#define LOG_STACK(...) do {} while(0)
51// #define LOG_STACK(...) fprintf (stderr, __VA_ARGS__)
52
53// #define ENABLE_ARM_DISASSEMBLY
Jack Palevichb67b18f2009-06-11 21:12:23 -070054// #define PROVIDE_TRACE_CODEGEN
55
Jack Palevichbbf8ab52009-05-11 11:54:30 -070056namespace acc {
57
/*
 * Abstract destination for diagnostic messages.
 *
 * Callers report problems with the printf-style error(); implementations
 * supply verror() to decide what happens to the formatted message.
 */
class ErrorSink {
public:
    /* Virtual so that an implementation can be destroyed safely through
     * an ErrorSink pointer.
     */
    virtual ~ErrorSink() {}

    /* Report an error.
     * fmt is a printf-style format string, followed by its arguments.
     * The arguments are packaged into a va_list and forwarded to verror().
     */
    void error(const char *fmt, ...) {
        va_list ap;
        va_start(ap, fmt);
        verror(fmt, ap);
        va_end(ap);
    }

    /* Receive an error report.
     * fmt is a printf-style format string, ap holds its arguments.
     */
    virtual void verror(const char* fmt, va_list ap) = 0;
};
69
70class Compiler : public ErrorSink {
Jack Palevich21a15a22009-05-11 14:49:29 -070071 class CodeBuf {
Jack Palevich653f42d2009-05-28 17:15:32 -070072 char* ind; // Output code pointer
Jack Palevich21a15a22009-05-11 14:49:29 -070073 char* pProgramBase;
Jack Palevichac0e95e2009-05-29 13:53:44 -070074 ErrorSink* mErrorSink;
75 int mSize;
Jack Palevich0a280a02009-06-11 10:53:51 -070076 bool mOverflowed;
Jack Palevichf0cbc922009-05-08 16:35:13 -070077
Jack Palevich21a15a22009-05-11 14:49:29 -070078 void release() {
79 if (pProgramBase != 0) {
80 free(pProgramBase);
81 pProgramBase = 0;
Jack Palevichae54f1f2009-05-08 14:54:15 -070082 }
Jack Palevich21a15a22009-05-11 14:49:29 -070083 }
84
Jack Palevich0a280a02009-06-11 10:53:51 -070085 bool check(int n) {
Jack Palevichac0e95e2009-05-29 13:53:44 -070086 int newSize = ind - pProgramBase + n;
Jack Palevich0a280a02009-06-11 10:53:51 -070087 bool overflow = newSize > mSize;
88 if (overflow && !mOverflowed) {
89 mOverflowed = true;
Jack Palevichac0e95e2009-05-29 13:53:44 -070090 if (mErrorSink) {
91 mErrorSink->error("Code too large: %d bytes", newSize);
92 }
93 }
Jack Palevich0a280a02009-06-11 10:53:51 -070094 return overflow;
Jack Palevichac0e95e2009-05-29 13:53:44 -070095 }
96
Jack Palevich21a15a22009-05-11 14:49:29 -070097 public:
98 CodeBuf() {
99 pProgramBase = 0;
100 ind = 0;
Jack Palevichac0e95e2009-05-29 13:53:44 -0700101 mErrorSink = 0;
102 mSize = 0;
Jack Palevich0a280a02009-06-11 10:53:51 -0700103 mOverflowed = false;
Jack Palevich21a15a22009-05-11 14:49:29 -0700104 }
105
106 ~CodeBuf() {
107 release();
108 }
109
110 void init(int size) {
111 release();
Jack Palevichac0e95e2009-05-29 13:53:44 -0700112 mSize = size;
Jack Palevich21a15a22009-05-11 14:49:29 -0700113 pProgramBase = (char*) calloc(1, size);
114 ind = pProgramBase;
115 }
116
Jack Palevichac0e95e2009-05-29 13:53:44 -0700117 void setErrorSink(ErrorSink* pErrorSink) {
118 mErrorSink = pErrorSink;
119 }
120
Jack Palevich546b2242009-05-13 15:10:04 -0700121 int o4(int n) {
Jack Palevich0a280a02009-06-11 10:53:51 -0700122 if(check(4)) {
123 return 0;
124 }
Jack Palevich8b0624c2009-05-20 12:12:06 -0700125 intptr_t result = (intptr_t) ind;
Jack Palevich546b2242009-05-13 15:10:04 -0700126 * (int*) ind = n;
127 ind += 4;
128 return result;
129 }
130
Jack Palevich21a15a22009-05-11 14:49:29 -0700131 /*
132 * Output a byte. Handles all values, 0..ff.
133 */
134 void ob(int n) {
Jack Palevich0a280a02009-06-11 10:53:51 -0700135 if(check(1)) {
136 return;
137 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700138 *ind++ = n;
139 }
140
Jack Palevich21a15a22009-05-11 14:49:29 -0700141 inline void* getBase() {
142 return (void*) pProgramBase;
143 }
144
Jack Palevich8b0624c2009-05-20 12:12:06 -0700145 intptr_t getSize() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700146 return ind - pProgramBase;
147 }
148
Jack Palevich8b0624c2009-05-20 12:12:06 -0700149 intptr_t getPC() {
150 return (intptr_t) ind;
Jack Palevich21a15a22009-05-11 14:49:29 -0700151 }
152 };
153
Jack Palevich1cdef202009-05-22 12:06:27 -0700154 /**
155 * A code generator creates an in-memory program, generating the code on
156 * the fly. There is one code generator implementation for each supported
157 * architecture.
158 *
159 * The code generator implements the following abstract machine:
160 * R0 - the main accumulator.
161 * R1 - the secondary accumulator.
162 * FP - a frame pointer for accessing function arguments and local
163 * variables.
164 * SP - a stack pointer for storing intermediate results while evaluating
165 * expressions. The stack pointer grows downwards.
166 *
167 * The function calling convention is that all arguments are placed on the
168 * stack such that the first argument has the lowest address.
169 * After the call, the result is in R0. The caller is responsible for
170 * removing the arguments from the stack.
171 * The R0 and R1 registers are not saved across function calls. The
172 * FP and SP registers are saved.
173 */
174
Jack Palevich21a15a22009-05-11 14:49:29 -0700175 class CodeGenerator {
176 public:
Jack Palevichac0e95e2009-05-29 13:53:44 -0700177 CodeGenerator() {
178 mErrorSink = 0;
179 pCodeBuf = 0;
180 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700181 virtual ~CodeGenerator() {}
182
Jack Palevich22305132009-05-13 10:58:45 -0700183 virtual void init(CodeBuf* pCodeBuf) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700184 this->pCodeBuf = pCodeBuf;
Jack Palevichac0e95e2009-05-29 13:53:44 -0700185 pCodeBuf->setErrorSink(mErrorSink);
186 }
187
Jack Palevichb67b18f2009-06-11 21:12:23 -0700188 virtual void setErrorSink(ErrorSink* pErrorSink) {
Jack Palevichac0e95e2009-05-29 13:53:44 -0700189 mErrorSink = pErrorSink;
190 if (pCodeBuf) {
191 pCodeBuf->setErrorSink(mErrorSink);
192 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700193 }
194
Jack Palevich1cdef202009-05-22 12:06:27 -0700195 /* Emit a function prolog.
196 * argCount is the number of arguments.
197 * Save the old value of the FP.
198 * Set the new value of the FP.
199 * Convert from the native platform calling convention to
200 * our stack-based calling convention. This may require
201 * pushing arguments from registers to the stack.
202 * Allocate "N" bytes of stack space. N isn't known yet, so
203 * just emit the instructions for adjusting the stack, and return
204 * the address to patch up. The patching will be done in
205 * functionExit().
206 * returns address to patch with local variable size.
Jack Palevich22305132009-05-13 10:58:45 -0700207 */
Jack Palevich546b2242009-05-13 15:10:04 -0700208 virtual int functionEntry(int argCount) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700209
Jack Palevich1cdef202009-05-22 12:06:27 -0700210 /* Emit a function epilog.
211 * Restore the old SP and FP register values.
212 * Return to the calling function.
213 * argCount - the number of arguments to the function.
214 * localVariableAddress - returned from functionEntry()
215 * localVariableSize - the size in bytes of the local variables.
216 */
217 virtual void functionExit(int argCount, int localVariableAddress,
218 int localVariableSize) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700219
Jack Palevich1cdef202009-05-22 12:06:27 -0700220 /* load immediate value to R0 */
Jack Palevich546b2242009-05-13 15:10:04 -0700221 virtual void li(int t) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700222
Jack Palevich1cdef202009-05-22 12:06:27 -0700223 /* Jump to a target, and return the address of the word that
224 * holds the target data, in case it needs to be fixed up later.
225 */
Jack Palevich22305132009-05-13 10:58:45 -0700226 virtual int gjmp(int t) = 0;
227
Jack Palevich1cdef202009-05-22 12:06:27 -0700228 /* Test R0 and jump to a target if the test succeeds.
229 * l = 0: je, l == 1: jne
230 * Return the address of the word that holds the targed data, in
231 * case it needs to be fixed up later.
232 */
Jack Palevich22305132009-05-13 10:58:45 -0700233 virtual int gtst(bool l, int t) = 0;
234
Jack Palevich1cdef202009-05-22 12:06:27 -0700235 /* Compare R1 against R0, and store the boolean result in R0.
236 * op specifies the comparison.
237 */
Jack Palevich22305132009-05-13 10:58:45 -0700238 virtual void gcmp(int op) = 0;
239
Jack Palevich1cdef202009-05-22 12:06:27 -0700240 /* Perform the arithmetic op specified by op. R1 is the
241 * left argument, R0 is the right argument.
242 */
Jack Palevich546b2242009-05-13 15:10:04 -0700243 virtual void genOp(int op) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700244
Jack Palevich1cdef202009-05-22 12:06:27 -0700245 /* Set R1 to 0.
246 */
247 virtual void clearR1() = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700248
Jack Palevich1cdef202009-05-22 12:06:27 -0700249 /* Push R0 onto the stack.
250 */
251 virtual void pushR0() = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700252
Jack Palevich1cdef202009-05-22 12:06:27 -0700253 /* Pop R1 off of the stack.
254 */
255 virtual void popR1() = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700256
Jack Palevich1cdef202009-05-22 12:06:27 -0700257 /* Store R0 to the address stored in R1.
258 * isInt is true if a whole 4-byte integer value
259 * should be stored, otherwise a 1-byte character
260 * value should be stored.
261 */
262 virtual void storeR0ToR1(bool isInt) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700263
Jack Palevich1cdef202009-05-22 12:06:27 -0700264 /* Load R0 from the address stored in R0.
265 * isInt is true if a whole 4-byte integer value
266 * should be loaded, otherwise a 1-byte character
267 * value should be loaded.
268 */
269 virtual void loadR0FromR0(bool isInt) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700270
Jack Palevich1cdef202009-05-22 12:06:27 -0700271 /* Load the absolute address of a variable to R0.
272 * If ea <= LOCAL, then this is a local variable, or an
273 * argument, addressed relative to FP.
274 * else it is an absolute global address.
275 */
276 virtual void leaR0(int ea) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700277
Jack Palevich1cdef202009-05-22 12:06:27 -0700278 /* Store R0 to a variable.
279 * If ea <= LOCAL, then this is a local variable, or an
280 * argument, addressed relative to FP.
281 * else it is an absolute global address.
282 */
283 virtual void storeR0(int ea) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700284
Jack Palevich1cdef202009-05-22 12:06:27 -0700285 /* load R0 from a variable.
286 * If ea <= LOCAL, then this is a local variable, or an
287 * argument, addressed relative to FP.
288 * else it is an absolute global address.
289 * If isIncDec is true, then the stored variable's value
290 * should be post-incremented or post-decremented, based
291 * on the value of op.
292 */
293 virtual void loadR0(int ea, bool isIncDec, int op) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700294
Jack Palevich1cdef202009-05-22 12:06:27 -0700295 /* Emit code to adjust the stack for a function call. Return the
296 * label for the address of the instruction that adjusts the
297 * stack size. This will be passed as argument "a" to
298 * endFunctionCallArguments.
299 */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700300 virtual int beginFunctionCallArguments() = 0;
301
Jack Palevich1cdef202009-05-22 12:06:27 -0700302 /* Emit code to store R0 to the stack at byte offset l.
303 */
304 virtual void storeR0ToArg(int l) = 0;
Jack Palevich7810bc92009-05-15 14:31:47 -0700305
Jack Palevich1cdef202009-05-22 12:06:27 -0700306 /* Patch the function call preamble.
307 * a is the address returned from beginFunctionCallArguments
308 * l is the number of bytes the arguments took on the stack.
309 * Typically you would also emit code to convert the argument
310 * list into whatever the native function calling convention is.
311 * On ARM for example you would pop the first 5 arguments into
312 * R0..R4
313 */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700314 virtual void endFunctionCallArguments(int a, int l) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700315
Jack Palevich1cdef202009-05-22 12:06:27 -0700316 /* Emit a call to an unknown function. The argument "symbol" needs to
317 * be stored in the location where the address should go. It forms
318 * a chain. The address will be patched later.
319 * Return the address of the word that has to be patched.
320 */
Jack Palevich22305132009-05-13 10:58:45 -0700321 virtual int callForward(int symbol) = 0;
322
Jack Palevich1cdef202009-05-22 12:06:27 -0700323 /* Call a function using PC-relative addressing. t is the PC-relative
324 * address of the function. It has already been adjusted for the
325 * architectural jump offset, so just store it as-is.
326 */
Jack Palevich22305132009-05-13 10:58:45 -0700327 virtual void callRelative(int t) = 0;
328
Jack Palevich1cdef202009-05-22 12:06:27 -0700329 /* Call a function pointer. L is the number of bytes the arguments
330 * take on the stack. The address of the function is stored at
331 * location SP + l.
332 */
Jack Palevich22305132009-05-13 10:58:45 -0700333 virtual void callIndirect(int l) = 0;
334
Jack Palevich1cdef202009-05-22 12:06:27 -0700335 /* Adjust SP after returning from a function call. l is the
336 * number of bytes of arguments stored on the stack. isIndirect
337 * is true if this was an indirect call. (In which case the
338 * address of the function is stored at location SP + l.)
339 */
Jack Palevich7810bc92009-05-15 14:31:47 -0700340 virtual void adjustStackAfterCall(int l, bool isIndirect) = 0;
Jack Palevich22305132009-05-13 10:58:45 -0700341
Jack Palevich1cdef202009-05-22 12:06:27 -0700342 /* Print a disassembly of the assembled code to out. Return
343 * non-zero if there is an error.
344 */
Jack Palevicha6535612009-05-13 16:24:17 -0700345 virtual int disassemble(FILE* out) = 0;
346
Jack Palevich1cdef202009-05-22 12:06:27 -0700347 /* Generate a symbol at the current PC. t is the head of a
348 * linked list of addresses to patch.
349 */
Jack Paleviche7b59062009-05-19 17:12:17 -0700350 virtual void gsym(int t) = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -0700351
Jack Palevich1cdef202009-05-22 12:06:27 -0700352 /*
353 * Do any cleanup work required at the end of a compile.
354 * For example, an instruction cache might need to be
355 * invalidated.
356 * Return non-zero if there is an error.
357 */
358 virtual int finishCompile() = 0;
Jack Palevich546b2242009-05-13 15:10:04 -0700359
Jack Palevicha6535612009-05-13 16:24:17 -0700360 /**
361 * Adjust relative branches by this amount.
362 */
363 virtual int jumpOffset() = 0;
364
Jack Palevich21a15a22009-05-11 14:49:29 -0700365 protected:
Jack Palevich21a15a22009-05-11 14:49:29 -0700366 /*
367 * Output a byte. Handles all values, 0..ff.
368 */
369 void ob(int n) {
370 pCodeBuf->ob(n);
371 }
372
Jack Palevich8b0624c2009-05-20 12:12:06 -0700373 intptr_t o4(int data) {
Jack Paleviche7b59062009-05-19 17:12:17 -0700374 return pCodeBuf->o4(data);
Jack Palevich21a15a22009-05-11 14:49:29 -0700375 }
376
Jack Palevich8b0624c2009-05-20 12:12:06 -0700377 intptr_t getBase() {
378 return (intptr_t) pCodeBuf->getBase();
Jack Palevicha6535612009-05-13 16:24:17 -0700379 }
380
Jack Palevich8b0624c2009-05-20 12:12:06 -0700381 intptr_t getPC() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700382 return pCodeBuf->getPC();
383 }
Jack Palevich1cdef202009-05-22 12:06:27 -0700384
385 intptr_t getSize() {
386 return pCodeBuf->getSize();
387 }
Jack Palevichac0e95e2009-05-29 13:53:44 -0700388
389 void error(const char* fmt,...) {
390 va_list ap;
391 va_start(ap, fmt);
392 mErrorSink->verror(fmt, ap);
393 va_end(ap);
394 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700395 private:
396 CodeBuf* pCodeBuf;
Jack Palevichac0e95e2009-05-29 13:53:44 -0700397 ErrorSink* mErrorSink;
Jack Palevich21a15a22009-05-11 14:49:29 -0700398 };
399
Jack Paleviche7b59062009-05-19 17:12:17 -0700400#ifdef PROVIDE_ARM_CODEGEN
401
Jack Palevich22305132009-05-13 10:58:45 -0700402 class ARMCodeGenerator : public CodeGenerator {
403 public:
404 ARMCodeGenerator() {}
-b master422972c2009-06-17 19:13:52 -0700405
Jack Palevich22305132009-05-13 10:58:45 -0700406 virtual ~ARMCodeGenerator() {}
407
408 /* returns address to patch with local variable size
409 */
Jack Palevich546b2242009-05-13 15:10:04 -0700410 virtual int functionEntry(int argCount) {
Jack Palevichb7c81e92009-06-04 19:56:13 -0700411 LOG_API("functionEntry(%d);\n", argCount);
-b master422972c2009-06-17 19:13:52 -0700412 mStackUse = 0;
Jack Palevich69796b62009-05-14 15:42:26 -0700413 // sp -> arg4 arg5 ...
414 // Push our register-based arguments back on the stack
415 if (argCount > 0) {
416 int regArgCount = argCount <= 4 ? argCount : 4;
417 o4(0xE92D0000 | ((1 << argCount) - 1)); // stmfd sp!, {}
-b master422972c2009-06-17 19:13:52 -0700418 mStackUse += regArgCount * 4;
Jack Palevich69796b62009-05-14 15:42:26 -0700419 }
420 // sp -> arg0 arg1 ...
421 o4(0xE92D4800); // stmfd sp!, {fp, lr}
-b master422972c2009-06-17 19:13:52 -0700422 mStackUse += 2 * 4;
Jack Palevich69796b62009-05-14 15:42:26 -0700423 // sp, fp -> oldfp, retadr, arg0 arg1 ....
424 o4(0xE1A0B00D); // mov fp, sp
-b master422972c2009-06-17 19:13:52 -0700425 LOG_STACK("functionEntry: %d\n", mStackUse);
Jack Palevich69796b62009-05-14 15:42:26 -0700426 return o4(0xE24DD000); // sub sp, sp, # <local variables>
-b master422972c2009-06-17 19:13:52 -0700427 // We don't know how many local variables we are going to use,
428 // but we will round the allocation up to a multiple of
429 // STACK_ALIGNMENT, so it won't affect the stack alignment.
Jack Palevich22305132009-05-13 10:58:45 -0700430 }
431
Jack Palevich546b2242009-05-13 15:10:04 -0700432 virtual void functionExit(int argCount, int localVariableAddress, int localVariableSize) {
Jack Palevich09555c72009-05-27 12:25:55 -0700433 LOG_API("functionExit(%d, %d, %d);\n", argCount, localVariableAddress, localVariableSize);
-b master422972c2009-06-17 19:13:52 -0700434 // Round local variable size up to a multiple of stack alignment
435 localVariableSize = ((localVariableSize + STACK_ALIGNMENT - 1) /
436 STACK_ALIGNMENT) * STACK_ALIGNMENT;
Jack Palevich69796b62009-05-14 15:42:26 -0700437 // Patch local variable allocation code:
438 if (localVariableSize < 0 || localVariableSize > 255) {
Jack Palevich8de461d2009-05-14 17:21:45 -0700439 error("localVariables out of range: %d", localVariableSize);
Jack Palevich546b2242009-05-13 15:10:04 -0700440 }
Jack Palevich69796b62009-05-14 15:42:26 -0700441 *(char*) (localVariableAddress) = localVariableSize;
442
443 // sp -> locals .... fp -> oldfp, retadr, arg0, arg1, ...
444 o4(0xE1A0E00B); // mov lr, fp
445 o4(0xE59BB000); // ldr fp, [fp]
446 o4(0xE28ED004); // add sp, lr, #4
447 // sp -> retadr, arg0, ...
448 o4(0xE8BD4000); // ldmfd sp!, {lr}
449 // sp -> arg0 ....
450 if (argCount > 0) {
451 // We store the PC into the lr so we can adjust the sp before
Jack Palevich8de461d2009-05-14 17:21:45 -0700452 // returning. We need to pull off the registers we pushed
Jack Palevich69796b62009-05-14 15:42:26 -0700453 // earlier. We don't need to actually store them anywhere,
454 // just adjust the stack.
455 int regArgCount = argCount <= 4 ? argCount : 4;
456 o4(0xE28DD000 | (regArgCount << 2)); // add sp, sp, #argCount << 2
457 }
458 o4(0xE12FFF1E); // bx lr
Jack Palevich22305132009-05-13 10:58:45 -0700459 }
460
461 /* load immediate value */
Jack Palevich546b2242009-05-13 15:10:04 -0700462 virtual void li(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700463 LOG_API("li(%d);\n", t);
Jack Palevicha6535612009-05-13 16:24:17 -0700464 if (t >= 0 && t < 255) {
Jack Palevich69796b62009-05-14 15:42:26 -0700465 o4(0xE3A00000 + t); // mov r0, #0
Jack Palevicha6535612009-05-13 16:24:17 -0700466 } else if (t >= -256 && t < 0) {
467 // mvn means move constant ^ ~0
Jack Palevich69796b62009-05-14 15:42:26 -0700468 o4(0xE3E00001 - t); // mvn r0, #0
Jack Palevicha6535612009-05-13 16:24:17 -0700469 } else {
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700470 o4(0xE51F0000); // ldr r0, .L3
471 o4(0xEA000000); // b .L99
472 o4(t); // .L3: .word 0
473 // .L99:
Jack Palevicha6535612009-05-13 16:24:17 -0700474 }
Jack Palevich22305132009-05-13 10:58:45 -0700475 }
476
477 virtual int gjmp(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700478 LOG_API("gjmp(%d);\n", t);
Jack Palevich8de461d2009-05-14 17:21:45 -0700479 return o4(0xEA000000 | encodeAddress(t)); // b .L33
Jack Palevich22305132009-05-13 10:58:45 -0700480 }
481
482 /* l = 0: je, l == 1: jne */
483 virtual int gtst(bool l, int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700484 LOG_API("gtst(%d, %d);\n", l, t);
Jack Palevich8de461d2009-05-14 17:21:45 -0700485 o4(0xE3500000); // cmp r0,#0
486 int branch = l ? 0x1A000000 : 0x0A000000; // bne : beq
487 return o4(branch | encodeAddress(t));
Jack Palevich22305132009-05-13 10:58:45 -0700488 }
489
490 virtual void gcmp(int op) {
Jack Palevich09555c72009-05-27 12:25:55 -0700491 LOG_API("gcmp(%d);\n", op);
Jack Palevich8de461d2009-05-14 17:21:45 -0700492 o4(0xE1510000); // cmp r1, r1
493 switch(op) {
494 case OP_EQUALS:
495 o4(0x03A00001); // moveq r0,#1
496 o4(0x13A00000); // movne r0,#0
497 break;
498 case OP_NOT_EQUALS:
499 o4(0x03A00000); // moveq r0,#0
500 o4(0x13A00001); // movne r0,#1
501 break;
502 case OP_LESS_EQUAL:
503 o4(0xD3A00001); // movle r0,#1
504 o4(0xC3A00000); // movgt r0,#0
505 break;
506 case OP_GREATER:
507 o4(0xD3A00000); // movle r0,#0
508 o4(0xC3A00001); // movgt r0,#1
509 break;
510 case OP_GREATER_EQUAL:
511 o4(0xA3A00001); // movge r0,#1
512 o4(0xB3A00000); // movlt r0,#0
513 break;
514 case OP_LESS:
515 o4(0xA3A00000); // movge r0,#0
516 o4(0xB3A00001); // movlt r0,#1
517 break;
518 default:
519 error("Unknown comparison op %d", op);
520 break;
521 }
Jack Palevich22305132009-05-13 10:58:45 -0700522 }
523
Jack Palevich546b2242009-05-13 15:10:04 -0700524 virtual void genOp(int op) {
Jack Palevich09555c72009-05-27 12:25:55 -0700525 LOG_API("genOp(%d);\n", op);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700526 switch(op) {
527 case OP_MUL:
528 o4(0x0E0000091); // mul r0,r1,r0
529 break;
Jack Palevich3d474a72009-05-15 15:12:38 -0700530 case OP_DIV:
531 callRuntime(runtime_DIV);
532 break;
533 case OP_MOD:
534 callRuntime(runtime_MOD);
535 break;
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700536 case OP_PLUS:
537 o4(0xE0810000); // add r0,r1,r0
538 break;
539 case OP_MINUS:
540 o4(0xE0410000); // sub r0,r1,r0
541 break;
542 case OP_SHIFT_LEFT:
543 o4(0xE1A00011); // lsl r0,r1,r0
544 break;
545 case OP_SHIFT_RIGHT:
546 o4(0xE1A00051); // asr r0,r1,r0
547 break;
548 case OP_BIT_AND:
549 o4(0xE0010000); // and r0,r1,r0
550 break;
551 case OP_BIT_XOR:
552 o4(0xE0210000); // eor r0,r1,r0
553 break;
554 case OP_BIT_OR:
555 o4(0xE1810000); // orr r0,r1,r0
556 break;
557 case OP_BIT_NOT:
558 o4(0xE1E00000); // mvn r0, r0
559 break;
560 default:
Jack Palevich69796b62009-05-14 15:42:26 -0700561 error("Unimplemented op %d\n", op);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700562 break;
563 }
Jack Palevich22305132009-05-13 10:58:45 -0700564 }
565
Jack Palevich1cdef202009-05-22 12:06:27 -0700566 virtual void clearR1() {
Jack Palevich09555c72009-05-27 12:25:55 -0700567 LOG_API("clearR1();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700568 o4(0xE3A01000); // mov r1, #0
Jack Palevich22305132009-05-13 10:58:45 -0700569 }
570
Jack Palevich1cdef202009-05-22 12:06:27 -0700571 virtual void pushR0() {
Jack Palevich09555c72009-05-27 12:25:55 -0700572 LOG_API("pushR0();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700573 o4(0xE92D0001); // stmfd sp!,{r0}
-b master422972c2009-06-17 19:13:52 -0700574 mStackUse += 4;
575 LOG_STACK("pushR0: %d\n", mStackUse);
Jack Palevich22305132009-05-13 10:58:45 -0700576 }
577
Jack Palevich1cdef202009-05-22 12:06:27 -0700578 virtual void popR1() {
Jack Palevich09555c72009-05-27 12:25:55 -0700579 LOG_API("popR1();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700580 o4(0xE8BD0002); // ldmfd sp!,{r1}
-b master422972c2009-06-17 19:13:52 -0700581 mStackUse -= 4;
582 LOG_STACK("popR1: %d\n", mStackUse);
Jack Palevich22305132009-05-13 10:58:45 -0700583 }
584
Jack Palevich1cdef202009-05-22 12:06:27 -0700585 virtual void storeR0ToR1(bool isInt) {
Jack Palevich09555c72009-05-27 12:25:55 -0700586 LOG_API("storeR0ToR1(%d);\n", isInt);
Jack Palevichbd894902009-05-14 19:35:31 -0700587 if (isInt) {
588 o4(0xE5810000); // str r0, [r1]
589 } else {
590 o4(0xE5C10000); // strb r0, [r1]
591 }
Jack Palevich22305132009-05-13 10:58:45 -0700592 }
593
Jack Palevich1cdef202009-05-22 12:06:27 -0700594 virtual void loadR0FromR0(bool isInt) {
Jack Palevich09555c72009-05-27 12:25:55 -0700595 LOG_API("loadR0FromR0(%d);\n", isInt);
Jack Palevich22305132009-05-13 10:58:45 -0700596 if (isInt)
Jack Palevich69796b62009-05-14 15:42:26 -0700597 o4(0xE5900000); // ldr r0, [r0]
Jack Palevich22305132009-05-13 10:58:45 -0700598 else
Jack Palevich69796b62009-05-14 15:42:26 -0700599 o4(0xE5D00000); // ldrb r0, [r0]
Jack Palevich22305132009-05-13 10:58:45 -0700600 }
601
Jack Palevich1cdef202009-05-22 12:06:27 -0700602 virtual void leaR0(int ea) {
Jack Palevich09555c72009-05-27 12:25:55 -0700603 LOG_API("leaR0(%d);\n", ea);
Jack Palevich4d93f302009-05-15 13:30:00 -0700604 if (ea < LOCAL) {
605 // Local, fp relative
606 if (ea < -1023 || ea > 1023 || ((ea & 3) != 0)) {
607 error("Offset out of range: %08x", ea);
608 }
609 if (ea < 0) {
610 o4(0xE24B0F00 | (0xff & ((-ea) >> 2))); // sub r0, fp, #ea
611 } else {
612 o4(0xE28B0F00 | (0xff & (ea >> 2))); // add r0, fp, #ea
613 }
Jack Palevichbd894902009-05-14 19:35:31 -0700614 } else {
Jack Palevich4d93f302009-05-15 13:30:00 -0700615 // Global, absolute.
616 o4(0xE59F0000); // ldr r0, .L1
617 o4(0xEA000000); // b .L99
618 o4(ea); // .L1: .word 0
619 // .L99:
Jack Palevichbd894902009-05-14 19:35:31 -0700620 }
Jack Palevich22305132009-05-13 10:58:45 -0700621 }
622
Jack Palevich1cdef202009-05-22 12:06:27 -0700623 virtual void storeR0(int ea) {
Jack Palevich09555c72009-05-27 12:25:55 -0700624 LOG_API("storeR0(%d);\n", ea);
Jack Palevich4d93f302009-05-15 13:30:00 -0700625 if (ea < LOCAL) {
626 // Local, fp relative
627 if (ea < -4095 || ea > 4095) {
628 error("Offset out of range: %08x", ea);
629 }
630 if (ea < 0) {
631 o4(0xE50B0000 | (0xfff & (-ea))); // str r0, [fp,#-ea]
632 } else {
633 o4(0xE58B0000 | (0xfff & ea)); // str r0, [fp,#ea]
634 }
635 } else{
636 // Global, absolute
637 o4(0xE59F1000); // ldr r1, .L1
638 o4(0xEA000000); // b .L99
639 o4(ea); // .L1: .word 0
640 o4(0xE5810000); // .L99: str r0, [r1]
Jack Palevich69796b62009-05-14 15:42:26 -0700641 }
Jack Palevich22305132009-05-13 10:58:45 -0700642 }
643
Jack Palevich1cdef202009-05-22 12:06:27 -0700644 virtual void loadR0(int ea, bool isIncDec, int op) {
Jack Palevich09555c72009-05-27 12:25:55 -0700645 LOG_API("loadR0(%d, %d, %d);\n", ea, isIncDec, op);
Jack Palevich4d93f302009-05-15 13:30:00 -0700646 if (ea < LOCAL) {
647 // Local, fp relative
648 if (ea < -4095 || ea > 4095) {
649 error("Offset out of range: %08x", ea);
650 }
651 if (ea < 0) {
652 o4(0xE51B0000 | (0xfff & (-ea))); // ldr r0, [fp,#-ea]
653 } else {
654 o4(0xE59B0000 | (0xfff & ea)); // ldr r0, [fp,#ea]
655 }
Jack Palevich69796b62009-05-14 15:42:26 -0700656 } else {
Jack Palevich4d93f302009-05-15 13:30:00 -0700657 // Global, absolute
658 o4(0xE59F2000); // ldr r2, .L1
659 o4(0xEA000000); // b .L99
660 o4(ea); // .L1: .word ea
661 o4(0xE5920000); // .L99: ldr r0, [r2]
Jack Palevich69796b62009-05-14 15:42:26 -0700662 }
Jack Palevich22305132009-05-13 10:58:45 -0700663
Jack Palevich4d93f302009-05-15 13:30:00 -0700664 if (isIncDec) {
665 switch (op) {
666 case OP_INCREMENT:
667 o4(0xE2801001); // add r1, r0, #1
668 break;
669 case OP_DECREMENT:
670 o4(0xE2401001); // sub r1, r0, #1
671 break;
672 default:
673 error("unknown opcode: %d", op);
674 }
675 if (ea < LOCAL) {
676 // Local, fp relative
677 // Don't need range check, was already checked above
678 if (ea < 0) {
679 o4(0xE50B1000 | (0xfff & (-ea))); // str r1, [fp,#-ea]
680 } else {
681 o4(0xE58B1000 | (0xfff & ea)); // str r1, [fp,#ea]
682 }
683 } else{
684 // Global, absolute
685 // r2 is already set up from before.
686 o4(0xE5821000); // str r1, [r2]
687 }
Jack Palevichbd894902009-05-14 19:35:31 -0700688 }
Jack Palevich22305132009-05-13 10:58:45 -0700689 }
690
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700691 virtual int beginFunctionCallArguments() {
Jack Palevich09555c72009-05-27 12:25:55 -0700692 LOG_API("beginFunctionCallArguments();\n");
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700693 return o4(0xE24DDF00); // Placeholder
694 }
695
Jack Palevich1cdef202009-05-22 12:06:27 -0700696 virtual void storeR0ToArg(int l) {
Jack Palevich09555c72009-05-27 12:25:55 -0700697 LOG_API("storeR0ToArg(%d);\n", l);
Jack Palevich7810bc92009-05-15 14:31:47 -0700698 if (l < 0 || l > 4096-4) {
699 error("l out of range for stack offset: 0x%08x", l);
700 }
701 o4(0xE58D0000 + l); // str r0, [sp, #4]
702 }
703
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700704 virtual void endFunctionCallArguments(int a, int l) {
Jack Palevich09555c72009-05-27 12:25:55 -0700705 LOG_API("endFunctionCallArguments(0x%08x, %d);\n", a, l);
-b master422972c2009-06-17 19:13:52 -0700706 int argCount = l >> 2;
707 int argumentStackUse = l;
708 if (argCount > 0) {
709 int regArgCount = argCount > 4 ? 4 : argCount;
710 argumentStackUse -= regArgCount * 4;
711 o4(0xE8BD0000 | ((1 << regArgCount) - 1)); // ldmfd sp!,{}
712 }
713 mStackUse += argumentStackUse;
714
715 // Align stack.
716 int missalignment = mStackUse - ((mStackUse / STACK_ALIGNMENT)
717 * STACK_ALIGNMENT);
718 mStackAlignmentAdjustment = 0;
719 if (missalignment > 0) {
720 mStackAlignmentAdjustment = STACK_ALIGNMENT - missalignment;
721 }
722 l += mStackAlignmentAdjustment;
723
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700724 if (l < 0 || l > 0x3FC) {
725 error("L out of range for stack adjustment: 0x%08x", l);
726 }
727 * (int*) a = 0xE24DDF00 | (l >> 2); // sub sp, sp, #0 << 2
-b master422972c2009-06-17 19:13:52 -0700728 mStackUse += mStackAlignmentAdjustment;
729 LOG_STACK("endFunctionCallArguments mStackUse: %d, mStackAlignmentAdjustment %d\n",
730 mStackUse, mStackAlignmentAdjustment);
Jack Palevich22305132009-05-13 10:58:45 -0700731 }
732
Jack Palevich22305132009-05-13 10:58:45 -0700733 virtual int callForward(int symbol) {
Jack Palevich09555c72009-05-27 12:25:55 -0700734 LOG_API("callForward(%d);\n", symbol);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700735 // Forward calls are always short (local)
736 return o4(0xEB000000 | encodeAddress(symbol));
Jack Palevich22305132009-05-13 10:58:45 -0700737 }
738
739 virtual void callRelative(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700740 LOG_API("callRelative(%d);\n", t);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700741 int abs = t + getPC() + jumpOffset();
Jack Palevichac0e95e2009-05-29 13:53:44 -0700742 LOG_API("abs=%d (0x%08x)\n", abs, abs);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700743 if (t >= - (1 << 25) && t < (1 << 25)) {
744 o4(0xEB000000 | encodeAddress(t));
745 } else {
746 // Long call.
747 o4(0xE59FC000); // ldr r12, .L1
748 o4(0xEA000000); // b .L99
Jack Palevichbd894902009-05-14 19:35:31 -0700749 o4(t - 12); // .L1: .word 0
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700750 o4(0xE08CC00F); // .L99: add r12,pc
751 o4(0xE12FFF3C); // blx r12
752 }
Jack Palevich22305132009-05-13 10:58:45 -0700753 }
754
755 virtual void callIndirect(int l) {
Jack Palevich09555c72009-05-27 12:25:55 -0700756 LOG_API("callIndirect(%d);\n", l);
Jack Palevich7810bc92009-05-15 14:31:47 -0700757 int argCount = l >> 2;
758 int poppedArgs = argCount > 4 ? 4 : argCount;
-b master422972c2009-06-17 19:13:52 -0700759 int adjustedL = l - (poppedArgs << 2) + mStackAlignmentAdjustment;
Jack Palevich7810bc92009-05-15 14:31:47 -0700760 if (adjustedL < 0 || adjustedL > 4096-4) {
761 error("l out of range for stack offset: 0x%08x", l);
762 }
763 o4(0xE59DC000 | (0xfff & adjustedL)); // ldr r12, [sp,#adjustedL]
764 o4(0xE12FFF3C); // blx r12
Jack Palevich22305132009-05-13 10:58:45 -0700765 }
766
Jack Palevich7810bc92009-05-15 14:31:47 -0700767 virtual void adjustStackAfterCall(int l, bool isIndirect) {
Jack Palevich09555c72009-05-27 12:25:55 -0700768 LOG_API("adjustStackAfterCall(%d, %d);\n", l, isIndirect);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700769 int argCount = l >> 2;
Jack Palevich7810bc92009-05-15 14:31:47 -0700770 int stackArgs = argCount > 4 ? argCount - 4 : 0;
-b master422972c2009-06-17 19:13:52 -0700771 int stackUse = stackArgs + (isIndirect ? 1 : 0)
772 + (mStackAlignmentAdjustment >> 2);
Jack Palevich7810bc92009-05-15 14:31:47 -0700773 if (stackUse) {
774 if (stackUse < 0 || stackUse > 255) {
775 error("L out of range for stack adjustment: 0x%08x", l);
776 }
777 o4(0xE28DDF00 | stackUse); // add sp, sp, #stackUse << 2
-b master422972c2009-06-17 19:13:52 -0700778 mStackUse -= stackUse * 4;
779 LOG_STACK("adjustStackAfterCall: %d\n", mStackUse);
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700780 }
Jack Palevich22305132009-05-13 10:58:45 -0700781 }
782
Jack Palevicha6535612009-05-13 16:24:17 -0700783 virtual int jumpOffset() {
Jack Palevichbd894902009-05-14 19:35:31 -0700784 return 8;
Jack Palevicha6535612009-05-13 16:24:17 -0700785 }
786
787 /* output a symbol and patch all calls to it */
788 virtual void gsym(int t) {
Jack Palevich09555c72009-05-27 12:25:55 -0700789 LOG_API("gsym(0x%x)\n", t);
Jack Palevicha6535612009-05-13 16:24:17 -0700790 int n;
791 int base = getBase();
792 int pc = getPC();
Jack Palevich09555c72009-05-27 12:25:55 -0700793 LOG_API("pc = 0x%x\n", pc);
Jack Palevicha6535612009-05-13 16:24:17 -0700794 while (t) {
795 int data = * (int*) t;
796 int decodedOffset = ((BRANCH_REL_ADDRESS_MASK & data) << 2);
797 if (decodedOffset == 0) {
798 n = 0;
799 } else {
800 n = base + decodedOffset; /* next value */
801 }
802 *(int *) t = (data & ~BRANCH_REL_ADDRESS_MASK)
803 | encodeRelAddress(pc - t - 8);
804 t = n;
805 }
806 }
807
Jack Palevich1cdef202009-05-22 12:06:27 -0700808 virtual int finishCompile() {
809#if defined(__arm__)
810 const long base = long(getBase());
811 const long curr = long(getPC());
812 int err = cacheflush(base, curr, 0);
813 return err;
814#else
815 return 0;
816#endif
817 }
818
Jack Palevicha6535612009-05-13 16:24:17 -0700819 virtual int disassemble(FILE* out) {
Jack Palevich09555c72009-05-27 12:25:55 -0700820#ifdef ENABLE_ARM_DISASSEMBLY
821 disasmOut = out;
Jack Palevicha6535612009-05-13 16:24:17 -0700822 disasm_interface_t di;
823 di.di_readword = disassemble_readword;
824 di.di_printaddr = disassemble_printaddr;
825 di.di_printf = disassemble_printf;
826
827 int base = getBase();
828 int pc = getPC();
829 for(int i = base; i < pc; i += 4) {
830 fprintf(out, "%08x: %08x ", i, *(int*) i);
831 ::disasm(&di, i, 0);
832 }
Jack Palevich09555c72009-05-27 12:25:55 -0700833#endif
Jack Palevicha6535612009-05-13 16:24:17 -0700834 return 0;
835 }
Jack Palevich7810bc92009-05-15 14:31:47 -0700836
Jack Palevich22305132009-05-13 10:58:45 -0700837 private:
Jack Palevicha6535612009-05-13 16:24:17 -0700838 static FILE* disasmOut;
839
840 static u_int
841 disassemble_readword(u_int address)
842 {
843 return(*((u_int *)address));
844 }
845
846 static void
847 disassemble_printaddr(u_int address)
848 {
849 fprintf(disasmOut, "0x%08x", address);
850 }
851
852 static void
853 disassemble_printf(const char *fmt, ...) {
854 va_list ap;
855 va_start(ap, fmt);
856 vfprintf(disasmOut, fmt, ap);
857 va_end(ap);
858 }
859
860 static const int BRANCH_REL_ADDRESS_MASK = 0x00ffffff;
861
862 /** Encode a relative address that might also be
863 * a label.
864 */
865 int encodeAddress(int value) {
866 int base = getBase();
867 if (value >= base && value <= getPC() ) {
868 // This is a label, encode it relative to the base.
869 value = value - base;
870 }
871 return encodeRelAddress(value);
872 }
873
874 int encodeRelAddress(int value) {
875 return BRANCH_REL_ADDRESS_MASK & (value >> 2);
876 }
Jack Palevich22305132009-05-13 10:58:45 -0700877
Jack Palevich3d474a72009-05-15 15:12:38 -0700878 typedef int (*int2FnPtr)(int a, int b);
879 void callRuntime(int2FnPtr fn) {
880 o4(0xE59F2000); // ldr r2, .L1
881 o4(0xEA000000); // b .L99
882 o4((int) fn); //.L1: .word fn
883 o4(0xE12FFF32); //.L99: blx r2
884 }
885
886 static int runtime_DIV(int a, int b) {
887 return b / a;
888 }
889
890 static int runtime_MOD(int a, int b) {
891 return b % a;
892 }
-b master422972c2009-06-17 19:13:52 -0700893
894 static const int STACK_ALIGNMENT = 8;
895 int mStackUse;
896 // This variable holds the amount we adjusted the stack in the most
897 // recent endFunctionCallArguments call. It's examined by the
898 // following adjustStackAfterCall call.
899 int mStackAlignmentAdjustment;
Jack Palevich22305132009-05-13 10:58:45 -0700900 };
901
Jack Palevich09555c72009-05-27 12:25:55 -0700902#endif // PROVIDE_ARM_CODEGEN
Jack Paleviche7b59062009-05-19 17:12:17 -0700903
904#ifdef PROVIDE_X86_CODEGEN
905
Jack Palevich21a15a22009-05-11 14:49:29 -0700906 class X86CodeGenerator : public CodeGenerator {
907 public:
908 X86CodeGenerator() {}
909 virtual ~X86CodeGenerator() {}
910
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700911 /* returns address to patch with local variable size
912 */
Jack Palevich546b2242009-05-13 15:10:04 -0700913 virtual int functionEntry(int argCount) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700914 o(0xe58955); /* push %ebp, mov %esp, %ebp */
915 return oad(0xec81, 0); /* sub $xxx, %esp */
916 }
917
Jack Palevich546b2242009-05-13 15:10:04 -0700918 virtual void functionExit(int argCount, int localVariableAddress, int localVariableSize) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700919 o(0xc3c9); /* leave, ret */
Jack Palevich546b2242009-05-13 15:10:04 -0700920 *(int *) localVariableAddress = localVariableSize; /* save local variables */
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700921 }
922
Jack Palevich21a15a22009-05-11 14:49:29 -0700923 /* load immediate value */
Jack Palevich546b2242009-05-13 15:10:04 -0700924 virtual void li(int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700925 oad(0xb8, t); /* mov $xx, %eax */
926 }
927
Jack Palevich22305132009-05-13 10:58:45 -0700928 virtual int gjmp(int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700929 return psym(0xe9, t);
930 }
931
932 /* l = 0: je, l == 1: jne */
Jack Palevich22305132009-05-13 10:58:45 -0700933 virtual int gtst(bool l, int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700934 o(0x0fc085); /* test %eax, %eax, je/jne xxx */
935 return psym(0x84 + l, t);
936 }
937
Jack Palevich22305132009-05-13 10:58:45 -0700938 virtual void gcmp(int op) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700939 int t = decodeOp(op);
Jack Palevich21a15a22009-05-11 14:49:29 -0700940 o(0xc139); /* cmp %eax,%ecx */
941 li(0);
942 o(0x0f); /* setxx %al */
943 o(t + 0x90);
944 o(0xc0);
945 }
946
Jack Palevich546b2242009-05-13 15:10:04 -0700947 virtual void genOp(int op) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700948 o(decodeOp(op));
949 if (op == OP_MOD)
950 o(0x92); /* xchg %edx, %eax */
951 }
952
Jack Palevich1cdef202009-05-22 12:06:27 -0700953 virtual void clearR1() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700954 oad(0xb9, 0); /* movl $0, %ecx */
955 }
956
Jack Palevich1cdef202009-05-22 12:06:27 -0700957 virtual void pushR0() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700958 o(0x50); /* push %eax */
959 }
960
Jack Palevich1cdef202009-05-22 12:06:27 -0700961 virtual void popR1() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700962 o(0x59); /* pop %ecx */
Jack Palevichbf42c9c2009-05-12 12:48:35 -0700963 }
964
Jack Palevich1cdef202009-05-22 12:06:27 -0700965 virtual void storeR0ToR1(bool isInt) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700966 o(0x0188 + isInt); /* movl %eax/%al, (%ecx) */
967 }
968
Jack Palevich1cdef202009-05-22 12:06:27 -0700969 virtual void loadR0FromR0(bool isInt) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700970 if (isInt)
971 o(0x8b); /* mov (%eax), %eax */
972 else
973 o(0xbe0f); /* movsbl (%eax), %eax */
974 ob(0); /* add zero in code */
975 }
976
Jack Palevich1cdef202009-05-22 12:06:27 -0700977 virtual void leaR0(int ea) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700978 gmov(10, ea); /* leal EA, %eax */
979 }
980
Jack Palevich1cdef202009-05-22 12:06:27 -0700981 virtual void storeR0(int ea) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700982 gmov(6, ea); /* mov %eax, EA */
983 }
984
Jack Palevich1cdef202009-05-22 12:06:27 -0700985 virtual void loadR0(int ea, bool isIncDec, int op) {
Jack Palevich21a15a22009-05-11 14:49:29 -0700986 gmov(8, ea); /* mov EA, %eax */
Jack Palevich4d93f302009-05-15 13:30:00 -0700987 if (isIncDec) {
988 /* Implement post-increment or post decrement.
989 */
990 gmov(0, ea); /* 83 ADD */
991 o(decodeOp(op));
992 }
Jack Palevich21a15a22009-05-11 14:49:29 -0700993 }
994
Jack Palevichcb1c9ef2009-05-14 11:38:49 -0700995 virtual int beginFunctionCallArguments() {
Jack Palevich21a15a22009-05-11 14:49:29 -0700996 return oad(0xec81, 0); /* sub $xxx, %esp */
997 }
998
Jack Palevich1cdef202009-05-22 12:06:27 -0700999 virtual void storeR0ToArg(int l) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001000 oad(0x248489, l); /* movl %eax, xxx(%esp) */
1001 }
1002
Jack Palevich7810bc92009-05-15 14:31:47 -07001003 virtual void endFunctionCallArguments(int a, int l) {
1004 * (int*) a = l;
1005 }
1006
Jack Palevich22305132009-05-13 10:58:45 -07001007 virtual int callForward(int symbol) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001008 return psym(0xe8, symbol); /* call xxx */
1009 }
1010
Jack Palevich22305132009-05-13 10:58:45 -07001011 virtual void callRelative(int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001012 psym(0xe8, t); /* call xxx */
1013 }
1014
Jack Palevich22305132009-05-13 10:58:45 -07001015 virtual void callIndirect(int l) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001016 oad(0x2494ff, l); /* call *xxx(%esp) */
1017 }
1018
Jack Palevich7810bc92009-05-15 14:31:47 -07001019 virtual void adjustStackAfterCall(int l, bool isIndirect) {
1020 if (isIndirect) {
1021 l += 4;
1022 }
-b master422972c2009-06-17 19:13:52 -07001023 if (l > 0) {
1024 oad(0xc481, l); /* add $xxx, %esp */
1025 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001026 }
1027
Jack Palevicha6535612009-05-13 16:24:17 -07001028 virtual int jumpOffset() {
1029 return 5;
1030 }
1031
1032 virtual int disassemble(FILE* out) {
Jack Palevich1cdef202009-05-22 12:06:27 -07001033 return 0;
Jack Palevicha6535612009-05-13 16:24:17 -07001034 }
1035
Jack Paleviche7b59062009-05-19 17:12:17 -07001036 /* output a symbol and patch all calls to it */
1037 virtual void gsym(int t) {
1038 int n;
1039 int pc = getPC();
1040 while (t) {
1041 n = *(int *) t; /* next value */
1042 *(int *) t = pc - t - 4;
1043 t = n;
1044 }
1045 }
1046
Jack Palevich1cdef202009-05-22 12:06:27 -07001047 virtual int finishCompile() {
Jack Palevich8dc662e2009-06-09 22:53:47 +00001048 size_t pagesize = 4096;
1049 size_t base = (size_t) getBase() & ~ (pagesize - 1);
1050 size_t top = ((size_t) getPC() + pagesize - 1) & ~ (pagesize - 1);
1051 int err = mprotect((void*) base, top - base, PROT_READ | PROT_WRITE | PROT_EXEC);
1052 if (err) {
1053 error("mprotect() failed: %d", errno);
1054 }
1055 return err;
Jack Palevich1cdef202009-05-22 12:06:27 -07001056 }
1057
Jack Palevich21a15a22009-05-11 14:49:29 -07001058 private:
Jack Paleviche7b59062009-05-19 17:12:17 -07001059
1060 /** Output 1 to 4 bytes.
1061 *
1062 */
1063 void o(int n) {
1064 /* cannot use unsigned, so we must do a hack */
1065 while (n && n != -1) {
1066 ob(n & 0xff);
1067 n = n >> 8;
1068 }
1069 }
1070
1071 /* psym is used to put an instruction with a data field which is a
1072 reference to a symbol. It is in fact the same as oad ! */
1073 int psym(int n, int t) {
1074 return oad(n, t);
1075 }
1076
1077 /* instruction + address */
1078 int oad(int n, int t) {
1079 o(n);
1080 int result = getPC();
1081 o4(t);
1082 return result;
1083 }
1084
1085
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001086 static const int operatorHelper[];
1087
1088 int decodeOp(int op) {
1089 if (op < 0 || op > OP_COUNT) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07001090 error("Out-of-range operator: %d\n", op);
Jack Palevich0a280a02009-06-11 10:53:51 -07001091 op = 0;
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001092 }
1093 return operatorHelper[op];
1094 }
Jack Palevich21a15a22009-05-11 14:49:29 -07001095
Jack Palevich546b2242009-05-13 15:10:04 -07001096 void gmov(int l, int t) {
Jack Palevich21a15a22009-05-11 14:49:29 -07001097 o(l + 0x83);
Jack Palevich8dc662e2009-06-09 22:53:47 +00001098 oad((t > -LOCAL && t < LOCAL) << 7 | 5, t);
Jack Palevich21a15a22009-05-11 14:49:29 -07001099 }
1100 };
1101
Jack Paleviche7b59062009-05-19 17:12:17 -07001102#endif // PROVIDE_X86_CODEGEN
1103
Jack Palevichb67b18f2009-06-11 21:12:23 -07001104#ifdef PROVIDE_TRACE_CODEGEN
1105 class TraceCodeGenerator : public CodeGenerator {
1106 private:
1107 CodeGenerator* mpBase;
1108
1109 public:
1110 TraceCodeGenerator(CodeGenerator* pBase) {
1111 mpBase = pBase;
1112 }
1113
1114 virtual ~TraceCodeGenerator() {
1115 delete mpBase;
1116 }
1117
1118 virtual void init(CodeBuf* pCodeBuf) {
1119 mpBase->init(pCodeBuf);
1120 }
1121
1122 void setErrorSink(ErrorSink* pErrorSink) {
1123 mpBase->setErrorSink(pErrorSink);
1124 }
1125
1126 /* returns address to patch with local variable size
1127 */
1128 virtual int functionEntry(int argCount) {
1129 int result = mpBase->functionEntry(argCount);
1130 fprintf(stderr, "functionEntry(%d) -> %d\n", argCount, result);
1131 return result;
1132 }
1133
1134 virtual void functionExit(int argCount, int localVariableAddress, int localVariableSize) {
1135 fprintf(stderr, "functionExit(%d, %d, %d)\n",
1136 argCount, localVariableAddress, localVariableSize);
1137 mpBase->functionExit(argCount, localVariableAddress, localVariableSize);
1138 }
1139
1140 /* load immediate value */
1141 virtual void li(int t) {
1142 fprintf(stderr, "li(%d)\n", t);
1143 mpBase->li(t);
1144 }
1145
1146 virtual int gjmp(int t) {
1147 int result = mpBase->gjmp(t);
1148 fprintf(stderr, "gjmp(%d) = %d\n", t, result);
1149 return result;
1150 }
1151
1152 /* l = 0: je, l == 1: jne */
1153 virtual int gtst(bool l, int t) {
1154 int result = mpBase->gtst(l, t);
1155 fprintf(stderr, "gtst(%d,%d) = %d\n", l, t, result);
1156 return result;
1157 }
1158
1159 virtual void gcmp(int op) {
1160 fprintf(stderr, "gcmp(%d)\n", op);
1161 mpBase->gcmp(op);
1162 }
1163
1164 virtual void genOp(int op) {
1165 fprintf(stderr, "genOp(%d)\n", op);
1166 mpBase->genOp(op);
1167 }
1168
1169 virtual void clearR1() {
1170 fprintf(stderr, "clearR1()\n");
1171 mpBase->clearR1();
1172 }
1173
1174 virtual void pushR0() {
1175 fprintf(stderr, "pushR0()\n");
1176 mpBase->pushR0();
1177 }
1178
1179 virtual void popR1() {
1180 fprintf(stderr, "popR1()\n");
1181 mpBase->popR1();
1182 }
1183
1184 virtual void storeR0ToR1(bool isInt) {
1185 fprintf(stderr, "storeR0ToR1(%d)\n", isInt);
1186 mpBase->storeR0ToR1(isInt);
1187 }
1188
1189 virtual void loadR0FromR0(bool isInt) {
1190 fprintf(stderr, "loadR0FromR0(%d)\n", isInt);
1191 mpBase->loadR0FromR0(isInt);
1192 }
1193
1194 virtual void leaR0(int ea) {
1195 fprintf(stderr, "leaR0(%d)\n", ea);
1196 mpBase->leaR0(ea);
1197 }
1198
1199 virtual void storeR0(int ea) {
1200 fprintf(stderr, "storeR0(%d)\n", ea);
1201 mpBase->storeR0(ea);
1202 }
1203
1204 virtual void loadR0(int ea, bool isIncDec, int op) {
1205 fprintf(stderr, "loadR0(%d, %d, %d)\n", ea, isIncDec, op);
1206 mpBase->loadR0(ea, isIncDec, op);
1207 }
1208
1209 virtual int beginFunctionCallArguments() {
1210 int result = mpBase->beginFunctionCallArguments();
1211 fprintf(stderr, "beginFunctionCallArguments() = %d\n", result);
1212 return result;
1213 }
1214
1215 virtual void storeR0ToArg(int l) {
1216 fprintf(stderr, "storeR0ToArg(%d)\n", l);
1217 mpBase->storeR0ToArg(l);
1218 }
1219
1220 virtual void endFunctionCallArguments(int a, int l) {
1221 fprintf(stderr, "endFunctionCallArguments(%d, %d)\n", a, l);
1222 mpBase->endFunctionCallArguments(a, l);
1223 }
1224
1225 virtual int callForward(int symbol) {
1226 int result = mpBase->callForward(symbol);
1227 fprintf(stderr, "callForward(%d) = %d\n", symbol, result);
1228 return result;
1229 }
1230
1231 virtual void callRelative(int t) {
1232 fprintf(stderr, "callRelative(%d)\n", t);
1233 mpBase->callRelative(t);
1234 }
1235
1236 virtual void callIndirect(int l) {
1237 fprintf(stderr, "callIndirect(%d)\n", l);
1238 mpBase->callIndirect(l);
1239 }
1240
1241 virtual void adjustStackAfterCall(int l, bool isIndirect) {
1242 fprintf(stderr, "adjustStackAfterCall(%d, %d)\n", l, isIndirect);
1243 mpBase->adjustStackAfterCall(l, isIndirect);
1244 }
1245
1246 virtual int jumpOffset() {
1247 return mpBase->jumpOffset();
1248 }
1249
1250 virtual int disassemble(FILE* out) {
1251 return mpBase->disassemble(out);
1252 }
1253
1254 /* output a symbol and patch all calls to it */
1255 virtual void gsym(int t) {
1256 fprintf(stderr, "gsym(%d)\n", t);
1257 mpBase->gsym(t);
1258 }
1259
1260 virtual int finishCompile() {
1261 int result = mpBase->finishCompile();
1262 fprintf(stderr, "finishCompile() = %d\n", result);
1263 return result;
1264 }
1265 };
1266
1267#endif // PROVIDE_TRACE_CODEGEN
1268
Jack Palevich569f1352009-06-29 14:29:08 -07001269
1270 // Subset of STL vector.
1271 template<class E> class Vector {
1272 public:
1273 Vector() {
1274 mpBase = 0;
1275 mUsed = 0;
1276 mSize = 0;
1277 }
1278
1279 ~Vector() {
1280 if (mpBase) {
1281 for(size_t i = 0; i < mUsed; i++) {
1282 mpBase[mUsed].~E();
1283 }
1284 free(mpBase);
1285 }
1286 }
1287
1288 inline E& operator[](size_t i) {
1289 return mpBase[i];
1290 }
1291
1292 inline E& front() {
1293 return mpBase[0];
1294 }
1295
1296 inline E& back() {
1297 return mpBase[mUsed - 1];
1298 }
1299
1300 void pop_back() {
1301 mUsed -= 1;
1302 mpBase[mUsed].~E();
1303 }
1304
1305 void push_back(const E& item) {
1306 * ensure(1) = item;
1307 }
1308
1309 size_t size() {
1310 return mUsed;
1311 }
1312
1313 private:
1314 E* ensure(int n) {
1315 size_t newUsed = mUsed + n;
1316 if (newUsed > mSize) {
1317 size_t newSize = mSize * 2 + 10;
1318 if (newSize < newUsed) {
1319 newSize = newUsed;
1320 }
1321 mpBase = (E*) realloc(mpBase, sizeof(E) * newSize);
1322 mSize = newSize;
1323 }
1324 E* result = mpBase + mUsed;
1325 mUsed = newUsed;
1326 return result;
1327 }
1328
1329 E* mpBase;
1330 size_t mUsed;
1331 size_t mSize;
1332 };
1333
1334 class Arena {
1335 public:
1336 // Used to record a given allocation amount.
1337 // Used:
1338 // Mark mark = arena.mark();
1339 // ... lots of arena.allocate()
1340 // arena.free(mark);
1341
1342 struct Mark {
1343 size_t chunk;
1344 size_t offset;
1345 };
1346
1347 Arena() {
1348 mCurrentChunk = 0;
1349 Chunk start(CHUNK_SIZE);
1350 mData.push_back(start);
1351 }
1352
1353 ~Arena() {
1354 for(size_t i = 0; i < mData.size(); i++) {
1355 mData[i].free();
1356 }
1357 }
1358
1359 // Alloc using the standard alignment size safe for any variable
1360 void* alloc(size_t size) {
1361 return alloc(size, 8);
1362 }
1363
1364 Mark mark(){
1365 Mark result;
1366 result.chunk = mCurrentChunk;
1367 result.offset = mData[mCurrentChunk].mOffset;
1368 return result;
1369 }
1370
1371 void freeToMark(const Mark& mark) {
1372 mCurrentChunk = mark.chunk;
1373 mData[mCurrentChunk].mOffset = mark.offset;
1374 }
1375
1376 private:
1377 // Allocate memory aligned to a given size
1378 // and a given power-of-two-sized alignment (e.g. 1,2,4,8,...)
1379 // Memory is not zero filled.
1380
1381 void* alloc(size_t size, size_t alignment) {
1382 while (size > mData[mCurrentChunk].remainingCapacity(alignment)) {
1383 if (mCurrentChunk + 1 < mData.size()) {
1384 mCurrentChunk++;
1385 } else {
1386 size_t allocSize = CHUNK_SIZE;
1387 if (allocSize < size + alignment - 1) {
1388 allocSize = size + alignment - 1;
1389 }
1390 Chunk chunk(allocSize);
1391 mData.push_back(chunk);
1392 mCurrentChunk++;
1393 }
1394 }
1395 return mData[mCurrentChunk].allocate(size, alignment);
1396 }
1397
1398 static const size_t CHUNK_SIZE = 128*1024;
1399 // Note: this class does not deallocate its
1400 // memory when it's destroyed. It depends upon
1401 // its parent to deallocate the memory.
1402 struct Chunk {
1403 Chunk() {
1404 mpData = 0;
1405 mSize = 0;
1406 mOffset = 0;
1407 }
1408
1409 Chunk(size_t size) {
1410 mSize = size;
1411 mpData = (char*) malloc(size);
1412 mOffset = 0;
1413 }
1414
1415 ~Chunk() {
1416 // Doesn't deallocate memory.
1417 }
1418
1419 void* allocate(size_t size, size_t alignment) {
1420 size_t alignedOffset = aligned(mOffset, alignment);
1421 void* result = mpData + alignedOffset;
1422 mOffset = alignedOffset + size;
1423 return result;
1424 }
1425
1426 void free() {
1427 if (mpData) {
1428 ::free(mpData);
1429 mpData = 0;
1430 }
1431 }
1432
1433 size_t remainingCapacity(size_t alignment) {
1434 return aligned(mSize, alignment) - aligned(mOffset, alignment);
1435 }
1436
1437 // Assume alignment is a power of two
1438 inline size_t aligned(size_t v, size_t alignment) {
1439 size_t mask = alignment-1;
1440 return (v + mask) & ~mask;
1441 }
1442
1443 char* mpData;
1444 size_t mSize;
1445 size_t mOffset;
1446 };
1447
1448 size_t mCurrentChunk;
1449
1450 Vector<Chunk> mData;
1451 };
1452
1453 typedef int tokenid_t;
1454 struct VariableInfo;
1455
1456 struct Token {
1457 int hash;
1458 size_t length;
1459 char* pText;
1460 tokenid_t id;
1461
1462 // Current values for the token
1463 char* mpMacroDefinition;
1464 VariableInfo* mpVariableInfo;
1465 };
1466
1467 class TokenTable {
1468 public:
1469 // Don't use 0..0xff, allows characters and operators to be tokens too.
1470
1471 static const int TOKEN_BASE = 0x100;
1472 TokenTable() {
1473 mpMap = hashmapCreate(128, hashFn, equalsFn);
1474 }
1475
1476 ~TokenTable() {
1477 hashmapFree(mpMap);
1478 }
1479
1480 void setArena(Arena* pArena) {
1481 mpArena = pArena;
1482 }
1483
1484 // Returns a token for a given string of characters.
1485 tokenid_t intern(const char* pText, size_t length) {
1486 Token probe;
1487 int hash = hashmapHash((void*) pText, length);
1488 {
1489 Token probe;
1490 probe.hash = hash;
1491 probe.length = length;
1492 probe.pText = (char*) pText;
1493 Token* pValue = (Token*) hashmapGet(mpMap, &probe);
1494 if (pValue) {
Jack Palevich569f1352009-06-29 14:29:08 -07001495 return pValue->id;
1496 }
1497 }
1498
1499 Token* pToken = (Token*) mpArena->alloc(sizeof(Token));
1500 memset(pToken, 0, sizeof(*pToken));
1501 pToken->hash = hash;
1502 pToken->length = length;
1503 pToken->pText = (char*) mpArena->alloc(length + 1);
1504 memcpy(pToken->pText, pText, length);
1505 pToken->pText[length] = 0;
1506 pToken->id = mTokens.size() + TOKEN_BASE;
1507 mTokens.push_back(pToken);
1508 hashmapPut(mpMap, pToken, pToken);
Jack Palevich569f1352009-06-29 14:29:08 -07001509 return pToken->id;
1510 }
1511
1512 // Return the Token for a given tokenid.
1513 Token& operator[](tokenid_t id) {
1514 return *mTokens[id - TOKEN_BASE];
1515 }
1516
1517 inline size_t size() {
1518 return mTokens.size();
1519 }
1520
1521 private:
1522
1523 static int hashFn(void* pKey) {
1524 Token* pToken = (Token*) pKey;
1525 return pToken->hash;
1526 }
1527
1528 static bool equalsFn(void* keyA, void* keyB) {
1529 Token* pTokenA = (Token*) keyA;
1530 Token* pTokenB = (Token*) keyB;
1531 // Don't need to compare hash values, they should always be equal
1532 return pTokenA->length == pTokenB->length
1533 && strcmp(pTokenA->pText, pTokenB->pText) == 0;
1534 }
1535
1536 Hashmap* mpMap;
1537 Vector<Token*> mTokens;
1538 Arena* mpArena;
1539 };
1540
Jack Palevich1cdef202009-05-22 12:06:27 -07001541 class InputStream {
1542 public:
Jack Palevicheedf9d22009-06-04 16:23:40 -07001543 int getChar() {
1544 if (bumpLine) {
1545 line++;
1546 bumpLine = false;
1547 }
1548 int ch = get();
1549 if (ch == '\n') {
1550 bumpLine = true;
1551 }
1552 return ch;
1553 }
1554 int getLine() {
1555 return line;
1556 }
1557 protected:
1558 InputStream() :
1559 line(1), bumpLine(false) {
1560 }
1561 private:
Jack Palevich1cdef202009-05-22 12:06:27 -07001562 virtual int get() = 0;
Jack Palevicheedf9d22009-06-04 16:23:40 -07001563 int line;
1564 bool bumpLine;
Jack Palevich1cdef202009-05-22 12:06:27 -07001565 };
1566
1567 class FileInputStream : public InputStream {
1568 public:
1569 FileInputStream(FILE* in) : f(in) {}
Jack Palevich1cdef202009-05-22 12:06:27 -07001570 private:
Jack Palevicheedf9d22009-06-04 16:23:40 -07001571 virtual int get() { return fgetc(f); }
Jack Palevich1cdef202009-05-22 12:06:27 -07001572 FILE* f;
1573 };
1574
1575 class TextInputStream : public InputStream {
1576 public:
1577 TextInputStream(const char* text, size_t textLength)
1578 : pText(text), mTextLength(textLength), mPosition(0) {
1579 }
Jack Palevicheedf9d22009-06-04 16:23:40 -07001580
1581 private:
Jack Palevich1cdef202009-05-22 12:06:27 -07001582 virtual int get() {
1583 return mPosition < mTextLength ? pText[mPosition++] : EOF;
1584 }
Jack Palevich1cdef202009-05-22 12:06:27 -07001585
Jack Palevich1cdef202009-05-22 12:06:27 -07001586 const char* pText;
1587 size_t mTextLength;
1588 size_t mPosition;
1589 };
1590
Jack Palevicheedf9d22009-06-04 16:23:40 -07001591 class String {
1592 public:
1593 String() {
1594 mpBase = 0;
1595 mUsed = 0;
1596 mSize = 0;
1597 }
1598
Jack Palevich303d8ff2009-06-11 19:06:24 -07001599 String(const char* item, int len, bool adopt) {
1600 if (len < 0) {
1601 len = strlen(item);
1602 }
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001603 if (adopt) {
Jack Palevich303d8ff2009-06-11 19:06:24 -07001604 mpBase = (char*) item;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001605 mUsed = len;
1606 mSize = len + 1;
1607 } else {
1608 mpBase = 0;
1609 mUsed = 0;
1610 mSize = 0;
1611 appendBytes(item, len);
1612 }
1613 }
1614
Jack Palevich303d8ff2009-06-11 19:06:24 -07001615 String(const String& other) {
1616 mpBase = 0;
1617 mUsed = 0;
1618 mSize = 0;
1619 appendBytes(other.getUnwrapped(), other.len());
1620 }
1621
Jack Palevicheedf9d22009-06-04 16:23:40 -07001622 ~String() {
1623 if (mpBase) {
1624 free(mpBase);
1625 }
1626 }
1627
Jack Palevicha6baa232009-06-12 11:25:59 -07001628 String& operator=(const String& other) {
1629 clear();
1630 appendBytes(other.getUnwrapped(), other.len());
1631 return *this;
1632 }
1633
Jack Palevich303d8ff2009-06-11 19:06:24 -07001634 inline char* getUnwrapped() const {
Jack Palevicheedf9d22009-06-04 16:23:40 -07001635 return mpBase;
1636 }
1637
Jack Palevich303d8ff2009-06-11 19:06:24 -07001638 void clear() {
1639 mUsed = 0;
1640 if (mSize > 0) {
1641 mpBase[0] = 0;
1642 }
1643 }
1644
Jack Palevicheedf9d22009-06-04 16:23:40 -07001645 void appendCStr(const char* s) {
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001646 appendBytes(s, strlen(s));
1647 }
1648
1649 void appendBytes(const char* s, int n) {
Jack Palevicheedf9d22009-06-04 16:23:40 -07001650 memcpy(ensure(n), s, n + 1);
1651 }
1652
1653 void append(char c) {
1654 * ensure(1) = c;
1655 }
1656
Jack Palevich86351982009-06-30 18:09:56 -07001657 void append(String& other) {
1658 appendBytes(other.getUnwrapped(), other.len());
1659 }
1660
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001661 char* orphan() {
1662 char* result = mpBase;
1663 mpBase = 0;
1664 mUsed = 0;
1665 mSize = 0;
1666 return result;
1667 }
1668
Jack Palevicheedf9d22009-06-04 16:23:40 -07001669 void printf(const char* fmt,...) {
1670 va_list ap;
1671 va_start(ap, fmt);
1672 vprintf(fmt, ap);
1673 va_end(ap);
1674 }
1675
1676 void vprintf(const char* fmt, va_list ap) {
1677 char* temp;
1678 int numChars = vasprintf(&temp, fmt, ap);
1679 memcpy(ensure(numChars), temp, numChars+1);
1680 free(temp);
1681 }
1682
Jack Palevich303d8ff2009-06-11 19:06:24 -07001683 inline size_t len() const {
Jack Palevicheedf9d22009-06-04 16:23:40 -07001684 return mUsed;
1685 }
1686
1687 private:
1688 char* ensure(int n) {
1689 size_t newUsed = mUsed + n;
1690 if (newUsed > mSize) {
1691 size_t newSize = mSize * 2 + 10;
1692 if (newSize < newUsed) {
1693 newSize = newUsed;
1694 }
1695 mpBase = (char*) realloc(mpBase, newSize + 1);
1696 mSize = newSize;
1697 }
1698 mpBase[newUsed] = '\0';
1699 char* result = mpBase + mUsed;
1700 mUsed = newUsed;
1701 return result;
1702 }
1703
1704 char* mpBase;
1705 size_t mUsed;
1706 size_t mSize;
1707 };
1708
Jack Palevich569f1352009-06-29 14:29:08 -07001709 void internKeywords() {
1710 // Note: order has to match TOK_ constants
1711 static const char* keywords[] = {
1712 "int",
1713 "char",
1714 "void",
1715 "if",
1716 "else",
1717 "while",
1718 "break",
1719 "return",
1720 "for",
1721 "pragma",
1722 "define",
1723 "auto",
1724 "case",
1725 "const",
1726 "continue",
1727 "default",
1728 "do",
1729 "double",
1730 "enum",
1731 "extern",
1732 "float",
1733 "goto",
1734 "long",
1735 "register",
1736 "short",
1737 "signed",
1738 "sizeof",
1739 "static",
1740 "struct",
1741 "switch",
1742 "typedef",
1743 "union",
1744 "unsigned",
1745 "volatile",
1746 "_Bool",
1747 "_Complex",
1748 "_Imaginary",
1749 "inline",
1750 "restrict",
1751 0};
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001752
Jack Palevich569f1352009-06-29 14:29:08 -07001753 for(int i = 0; keywords[i]; i++) {
1754 mTokenTable.intern(keywords[i], strlen(keywords[i]));
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001755 }
Jack Palevich569f1352009-06-29 14:29:08 -07001756 }
Jack Palevich2d11dfb2009-06-08 14:34:26 -07001757
Jack Palevich36d94142009-06-08 15:55:32 -07001758 struct InputState {
1759 InputStream* pStream;
1760 int oldCh;
1761 };
1762
Jack Palevich86351982009-06-30 18:09:56 -07001763 struct Type;
1764
Jack Palevich2db168f2009-06-11 14:29:47 -07001765 struct VariableInfo {
Jack Palevich303d8ff2009-06-11 19:06:24 -07001766 void* pAddress;
1767 void* pForward; // For a forward direction, linked list of data to fix up
Jack Palevich569f1352009-06-29 14:29:08 -07001768 tokenid_t tok;
1769 size_t level;
1770 VariableInfo* pOldDefinition;
Jack Palevich86351982009-06-30 18:09:56 -07001771 Type* pType;
Jack Palevich2db168f2009-06-11 14:29:47 -07001772 };
1773
Jack Palevich303d8ff2009-06-11 19:06:24 -07001774 class SymbolStack {
1775 public:
1776 SymbolStack() {
Jack Palevich569f1352009-06-29 14:29:08 -07001777 mpArena = 0;
1778 mpTokenTable = 0;
1779 }
1780
1781 void setArena(Arena* pArena) {
1782 mpArena = pArena;
1783 }
1784
1785 void setTokenTable(TokenTable* pTokenTable) {
1786 mpTokenTable = pTokenTable;
Jack Palevich303d8ff2009-06-11 19:06:24 -07001787 }
1788
1789 void pushLevel() {
Jack Palevich569f1352009-06-29 14:29:08 -07001790 Mark mark;
1791 mark.mArenaMark = mpArena->mark();
1792 mark.mSymbolHead = mStack.size();
1793 mLevelStack.push_back(mark);
Jack Palevich303d8ff2009-06-11 19:06:24 -07001794 }
1795
1796 void popLevel() {
Jack Palevich569f1352009-06-29 14:29:08 -07001797 // Undo any shadowing that was done:
1798 Mark mark = mLevelStack.back();
1799 mLevelStack.pop_back();
1800 while (mStack.size() > mark.mSymbolHead) {
1801 VariableInfo* pV = mStack.back();
1802 mStack.pop_back();
1803 (*mpTokenTable)[pV->tok].mpVariableInfo = pV->pOldDefinition;
Jack Palevich303d8ff2009-06-11 19:06:24 -07001804 }
Jack Palevich569f1352009-06-29 14:29:08 -07001805 mpArena->freeToMark(mark.mArenaMark);
Jack Palevich303d8ff2009-06-11 19:06:24 -07001806 }
1807
Jack Palevich569f1352009-06-29 14:29:08 -07001808 bool isDefinedAtCurrentLevel(tokenid_t tok) {
1809 VariableInfo* pV = (*mpTokenTable)[tok].mpVariableInfo;
1810 return pV && pV->level == level();
1811 }
1812
1813 VariableInfo* add(tokenid_t tok) {
1814 Token& token = (*mpTokenTable)[tok];
1815 VariableInfo* pOldV = token.mpVariableInfo;
1816 VariableInfo* pNewV =
1817 (VariableInfo*) mpArena->alloc(sizeof(VariableInfo));
1818 memset(pNewV, 0, sizeof(VariableInfo));
1819 pNewV->tok = tok;
1820 pNewV->level = level();
1821 pNewV->pOldDefinition = pOldV;
1822 token.mpVariableInfo = pNewV;
1823 mStack.push_back(pNewV);
1824 return pNewV;
1825 }
1826
Jack Palevich86351982009-06-30 18:09:56 -07001827 VariableInfo* add(Type* pType) {
1828 VariableInfo* pVI = add(pType->id);
1829 pVI->pType = pType;
1830 return pVI;
1831 }
1832
Jack Palevich569f1352009-06-29 14:29:08 -07001833 void forEach(bool (*fn)(VariableInfo*, void*), void* context) {
1834 for (size_t i = 0; i < mStack.size(); i++) {
1835 if (! fn(mStack[i], context)) {
Jack Palevich303d8ff2009-06-11 19:06:24 -07001836 break;
1837 }
1838 }
Jack Palevicha6baa232009-06-12 11:25:59 -07001839 }
1840
Jack Palevich303d8ff2009-06-11 19:06:24 -07001841 private:
Jack Palevich569f1352009-06-29 14:29:08 -07001842 inline size_t level() {
1843 return mLevelStack.size();
Jack Palevich303d8ff2009-06-11 19:06:24 -07001844 }
1845
Jack Palevich569f1352009-06-29 14:29:08 -07001846 struct Mark {
1847 Arena::Mark mArenaMark;
1848 size_t mSymbolHead;
Jack Palevich303d8ff2009-06-11 19:06:24 -07001849 };
1850
Jack Palevich569f1352009-06-29 14:29:08 -07001851 Arena* mpArena;
1852 TokenTable* mpTokenTable;
1853 Vector<VariableInfo*> mStack;
1854 Vector<Mark> mLevelStack;
Jack Palevich303d8ff2009-06-11 19:06:24 -07001855 };
Jack Palevich36d94142009-06-08 15:55:32 -07001856
1857 int ch; // Current input character, or EOF
Jack Palevich569f1352009-06-29 14:29:08 -07001858 tokenid_t tok; // token
Jack Palevich36d94142009-06-08 15:55:32 -07001859 intptr_t tokc; // token extra info
1860 int tokl; // token operator level
1861 intptr_t rsym; // return symbol
1862 intptr_t loc; // local variable index
1863 char* glo; // global variable index
Jack Palevich303d8ff2009-06-11 19:06:24 -07001864 String mTokenString;
Jack Palevich36d94142009-06-08 15:55:32 -07001865 char* dptr; // Macro state: Points to macro text during macro playback.
1866 int dch; // Macro state: Saves old value of ch during a macro playback.
Jack Palevich36d94142009-06-08 15:55:32 -07001867 char* pGlobalBase;
Jack Palevich569f1352009-06-29 14:29:08 -07001868
1869 // Arena for the duration of the compile
1870 Arena mGlobalArena;
1871 // Arena for data that's only needed when compiling a single function
1872 Arena mLocalArena;
1873
1874 TokenTable mTokenTable;
1875 SymbolStack mGlobals;
1876 SymbolStack mLocals;
1877
Jack Palevich86351982009-06-30 18:09:56 -07001878 Type* mkpInt;
1879 Type* mkpChar;
1880 Type* mkpVoid;
1881
Jack Palevich36d94142009-06-08 15:55:32 -07001882 InputStream* file;
1883
1884 CodeBuf codeBuf;
1885 CodeGenerator* pGen;
1886
Jack Palevicheedf9d22009-06-04 16:23:40 -07001887 String mErrorBuf;
1888
Jack Palevicheedf9d22009-06-04 16:23:40 -07001889 String mPragmas;
1890 int mPragmaStringCount;
1891
Jack Palevich21a15a22009-05-11 14:49:29 -07001892 static const int ALLOC_SIZE = 99999;
1893
Jack Palevich303d8ff2009-06-11 19:06:24 -07001894 static const int TOK_DUMMY = 1;
1895 static const int TOK_NUM = 2;
1896
1897 // 3..255 are character and/or operators
1898
Jack Palevich2db168f2009-06-11 14:29:47 -07001899 // Keywords start at 0x100 and increase by 1
Jack Palevich569f1352009-06-29 14:29:08 -07001900 // Order has to match string list in "internKeywords".
1901 enum {
1902 TOK_KEYWORD = TokenTable::TOKEN_BASE,
1903 TOK_INT = TOK_KEYWORD,
1904 TOK_CHAR,
1905 TOK_VOID,
1906 TOK_IF,
1907 TOK_ELSE,
1908 TOK_WHILE,
1909 TOK_BREAK,
1910 TOK_RETURN,
1911 TOK_FOR,
1912 TOK_PRAGMA,
1913 TOK_DEFINE,
1914 TOK_AUTO,
1915 TOK_CASE,
1916 TOK_CONST,
1917 TOK_CONTINUE,
1918 TOK_DEFAULT,
1919 TOK_DO,
1920 TOK_DOUBLE,
1921 TOK_ENUM,
1922 TOK_EXTERN,
1923 TOK_FLOAT,
1924 TOK_GOTO,
1925 TOK_LONG,
1926 TOK_REGISTER,
1927 TOK_SHORT,
1928 TOK_SIGNED,
1929 TOK_SIZEOF,
1930 TOK_STATIC,
1931 TOK_STRUCT,
1932 TOK_SWITCH,
1933 TOK_TYPEDEF,
1934 TOK_UNION,
1935 TOK_UNSIGNED,
1936 TOK_VOLATILE,
1937 TOK__BOOL,
1938 TOK__COMPLEX,
1939 TOK__IMAGINARY,
1940 TOK_INLINE,
1941 TOK_RESTRICT,
1942 // Symbols start after tokens
1943 TOK_SYMBOL
1944 };
Jack Palevich21a15a22009-05-11 14:49:29 -07001945
1946 static const int LOCAL = 0x200;
1947
1948 static const int SYM_FORWARD = 0;
1949 static const int SYM_DEFINE = 1;
1950
1951 /* tokens in string heap */
1952 static const int TAG_TOK = ' ';
Jack Palevich21a15a22009-05-11 14:49:29 -07001953
Jack Palevichbf42c9c2009-05-12 12:48:35 -07001954 static const int OP_INCREMENT = 0;
1955 static const int OP_DECREMENT = 1;
1956 static const int OP_MUL = 2;
1957 static const int OP_DIV = 3;
1958 static const int OP_MOD = 4;
1959 static const int OP_PLUS = 5;
1960 static const int OP_MINUS = 6;
1961 static const int OP_SHIFT_LEFT = 7;
1962 static const int OP_SHIFT_RIGHT = 8;
1963 static const int OP_LESS_EQUAL = 9;
1964 static const int OP_GREATER_EQUAL = 10;
1965 static const int OP_LESS = 11;
1966 static const int OP_GREATER = 12;
1967 static const int OP_EQUALS = 13;
1968 static const int OP_NOT_EQUALS = 14;
1969 static const int OP_LOGICAL_AND = 15;
1970 static const int OP_LOGICAL_OR = 16;
1971 static const int OP_BIT_AND = 17;
1972 static const int OP_BIT_XOR = 18;
1973 static const int OP_BIT_OR = 19;
1974 static const int OP_BIT_NOT = 20;
1975 static const int OP_LOGICAL_NOT = 21;
1976 static const int OP_COUNT = 22;
1977
1978 /* Operators are searched from front, the two-character operators appear
1979 * before the single-character operators with the same first character.
1980 * @ is used to pad out single-character operators.
1981 */
1982 static const char* operatorChars;
1983 static const char operatorLevel[];
1984
/* Called when we detect an internal problem (a broken invariant inside
 * the compiler itself, as opposed to an error in the program being
 * compiled). Terminates the process.
 *
 * This used to store through a null pointer to force a crash. That is
 * undefined behaviour and an optimising compiler is free to remove the
 * store, silently turning the check into a no-op, so abort() is used
 * instead.
 */
void internalError() {
    abort();
}
1991
Jack Palevich86351982009-06-30 18:09:56 -07001992 void assert(bool isTrue) {
1993 if (!isTrue) {
Jack Palevich569f1352009-06-29 14:29:08 -07001994 internalError();
1995 }
Jack Palevich86351982009-06-30 18:09:56 -07001996 }
1997
1998 VariableInfo* VI(tokenid_t t) {
1999 if ( t < TOK_SYMBOL || ((size_t) (t-TOK_SYMBOL)) >= mTokenTable.size()) {
2000 internalError();
2001 }
Jack Palevich569f1352009-06-29 14:29:08 -07002002 VariableInfo* pV = mTokenTable[t].mpVariableInfo;
2003 if (pV && pV->tok != t) {
2004 internalError();
2005 }
2006 return pV;
2007 }
2008
2009 inline bool isDefined(tokenid_t t) {
2010 return t >= TOK_SYMBOL && VI(t) != 0;
2011 }
2012
2013 inline const char* nameof(tokenid_t t) {
2014 return mTokenTable[t].pText;
2015 }
2016
Jack Palevich21a15a22009-05-11 14:49:29 -07002017 void pdef(int t) {
Jack Palevich303d8ff2009-06-11 19:06:24 -07002018 mTokenString.append(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07002019 }
2020
2021 void inp() {
2022 if (dptr) {
Jack Palevich653f42d2009-05-28 17:15:32 -07002023 ch = *dptr++;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002024 if (ch == 0) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002025 dptr = 0;
2026 ch = dch;
2027 }
2028 } else
Jack Palevicheedf9d22009-06-04 16:23:40 -07002029 ch = file->getChar();
Jack Palevichb7c81e92009-06-04 19:56:13 -07002030#if 0
2031 printf("ch='%c' 0x%x\n", ch, ch);
2032#endif
Jack Palevich21a15a22009-05-11 14:49:29 -07002033 }
2034
2035 int isid() {
Jack Palevich546b2242009-05-13 15:10:04 -07002036 return isalnum(ch) | (ch == '_');
Jack Palevich21a15a22009-05-11 14:49:29 -07002037 }
2038
Jack Palevichb4758ff2009-06-12 12:49:14 -07002039 /* read a character constant, advances ch to after end of constant */
2040 int getq() {
2041 int val = ch;
Jack Palevich21a15a22009-05-11 14:49:29 -07002042 if (ch == '\\') {
2043 inp();
Jack Palevichb4758ff2009-06-12 12:49:14 -07002044 if (isoctal(ch)) {
2045 // 1 to 3 octal characters.
2046 val = 0;
2047 for(int i = 0; i < 3; i++) {
2048 if (isoctal(ch)) {
2049 val = (val << 3) + ch - '0';
2050 inp();
2051 }
2052 }
2053 return val;
2054 } else if (ch == 'x' || ch == 'X') {
2055 // N hex chars
2056 inp();
2057 if (! isxdigit(ch)) {
2058 error("'x' character escape requires at least one digit.");
2059 } else {
2060 val = 0;
2061 while (isxdigit(ch)) {
2062 int d = ch;
2063 if (isdigit(d)) {
2064 d -= '0';
2065 } else if (d <= 'F') {
2066 d = d - 'A' + 10;
2067 } else {
2068 d = d - 'a' + 10;
2069 }
2070 val = (val << 4) + d;
2071 inp();
2072 }
2073 }
2074 } else {
2075 int val = ch;
2076 switch (ch) {
2077 case 'a':
2078 val = '\a';
2079 break;
2080 case 'b':
2081 val = '\b';
2082 break;
2083 case 'f':
2084 val = '\f';
2085 break;
2086 case 'n':
2087 val = '\n';
2088 break;
2089 case 'r':
2090 val = '\r';
2091 break;
2092 case 't':
2093 val = '\t';
2094 break;
2095 case 'v':
2096 val = '\v';
2097 break;
2098 case '\\':
2099 val = '\\';
2100 break;
2101 case '\'':
2102 val = '\'';
2103 break;
2104 case '"':
2105 val = '"';
2106 break;
2107 case '?':
2108 val = '?';
2109 break;
2110 default:
2111 error("Undefined character escape %c", ch);
2112 break;
2113 }
2114 inp();
2115 return val;
2116 }
2117 } else {
2118 inp();
Jack Palevich21a15a22009-05-11 14:49:29 -07002119 }
Jack Palevichb4758ff2009-06-12 12:49:14 -07002120 return val;
2121 }
2122
/* True when ch is one of the octal digits '0' through '7'. */
static bool isoctal(int ch) {
    return !(ch < '0' || ch > '7');
}
2126
2127 void next() {
2128 int l, a;
2129
Jack Palevich546b2242009-05-13 15:10:04 -07002130 while (isspace(ch) | (ch == '#')) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002131 if (ch == '#') {
2132 inp();
2133 next();
2134 if (tok == TOK_DEFINE) {
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002135 doDefine();
Jack Palevicheedf9d22009-06-04 16:23:40 -07002136 } else if (tok == TOK_PRAGMA) {
2137 doPragma();
2138 } else {
Jack Palevich303d8ff2009-06-11 19:06:24 -07002139 error("Unsupported preprocessor directive \"%s\"",
2140 mTokenString.getUnwrapped());
Jack Palevich21a15a22009-05-11 14:49:29 -07002141 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002142 }
2143 inp();
2144 }
2145 tokl = 0;
2146 tok = ch;
2147 /* encode identifiers & numbers */
2148 if (isid()) {
Jack Palevich303d8ff2009-06-11 19:06:24 -07002149 mTokenString.clear();
Jack Palevich21a15a22009-05-11 14:49:29 -07002150 while (isid()) {
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002151 pdef(ch);
2152 inp();
Jack Palevichae54f1f2009-05-08 14:54:15 -07002153 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002154 if (isdigit(tok)) {
Jack Palevich303d8ff2009-06-11 19:06:24 -07002155 tokc = strtol(mTokenString.getUnwrapped(), 0, 0);
Jack Palevich21a15a22009-05-11 14:49:29 -07002156 tok = TOK_NUM;
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002157 } else {
Jack Palevich569f1352009-06-29 14:29:08 -07002158 tok = mTokenTable.intern(mTokenString.getUnwrapped(),
2159 mTokenString.len());
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002160 // Is this a macro?
Jack Palevich569f1352009-06-29 14:29:08 -07002161 char* pMacroDefinition = mTokenTable[tok].mpMacroDefinition;
2162 if(pMacroDefinition) {
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002163 // Yes, it is a macro
Jack Palevich569f1352009-06-29 14:29:08 -07002164 dptr = pMacroDefinition;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002165 dch = ch;
2166 inp();
2167 next();
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002168 }
2169 }
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002170 } else {
Jack Palevich21a15a22009-05-11 14:49:29 -07002171 inp();
2172 if (tok == '\'') {
2173 tok = TOK_NUM;
Jack Palevichb4758ff2009-06-12 12:49:14 -07002174 tokc = getq();
2175 if (ch != '\'') {
2176 error("Expected a ' character, got %c", ch);
2177 } else {
2178 inp();
2179 }
Jack Palevich546b2242009-05-13 15:10:04 -07002180 } else if ((tok == '/') & (ch == '*')) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002181 inp();
Jack Palevich22e3e8e2009-06-12 13:12:55 -07002182 while (ch && ch != EOF) {
2183 while (ch != '*' && ch != EOF)
Jack Palevich21a15a22009-05-11 14:49:29 -07002184 inp();
2185 inp();
2186 if (ch == '/')
2187 ch = 0;
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002188 }
Jack Palevich22e3e8e2009-06-12 13:12:55 -07002189 if (ch == EOF) {
2190 error("End of file inside comment.");
2191 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002192 inp();
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002193 next();
Jack Palevichbd894902009-05-14 19:35:31 -07002194 } else if ((tok == '/') & (ch == '/')) {
2195 inp();
Jack Palevich22e3e8e2009-06-12 13:12:55 -07002196 while (ch && (ch != '\n') && (ch != EOF)) {
Jack Palevichbd894902009-05-14 19:35:31 -07002197 inp();
2198 }
2199 inp();
2200 next();
Jack Palevich21a15a22009-05-11 14:49:29 -07002201 } else {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002202 const char* t = operatorChars;
2203 int opIndex = 0;
Jack Palevich546b2242009-05-13 15:10:04 -07002204 while ((l = *t++) != 0) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002205 a = *t++;
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002206 tokl = operatorLevel[opIndex];
2207 tokc = opIndex;
Jack Palevich546b2242009-05-13 15:10:04 -07002208 if ((l == tok) & ((a == ch) | (a == '@'))) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002209#if 0
2210 printf("%c%c -> tokl=%d tokc=0x%x\n",
2211 l, a, tokl, tokc);
2212#endif
2213 if (a == ch) {
2214 inp();
2215 tok = TOK_DUMMY; /* dummy token for double tokens */
2216 }
2217 break;
2218 }
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002219 opIndex++;
2220 }
2221 if (l == 0) {
2222 tokl = 0;
2223 tokc = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002224 }
2225 }
2226 }
2227#if 0
2228 {
Jack Palevich569f1352009-06-29 14:29:08 -07002229 String buf;
2230 decodeToken(buf, tok);
Jack Palevich86351982009-06-30 18:09:56 -07002231 fprintf(stderr, "%s\n", buf.getUnwrapped());
2232 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002233#endif
2234 }
2235
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002236 void doDefine() {
Jack Palevich569f1352009-06-29 14:29:08 -07002237 next();
2238 tokenid_t name = tok;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002239 String* pName = new String();
2240 while (isspace(ch)) {
2241 inp();
2242 }
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002243 if (ch == '(') {
2244 delete pName;
2245 error("Defines with arguments not supported");
Jack Palevich0a280a02009-06-11 10:53:51 -07002246 return;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002247 }
2248 while (isspace(ch)) {
2249 inp();
2250 }
Jack Palevich569f1352009-06-29 14:29:08 -07002251 String value;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002252 while (ch != '\n' && ch != EOF) {
Jack Palevich569f1352009-06-29 14:29:08 -07002253 value.append(ch);
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002254 inp();
2255 }
Jack Palevich569f1352009-06-29 14:29:08 -07002256 char* pDefn = (char*)mGlobalArena.alloc(value.len() + 1);
2257 memcpy(pDefn, value.getUnwrapped(), value.len());
2258 pDefn[value.len()] = 0;
2259 mTokenTable[name].mpMacroDefinition = pDefn;
Jack Palevich2d11dfb2009-06-08 14:34:26 -07002260 }
2261
Jack Palevicheedf9d22009-06-04 16:23:40 -07002262 void doPragma() {
2263 // # pragma name(val)
2264 int state = 0;
2265 while(ch != EOF && ch != '\n' && state < 10) {
2266 switch(state) {
2267 case 0:
2268 if (isspace(ch)) {
2269 inp();
2270 } else {
2271 state++;
2272 }
2273 break;
2274 case 1:
2275 if (isalnum(ch)) {
2276 mPragmas.append(ch);
2277 inp();
2278 } else if (ch == '(') {
2279 mPragmas.append(0);
2280 inp();
2281 state++;
2282 } else {
2283 state = 11;
2284 }
2285 break;
2286 case 2:
2287 if (isalnum(ch)) {
2288 mPragmas.append(ch);
2289 inp();
2290 } else if (ch == ')') {
2291 mPragmas.append(0);
2292 inp();
2293 state = 10;
2294 } else {
2295 state = 11;
2296 }
2297 break;
2298 }
2299 }
2300 if(state != 10) {
2301 error("Unexpected pragma syntax");
2302 }
2303 mPragmaStringCount += 2;
2304 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002305
Jack Palevichac0e95e2009-05-29 13:53:44 -07002306 virtual void verror(const char* fmt, va_list ap) {
Jack Palevicheedf9d22009-06-04 16:23:40 -07002307 mErrorBuf.printf("%ld: ", file->getLine());
2308 mErrorBuf.vprintf(fmt, ap);
2309 mErrorBuf.printf("\n");
Jack Palevich21a15a22009-05-11 14:49:29 -07002310 }
2311
Jack Palevich8b0624c2009-05-20 12:12:06 -07002312 void skip(intptr_t c) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002313 if (tok != c) {
2314 error("'%c' expected", c);
2315 }
2316 next();
2317 }
2318
Jack Palevich86351982009-06-30 18:09:56 -07002319 bool accept(intptr_t c) {
2320 if (tok == c) {
2321 next();
2322 return true;
2323 }
2324 return false;
2325 }
2326
Jack Palevich21a15a22009-05-11 14:49:29 -07002327 /* l is one if '=' parsing wanted (quick hack) */
Jack Palevich8b0624c2009-05-20 12:12:06 -07002328 void unary(intptr_t l) {
Jack Palevich653f42d2009-05-28 17:15:32 -07002329 intptr_t n, t, a;
2330 int c;
Jack Palevicha6baa232009-06-12 11:25:59 -07002331 String tString;
Jack Palevich546b2242009-05-13 15:10:04 -07002332 t = 0;
Jack Palevichb4758ff2009-06-12 12:49:14 -07002333 n = 1; /* type of expression 0 = forward, 1 = value, other = lvalue */
Jack Palevich21a15a22009-05-11 14:49:29 -07002334 if (tok == '\"') {
Jack Palevich653f42d2009-05-28 17:15:32 -07002335 pGen->li((int) glo);
Jack Palevichb4758ff2009-06-12 12:49:14 -07002336 while (ch != '\"' && ch != EOF) {
2337 *allocGlobalSpace(1) = getq();
2338 }
2339 if (ch != '\"') {
2340 error("Unterminated string constant.");
Jack Palevich21a15a22009-05-11 14:49:29 -07002341 }
Jack Palevich653f42d2009-05-28 17:15:32 -07002342 *glo = 0;
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002343 /* align heap */
2344 allocGlobalSpace((char*) (((intptr_t) glo + 4) & -4) - glo);
Jack Palevich21a15a22009-05-11 14:49:29 -07002345 inp();
2346 next();
2347 } else {
2348 c = tokl;
2349 a = tokc;
2350 t = tok;
Jack Palevicha6baa232009-06-12 11:25:59 -07002351 tString = mTokenString;
Jack Palevich21a15a22009-05-11 14:49:29 -07002352 next();
2353 if (t == TOK_NUM) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002354 pGen->li(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07002355 } else if (c == 2) {
2356 /* -, +, !, ~ */
2357 unary(0);
Jack Palevich1cdef202009-05-22 12:06:27 -07002358 pGen->clearR1();
Jack Palevich21a15a22009-05-11 14:49:29 -07002359 if (t == '!')
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002360 pGen->gcmp(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07002361 else
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002362 pGen->genOp(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07002363 } else if (t == '(') {
2364 expr();
2365 skip(')');
2366 } else if (t == '*') {
2367 /* parse cast */
2368 skip('(');
2369 t = tok; /* get type */
2370 next(); /* skip int/char/void */
2371 next(); /* skip '*' or '(' */
2372 if (tok == '*') {
2373 /* function type */
2374 skip('*');
2375 skip(')');
2376 skip('(');
2377 skip(')');
2378 t = 0;
2379 }
2380 skip(')');
2381 unary(0);
2382 if (tok == '=') {
2383 next();
Jack Palevich1cdef202009-05-22 12:06:27 -07002384 pGen->pushR0();
Jack Palevich21a15a22009-05-11 14:49:29 -07002385 expr();
Jack Palevich1cdef202009-05-22 12:06:27 -07002386 pGen->popR1();
2387 pGen->storeR0ToR1(t == TOK_INT);
Jack Palevich21a15a22009-05-11 14:49:29 -07002388 } else if (t) {
Jack Palevich1cdef202009-05-22 12:06:27 -07002389 pGen->loadR0FromR0(t == TOK_INT);
Jack Palevich21a15a22009-05-11 14:49:29 -07002390 }
2391 } else if (t == '&') {
Jack Palevich569f1352009-06-29 14:29:08 -07002392 pGen->leaR0((int) VI(tok)->pAddress);
Jack Palevich21a15a22009-05-11 14:49:29 -07002393 next();
Jack Palevich303d8ff2009-06-11 19:06:24 -07002394 } else if (t == EOF ) {
2395 error("Unexpected EOF.");
Jack Palevicha1804dd2009-06-12 14:40:04 -07002396 } else if (!checkSymbol(t, &tString)) {
2397 // Don't have to do anything special here, the error
2398 // message was printed by checkSymbol() above.
Jack Palevich21a15a22009-05-11 14:49:29 -07002399 } else {
Jack Palevich569f1352009-06-29 14:29:08 -07002400 if (!isDefined(t)) {
2401 mGlobals.add(t);
2402 // printf("Adding new global function %s\n", nameof(t));
Jack Palevich303d8ff2009-06-11 19:06:24 -07002403 }
2404
Jack Palevich569f1352009-06-29 14:29:08 -07002405 n = (intptr_t) VI(t)->pAddress;
Jack Palevich21a15a22009-05-11 14:49:29 -07002406 /* forward reference: try dlsym */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07002407 if (!n) {
Jack Palevich303d8ff2009-06-11 19:06:24 -07002408 n = (intptr_t) dlsym(RTLD_DEFAULT,
Jack Palevicha6baa232009-06-12 11:25:59 -07002409 tString.getUnwrapped());
Jack Palevich569f1352009-06-29 14:29:08 -07002410 VI(t)->pAddress = (void*) n;
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07002411 }
Jack Palevich546b2242009-05-13 15:10:04 -07002412 if ((tok == '=') & l) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002413 /* assignment */
2414 next();
2415 expr();
Jack Palevich1cdef202009-05-22 12:06:27 -07002416 pGen->storeR0(n);
Jack Palevich21a15a22009-05-11 14:49:29 -07002417 } else if (tok != '(') {
2418 /* variable */
Jack Palevicha6baa232009-06-12 11:25:59 -07002419 if (!n) {
2420 error("Undefined variable %s", tString.getUnwrapped());
2421 }
Jack Palevich1cdef202009-05-22 12:06:27 -07002422 pGen->loadR0(n, tokl == 11, tokc);
Jack Palevich21a15a22009-05-11 14:49:29 -07002423 if (tokl == 11) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002424 next();
2425 }
2426 }
2427 }
2428 }
2429
2430 /* function call */
2431 if (tok == '(') {
2432 if (n == 1)
Jack Palevich1cdef202009-05-22 12:06:27 -07002433 pGen->pushR0();
Jack Palevich21a15a22009-05-11 14:49:29 -07002434
2435 /* push args and invert order */
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07002436 a = pGen->beginFunctionCallArguments();
Jack Palevich21a15a22009-05-11 14:49:29 -07002437 next();
2438 l = 0;
Jack Palevichb4758ff2009-06-12 12:49:14 -07002439 while (tok != ')' && tok != EOF) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002440 expr();
Jack Palevich1cdef202009-05-22 12:06:27 -07002441 pGen->storeR0ToArg(l);
Jack Palevichbbf8ab52009-05-11 11:54:30 -07002442 if (tok == ',')
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002443 next();
Jack Palevich21a15a22009-05-11 14:49:29 -07002444 l = l + 4;
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002445 }
Jack Palevichcb1c9ef2009-05-14 11:38:49 -07002446 pGen->endFunctionCallArguments(a, l);
Jack Palevichb4758ff2009-06-12 12:49:14 -07002447 skip(')');
Jack Palevich21a15a22009-05-11 14:49:29 -07002448 if (!n) {
2449 /* forward reference */
Jack Palevich569f1352009-06-29 14:29:08 -07002450 VariableInfo* pVI = VI(t);
2451 pVI->pForward = (void*) pGen->callForward((int) pVI->pForward);
Jack Palevich21a15a22009-05-11 14:49:29 -07002452 } else if (n == 1) {
2453 pGen->callIndirect(l);
Jack Palevich21a15a22009-05-11 14:49:29 -07002454 } else {
Jack Palevich7810bc92009-05-15 14:31:47 -07002455 pGen->callRelative(n - codeBuf.getPC() - pGen->jumpOffset());
Jack Palevich21a15a22009-05-11 14:49:29 -07002456 }
-b master422972c2009-06-17 19:13:52 -07002457 pGen->adjustStackAfterCall(l, n == 1);
Jack Palevich21a15a22009-05-11 14:49:29 -07002458 }
2459 }
2460
Jack Palevich653f42d2009-05-28 17:15:32 -07002461 void sum(int l) {
Jack Palevich8b0624c2009-05-20 12:12:06 -07002462 intptr_t t, n, a;
Jack Palevich546b2242009-05-13 15:10:04 -07002463 t = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002464 if (l-- == 1)
2465 unary(1);
2466 else {
2467 sum(l);
2468 a = 0;
2469 while (l == tokl) {
2470 n = tok;
2471 t = tokc;
2472 next();
2473
2474 if (l > 8) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002475 a = pGen->gtst(t == OP_LOGICAL_OR, a); /* && and || output code generation */
Jack Palevich21a15a22009-05-11 14:49:29 -07002476 sum(l);
2477 } else {
Jack Palevich1cdef202009-05-22 12:06:27 -07002478 pGen->pushR0();
Jack Palevich21a15a22009-05-11 14:49:29 -07002479 sum(l);
Jack Palevich1cdef202009-05-22 12:06:27 -07002480 pGen->popR1();
Jack Palevich21a15a22009-05-11 14:49:29 -07002481
Jack Palevich546b2242009-05-13 15:10:04 -07002482 if ((l == 4) | (l == 5)) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002483 pGen->gcmp(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07002484 } else {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002485 pGen->genOp(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07002486 }
2487 }
2488 }
2489 /* && and || output code generation */
2490 if (a && l > 8) {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002491 a = pGen->gtst(t == OP_LOGICAL_OR, a);
2492 pGen->li(t != OP_LOGICAL_OR);
Jack Palevicha6535612009-05-13 16:24:17 -07002493 pGen->gjmp(5); /* jmp $ + 5 (sizeof li, FIXME for ARM) */
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002494 pGen->gsym(a);
2495 pGen->li(t == OP_LOGICAL_OR);
Jack Palevich21a15a22009-05-11 14:49:29 -07002496 }
2497 }
2498 }
2499
2500 void expr() {
2501 sum(11);
2502 }
2503
2504 int test_expr() {
2505 expr();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002506 return pGen->gtst(0, 0);
Jack Palevich21a15a22009-05-11 14:49:29 -07002507 }
2508
Jack Palevicha6baa232009-06-12 11:25:59 -07002509 void block(intptr_t l, bool outermostFunctionBlock) {
Jack Palevich8b0624c2009-05-20 12:12:06 -07002510 intptr_t a, n, t;
Jack Palevich21a15a22009-05-11 14:49:29 -07002511
Jack Palevicha1804dd2009-06-12 14:40:04 -07002512 if (tok == TOK_INT || tok == TOK_CHAR) {
2513 /* declarations */
2514 localDeclarations();
2515 } else if (tok == TOK_IF) {
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002516 next();
2517 skip('(');
Jack Palevich21a15a22009-05-11 14:49:29 -07002518 a = test_expr();
2519 skip(')');
Jack Palevicha6baa232009-06-12 11:25:59 -07002520 block(l, false);
Jack Palevich21a15a22009-05-11 14:49:29 -07002521 if (tok == TOK_ELSE) {
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002522 next();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002523 n = pGen->gjmp(0); /* jmp */
2524 pGen->gsym(a);
Jack Palevicha6baa232009-06-12 11:25:59 -07002525 block(l, false);
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002526 pGen->gsym(n); /* patch else jmp */
Jack Palevich21a15a22009-05-11 14:49:29 -07002527 } else {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002528 pGen->gsym(a); /* patch if test */
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002529 }
Jack Palevich546b2242009-05-13 15:10:04 -07002530 } else if ((tok == TOK_WHILE) | (tok == TOK_FOR)) {
Jack Palevich21a15a22009-05-11 14:49:29 -07002531 t = tok;
2532 next();
2533 skip('(');
2534 if (t == TOK_WHILE) {
Jack Palevicha6535612009-05-13 16:24:17 -07002535 n = codeBuf.getPC(); // top of loop, target of "next" iteration
Jack Palevich21a15a22009-05-11 14:49:29 -07002536 a = test_expr();
2537 } else {
2538 if (tok != ';')
2539 expr();
2540 skip(';');
2541 n = codeBuf.getPC();
2542 a = 0;
2543 if (tok != ';')
2544 a = test_expr();
2545 skip(';');
2546 if (tok != ')') {
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002547 t = pGen->gjmp(0);
Jack Palevich21a15a22009-05-11 14:49:29 -07002548 expr();
Jack Palevicha6535612009-05-13 16:24:17 -07002549 pGen->gjmp(n - codeBuf.getPC() - pGen->jumpOffset());
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002550 pGen->gsym(t);
Jack Palevich21a15a22009-05-11 14:49:29 -07002551 n = t + 4;
2552 }
2553 }
2554 skip(')');
Jack Palevicha6baa232009-06-12 11:25:59 -07002555 block((intptr_t) &a, false);
Jack Palevicha6535612009-05-13 16:24:17 -07002556 pGen->gjmp(n - codeBuf.getPC() - pGen->jumpOffset()); /* jmp */
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002557 pGen->gsym(a);
Jack Palevich21a15a22009-05-11 14:49:29 -07002558 } else if (tok == '{') {
Jack Palevicha6baa232009-06-12 11:25:59 -07002559 if (! outermostFunctionBlock) {
Jack Palevich569f1352009-06-29 14:29:08 -07002560 mLocals.pushLevel();
Jack Palevicha6baa232009-06-12 11:25:59 -07002561 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002562 next();
Jack Palevich303d8ff2009-06-11 19:06:24 -07002563 while (tok != '}' && tok != EOF)
Jack Palevicha6baa232009-06-12 11:25:59 -07002564 block(l, false);
Jack Palevich303d8ff2009-06-11 19:06:24 -07002565 skip('}');
Jack Palevicha6baa232009-06-12 11:25:59 -07002566 if (! outermostFunctionBlock) {
Jack Palevich569f1352009-06-29 14:29:08 -07002567 mLocals.popLevel();
Jack Palevicha6baa232009-06-12 11:25:59 -07002568 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002569 } else {
2570 if (tok == TOK_RETURN) {
2571 next();
2572 if (tok != ';')
2573 expr();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002574 rsym = pGen->gjmp(rsym); /* jmp */
Jack Palevich21a15a22009-05-11 14:49:29 -07002575 } else if (tok == TOK_BREAK) {
2576 next();
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002577 *(int *) l = pGen->gjmp(*(int *) l);
Jack Palevich21a15a22009-05-11 14:49:29 -07002578 } else if (tok != ';')
2579 expr();
2580 skip(';');
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002581 }
2582 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002583
/* Kinds of type node. createType() asserts that a tag lies between
 * TY_INT and TY_PARAM inclusive, so new tags belong inside that range.
 */
enum TypeTag {
    TY_INT,
    TY_CHAR,
    TY_VOID,
    TY_POINTER,
    TY_FUNC,
    TY_PARAM
};
Jack Palevich21a15a22009-05-11 14:49:29 -07002587
Jack Palevich86351982009-06-30 18:09:56 -07002588 struct Type {
2589 TypeTag tag;
2590 tokenid_t id; // For function arguments
2591 Type* pHead;
2592 Type* pTail;
2593 };
2594
2595 Type* createType(TypeTag tag, Type* pHead, Type* pTail, Arena& arena) {
2596 assert(tag >= TY_INT && tag <= TY_PARAM);
2597 Type* pType = (Type*) arena.alloc(sizeof(Type));
2598 memset(pType, 0, sizeof(*pType));
2599 pType->tag = tag;
2600 pType->pHead = pHead;
2601 pType->pTail = pTail;
2602 return pType;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002603 }
2604
Jack Palevich86351982009-06-30 18:09:56 -07002605 void decodeType(String& buffer, Type* pType) {
2606 if (pType == NULL) {
2607 buffer.appendCStr("null");
2608 return;
2609 }
2610 buffer.append('(');
2611 String temp;
2612 if (pType->id != 0) {
2613 decodeToken(temp, pType->id);
2614 buffer.append(temp);
2615 buffer.append(' ');
2616 }
2617 bool printHead = false;
2618 bool printTail = false;
2619 switch (pType->tag) {
2620 case TY_INT:
2621 buffer.appendCStr("int");
2622 break;
2623 case TY_CHAR:
2624 buffer.appendCStr("char");
2625 break;
2626 case TY_VOID:
2627 buffer.appendCStr("void");
2628 break;
2629 case TY_POINTER:
2630 buffer.appendCStr("*");
2631 printHead = true;
2632 break;
2633 case TY_FUNC:
2634 buffer.appendCStr("func");
2635 printHead = true;
2636 printTail = true;
2637 break;
2638 case TY_PARAM:
2639 buffer.appendCStr("param");
2640 printHead = true;
2641 printTail = true;
2642 break;
2643 default:
2644 String temp;
2645 temp.printf("Unknown tag %d", pType->tag);
2646 buffer.append(temp);
2647 break;
2648 }
2649 if (printHead) {
2650 buffer.append(' ');
2651 decodeType(buffer, pType->pHead);
2652 }
2653 if (printTail) {
2654 buffer.append(' ');
2655 decodeType(buffer, pType->pTail);
2656 }
2657 buffer.append(')');
Jack Palevichb7c81e92009-06-04 19:56:13 -07002658 }
2659
Jack Palevich86351982009-06-30 18:09:56 -07002660 void printType(Type* pType) {
2661 String buffer;
2662 decodeType(buffer, pType);
2663 fprintf(stderr, "%s\n", buffer.getUnwrapped());
Jack Palevichb7c81e92009-06-04 19:56:13 -07002664 }
2665
Jack Palevich86351982009-06-30 18:09:56 -07002666 Type* acceptPrimitiveType(Arena& arena) {
2667 Type* pType;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002668 if (tok == TOK_INT) {
Jack Palevich86351982009-06-30 18:09:56 -07002669 pType = mkpInt;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002670 } else if (tok == TOK_CHAR) {
Jack Palevich86351982009-06-30 18:09:56 -07002671 pType = mkpChar;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002672 } else if (tok == TOK_VOID) {
Jack Palevich86351982009-06-30 18:09:56 -07002673 pType = mkpVoid;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002674 } else {
Jack Palevich86351982009-06-30 18:09:56 -07002675 return NULL;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002676 }
2677 next();
Jack Palevich86351982009-06-30 18:09:56 -07002678 return pType;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002679 }
2680
Jack Palevich86351982009-06-30 18:09:56 -07002681 Type* acceptDeclaration(const Type* pBaseType, Arena& arena) {
2682 Type* pType = createType(pBaseType->tag, pBaseType->pHead,
2683 pBaseType->pTail, arena);
2684 tokenid_t declName;
2685 if (pType) {
2686 pType = acceptDecl2(pType, declName, arena);
2687 pType->id = declName;
2688 // fprintf(stderr, "Parsed a declaration: ");
2689 // printType(pType);
2690 }
2691 return pType;
2692 }
2693
2694 Type* expectDeclaration(const Type* pBaseType, Arena& arena) {
2695 Type* pType = acceptDeclaration(pBaseType, arena);
2696 if (! pType) {
2697 error("Expected a declaration");
2698 }
2699 return pType;
2700 }
2701
2702 Type* acceptDecl2(Type* pType, tokenid_t& declName, Arena& arena) {
2703 while (tok == '*') {
2704 pType = createType(TY_POINTER, pType, NULL, arena);
Jack Palevichb7c81e92009-06-04 19:56:13 -07002705 next();
Jack Palevichb7c81e92009-06-04 19:56:13 -07002706 }
Jack Palevich86351982009-06-30 18:09:56 -07002707 pType = acceptDecl3(pType, declName, arena);
2708 return pType;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002709 }
2710
Jack Palevich86351982009-06-30 18:09:56 -07002711 Type* acceptDecl3(Type* pType, tokenid_t& declName, Arena& arena) {
2712 if (accept('(')) {
2713 pType = acceptDecl2(pType, declName, arena);
2714 skip(')');
2715 } else {
2716 declName = acceptSymbol();
2717 }
2718 while (tok == '(') {
2719 // Function declaration
2720 skip('(');
2721 Type* pTail = acceptArgs(arena);
2722 pType = createType(TY_FUNC, pType, pTail, arena);
2723 skip(')');
2724 }
2725 return pType;
2726 }
2727
2728 Type* acceptArgs(Arena& arena) {
2729 Type* pHead = NULL;
2730 Type* pTail = NULL;
2731 for(;;) {
2732 Type* pBaseArg = acceptPrimitiveType(arena);
2733 if (pBaseArg) {
2734 Type* pArg = acceptDeclaration(pBaseArg, arena);
2735 if (pArg) {
2736 Type* pParam = createType(TY_PARAM, pArg, NULL, arena);
2737 if (!pHead) {
2738 pHead = pParam;
2739 pTail = pParam;
2740 } else {
2741 pTail->pTail = pParam;
2742 pTail = pParam;
2743 }
2744 }
2745 }
2746 if (! accept(',')) {
2747 break;
2748 }
2749 }
2750 return pHead;
2751 }
2752
2753 Type* expectPrimitiveType(Arena& arena) {
2754 Type* pType = acceptPrimitiveType(arena);
2755 if (!pType) {
Jack Palevich569f1352009-06-29 14:29:08 -07002756 String buf;
2757 decodeToken(buf, tok);
2758 error("Expected a type, got %s", buf.getUnwrapped());
Jack Palevichb7c81e92009-06-04 19:56:13 -07002759 }
Jack Palevich86351982009-06-30 18:09:56 -07002760 return pType;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002761 }
2762
Jack Palevich86351982009-06-30 18:09:56 -07002763 void addGlobalSymbol(Type* pDecl) {
2764 tokenid_t t = pDecl->id;
2765 VariableInfo* pVI = VI(t);
Jack Palevich569f1352009-06-29 14:29:08 -07002766 if(pVI && pVI->pAddress) {
Jack Palevich86351982009-06-30 18:09:56 -07002767 reportDuplicate(t);
Jack Palevich569f1352009-06-29 14:29:08 -07002768 }
Jack Palevich86351982009-06-30 18:09:56 -07002769 mGlobals.add(pDecl);
Jack Palevicha6baa232009-06-12 11:25:59 -07002770 }
2771
Jack Palevich86351982009-06-30 18:09:56 -07002772 void reportDuplicate(tokenid_t t) {
2773 error("Duplicate definition of %s", nameof(t));
Jack Palevich303d8ff2009-06-11 19:06:24 -07002774 }
2775
Jack Palevich86351982009-06-30 18:09:56 -07002776 void addLocalSymbol(Type* pDecl) {
2777 tokenid_t t = pDecl->id;
2778 if (mLocals.isDefinedAtCurrentLevel(t)) {
2779 reportDuplicate(t);
Jack Palevich569f1352009-06-29 14:29:08 -07002780 }
Jack Palevich86351982009-06-30 18:09:56 -07002781 mLocals.add(pDecl);
Jack Palevich303d8ff2009-06-11 19:06:24 -07002782 }
2783
Jack Palevichb7c81e92009-06-04 19:56:13 -07002784 void localDeclarations() {
2785 intptr_t a;
Jack Palevich86351982009-06-30 18:09:56 -07002786 Type* pBaseType;
Jack Palevichb7c81e92009-06-04 19:56:13 -07002787
Jack Palevich86351982009-06-30 18:09:56 -07002788 while ((pBaseType = acceptPrimitiveType(mLocalArena)) != NULL) {
Jack Palevich22e3e8e2009-06-12 13:12:55 -07002789 while (tok != ';' && tok != EOF) {
Jack Palevich86351982009-06-30 18:09:56 -07002790 Type* pDecl = expectDeclaration(pBaseType, mLocalArena);
2791 if (!pDecl) {
2792 break;
Jack Palevicha6baa232009-06-12 11:25:59 -07002793 }
Jack Palevich86351982009-06-30 18:09:56 -07002794 int variableAddress = 0;
2795 addLocalSymbol(pDecl);
2796 loc = loc + 4;
2797 variableAddress = -loc;
2798 VI(pDecl->id)->pAddress = (void*) variableAddress;
2799 if (accept('=')) {
Jack Palevichd7461a72009-06-12 14:26:58 -07002800 /* assignment */
Jack Palevichd7461a72009-06-12 14:26:58 -07002801 expr();
2802 pGen->storeR0(variableAddress);
2803 }
Jack Palevichb7c81e92009-06-04 19:56:13 -07002804 if (tok == ',')
2805 next();
2806 }
2807 skip(';');
2808 }
2809 }
2810
Jack Palevichf1728be2009-06-12 13:53:51 -07002811 bool checkSymbol() {
Jack Palevicha1804dd2009-06-12 14:40:04 -07002812 return checkSymbol(tok, &mTokenString);
2813 }
2814
Jack Palevich569f1352009-06-29 14:29:08 -07002815 void decodeToken(String& buffer, tokenid_t token) {
2816 if (token == EOF ) {
2817 buffer.printf("EOF");
2818 } else if (token == TOK_NUM) {
2819 buffer.printf("numeric constant");
2820 } else if (token >= 0 && token < 256) {
Jack Palevich86351982009-06-30 18:09:56 -07002821 if (token < 32) {
2822 buffer.printf("'\\x%02x'", token);
2823 } else {
2824 buffer.printf("'%c'", token);
2825 }
Jack Palevich569f1352009-06-29 14:29:08 -07002826 } else if (token >= TOK_KEYWORD && token < TOK_SYMBOL) {
2827 buffer.printf("keyword \"%s\"", nameof(token));
2828 } else {
2829 buffer.printf("symbol \"%s\"", nameof(token));
2830 }
2831 }
2832
2833 bool checkSymbol(tokenid_t token, String* pText) {
2834 bool result = token >= TOK_SYMBOL;
Jack Palevichf1728be2009-06-12 13:53:51 -07002835 if (!result) {
2836 String temp;
Jack Palevich569f1352009-06-29 14:29:08 -07002837 decodeToken(temp, token);
Jack Palevichf1728be2009-06-12 13:53:51 -07002838 error("Expected symbol. Got %s", temp.getUnwrapped());
2839 }
2840 return result;
2841 }
2842
Jack Palevich86351982009-06-30 18:09:56 -07002843 tokenid_t acceptSymbol() {
2844 tokenid_t result = 0;
2845 if (tok >= TOK_SYMBOL) {
2846 result = tok;
2847 next();
2848 } else {
2849 String temp;
2850 decodeToken(temp, tok);
2851 error("Expected symbol. Got %s", temp.getUnwrapped());
2852 }
2853 return result;
2854 }
2855
Jack Palevichb7c81e92009-06-04 19:56:13 -07002856 void globalDeclarations() {
2857 while (tok != EOF) {
Jack Palevich86351982009-06-30 18:09:56 -07002858 Type* pBaseType = expectPrimitiveType(mGlobalArena);
2859 if (!pBaseType) {
Jack Palevichf1728be2009-06-12 13:53:51 -07002860 break;
2861 }
Jack Palevich86351982009-06-30 18:09:56 -07002862 Type* pDecl = expectDeclaration(pBaseType, mGlobalArena);
2863 if (!pDecl) {
2864 break;
Jack Palevicha6baa232009-06-12 11:25:59 -07002865 }
Jack Palevich86351982009-06-30 18:09:56 -07002866 if (! isDefined(pDecl->id)) {
2867 addGlobalSymbol(pDecl);
2868 }
2869 VariableInfo* name = VI(pDecl->id);
Jack Palevicha6baa232009-06-12 11:25:59 -07002870 if (name && name->pAddress) {
Jack Palevich86351982009-06-30 18:09:56 -07002871 error("Already defined global %s", nameof(pDecl->id));
Jack Palevicha6baa232009-06-12 11:25:59 -07002872 }
Jack Palevich86351982009-06-30 18:09:56 -07002873 if (pDecl->tag < TY_FUNC) {
Jack Palevichb7c81e92009-06-04 19:56:13 -07002874 // it's a variable declaration
2875 for(;;) {
Jack Palevich86351982009-06-30 18:09:56 -07002876 if (name && !name->pAddress) {
Jack Palevicha6baa232009-06-12 11:25:59 -07002877 name->pAddress = (int*) allocGlobalSpace(4);
2878 }
Jack Palevich86351982009-06-30 18:09:56 -07002879 if (accept('=')) {
Jack Palevichd7461a72009-06-12 14:26:58 -07002880 if (tok == TOK_NUM) {
2881 if (name) {
2882 * (int*) name->pAddress = tokc;
2883 }
2884 next();
2885 } else {
2886 error("Expected an integer constant");
2887 }
2888 }
Jack Palevich86351982009-06-30 18:09:56 -07002889 if (!accept(',')) {
Jack Palevichb7c81e92009-06-04 19:56:13 -07002890 break;
Jack Palevich21a15a22009-05-11 14:49:29 -07002891 }
Jack Palevich86351982009-06-30 18:09:56 -07002892 pDecl = expectDeclaration(pBaseType, mGlobalArena);
2893 if (!pDecl) {
2894 break;
2895 }
2896 if (! isDefined(pDecl->id)) {
2897 addGlobalSymbol(pDecl);
2898 }
2899 name = VI(pDecl->id);
Jack Palevich21a15a22009-05-11 14:49:29 -07002900 }
2901 skip(';');
2902 } else {
Jack Palevich86351982009-06-30 18:09:56 -07002903 // Function declaration
Jack Palevicha6baa232009-06-12 11:25:59 -07002904 if (name) {
2905 /* patch forward references (XXX: does not work for function
2906 pointers) */
2907 pGen->gsym((int) name->pForward);
2908 /* put function address */
2909 name->pAddress = (void*) codeBuf.getPC();
2910 }
Jack Palevich86351982009-06-30 18:09:56 -07002911 // Calculate stack offsets for parameters
Jack Palevich569f1352009-06-29 14:29:08 -07002912 mLocals.pushLevel();
Jack Palevichb7c81e92009-06-04 19:56:13 -07002913 intptr_t a = 8;
Jack Palevich546b2242009-05-13 15:10:04 -07002914 int argCount = 0;
Jack Palevich86351982009-06-30 18:09:56 -07002915 for (Type* pP = pDecl->pTail; pP; pP = pP->pTail) {
2916 Type* pArg = pP->pHead;
2917 addLocalSymbol(pArg);
2918 /* read param name and compute offset */
2919 VI(pArg->id)->pAddress = (void*) a;
2920 a = a + 4;
Jack Palevich546b2242009-05-13 15:10:04 -07002921 argCount++;
Jack Palevich21a15a22009-05-11 14:49:29 -07002922 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002923 rsym = loc = 0;
Jack Palevich546b2242009-05-13 15:10:04 -07002924 a = pGen->functionEntry(argCount);
Jack Palevicha6baa232009-06-12 11:25:59 -07002925 block(0, true);
Jack Palevichbf42c9c2009-05-12 12:48:35 -07002926 pGen->gsym(rsym);
Jack Palevich546b2242009-05-13 15:10:04 -07002927 pGen->functionExit(argCount, a, loc);
Jack Palevich569f1352009-06-29 14:29:08 -07002928 mLocals.popLevel();
Jack Palevich21a15a22009-05-11 14:49:29 -07002929 }
2930 }
2931 }
2932
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002933 char* allocGlobalSpace(int bytes) {
2934 if (glo - pGlobalBase + bytes > ALLOC_SIZE) {
2935 error("Global space exhausted");
Jack Palevich0a280a02009-06-11 10:53:51 -07002936 return NULL;
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002937 }
2938 char* result = glo;
2939 glo += bytes;
2940 return result;
2941 }
2942
Jack Palevich21a15a22009-05-11 14:49:29 -07002943 void cleanup() {
Jack Palevich21a15a22009-05-11 14:49:29 -07002944 if (pGlobalBase != 0) {
Jack Palevichf1f39cc2009-05-29 18:03:15 -07002945 free(pGlobalBase);
Jack Palevich21a15a22009-05-11 14:49:29 -07002946 pGlobalBase = 0;
2947 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002948 if (pGen) {
2949 delete pGen;
2950 pGen = 0;
2951 }
Jack Palevich1cdef202009-05-22 12:06:27 -07002952 if (file) {
2953 delete file;
2954 file = 0;
2955 }
Jack Palevich21a15a22009-05-11 14:49:29 -07002956 }
2957
2958 void clear() {
2959 tok = 0;
2960 tokc = 0;
2961 tokl = 0;
2962 ch = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002963 rsym = 0;
2964 loc = 0;
2965 glo = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002966 dptr = 0;
2967 dch = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002968 file = 0;
2969 pGlobalBase = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002970 pGen = 0;
Jack Palevicheedf9d22009-06-04 16:23:40 -07002971 mPragmaStringCount = 0;
Jack Palevich21a15a22009-05-11 14:49:29 -07002972 }
Jack Paleviche27bf3e2009-05-10 14:09:03 -07002973
Jack Palevich22305132009-05-13 10:58:45 -07002974 void setArchitecture(const char* architecture) {
2975 delete pGen;
2976 pGen = 0;
2977
2978 if (architecture != NULL) {
Jack Paleviche7b59062009-05-19 17:12:17 -07002979#ifdef PROVIDE_ARM_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -07002980 if (! pGen && strcmp(architecture, "arm") == 0) {
Jack Palevich22305132009-05-13 10:58:45 -07002981 pGen = new ARMCodeGenerator();
Jack Palevich8b0624c2009-05-20 12:12:06 -07002982 }
Jack Paleviche7b59062009-05-19 17:12:17 -07002983#endif
Jack Paleviche7b59062009-05-19 17:12:17 -07002984#ifdef PROVIDE_X86_CODEGEN
Jack Palevich8b0624c2009-05-20 12:12:06 -07002985 if (! pGen && strcmp(architecture, "x86") == 0) {
Jack Palevich22305132009-05-13 10:58:45 -07002986 pGen = new X86CodeGenerator();
Jack Palevich8b0624c2009-05-20 12:12:06 -07002987 }
Jack Paleviche7b59062009-05-19 17:12:17 -07002988#endif
Jack Palevich8b0624c2009-05-20 12:12:06 -07002989 if (!pGen ) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07002990 error("Unknown architecture %s\n", architecture);
Jack Palevich22305132009-05-13 10:58:45 -07002991 }
2992 }
2993
2994 if (pGen == NULL) {
Jack Paleviche7b59062009-05-19 17:12:17 -07002995#if defined(DEFAULT_ARM_CODEGEN)
Jack Palevich22305132009-05-13 10:58:45 -07002996 pGen = new ARMCodeGenerator();
Jack Paleviche7b59062009-05-19 17:12:17 -07002997#elif defined(DEFAULT_X86_CODEGEN)
2998 pGen = new X86CodeGenerator();
2999#endif
3000 }
3001 if (pGen == NULL) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07003002 error("No code generator defined.");
Jack Palevich0a280a02009-06-11 10:53:51 -07003003 } else {
3004 pGen->setErrorSink(this);
Jack Palevich22305132009-05-13 10:58:45 -07003005 }
3006 }
3007
Jack Palevich77ae76e2009-05-10 19:59:24 -07003008public:
// Compiler options. architecture starts out as 0 (none requested).
struct args {
    args() : architecture(0) {
    }
    const char* architecture;
};
3015
Jack Paleviche7b59062009-05-19 17:12:17 -07003016 Compiler() {
Jack Palevich21a15a22009-05-11 14:49:29 -07003017 clear();
Jack Paleviche27bf3e2009-05-10 14:09:03 -07003018 }
Jack Palevichbbf8ab52009-05-11 11:54:30 -07003019
Jack Paleviche7b59062009-05-19 17:12:17 -07003020 ~Compiler() {
Jack Palevich21a15a22009-05-11 14:49:29 -07003021 cleanup();
3022 }
3023
Jack Palevich1cdef202009-05-22 12:06:27 -07003024 int compile(const char* text, size_t textLength) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07003025 int result;
Jack Palevich0a280a02009-06-11 10:53:51 -07003026
3027 cleanup();
3028 clear();
Jack Palevich569f1352009-06-29 14:29:08 -07003029 mTokenTable.setArena(&mGlobalArena);
3030 mGlobals.setArena(&mGlobalArena);
3031 mGlobals.setTokenTable(&mTokenTable);
3032 mLocals.setArena(&mLocalArena);
3033 mLocals.setTokenTable(&mTokenTable);
3034
3035 internKeywords();
Jack Palevich86351982009-06-30 18:09:56 -07003036 createPrimitiveTypes();
Jack Palevich0a280a02009-06-11 10:53:51 -07003037 codeBuf.init(ALLOC_SIZE);
3038 setArchitecture(NULL);
3039 if (!pGen) {
3040 return -1;
3041 }
Jack Palevichb67b18f2009-06-11 21:12:23 -07003042#ifdef PROVIDE_TRACE_CODEGEN
3043 pGen = new TraceCodeGenerator(pGen);
3044#endif
3045 pGen->setErrorSink(this);
Jack Palevich0a280a02009-06-11 10:53:51 -07003046 pGen->init(&codeBuf);
3047 file = new TextInputStream(text, textLength);
Jack Palevich0a280a02009-06-11 10:53:51 -07003048 pGlobalBase = (char*) calloc(1, ALLOC_SIZE);
3049 glo = pGlobalBase;
Jack Palevich0a280a02009-06-11 10:53:51 -07003050 inp();
3051 next();
3052 globalDeclarations();
Jack Palevicha6baa232009-06-12 11:25:59 -07003053 checkForUndefinedForwardReferences();
Jack Palevich0a280a02009-06-11 10:53:51 -07003054 result = pGen->finishCompile();
3055 if (result == 0) {
3056 if (mErrorBuf.len()) {
3057 result = -2;
Jack Palevichac0e95e2009-05-29 13:53:44 -07003058 }
Jack Palevich8b0624c2009-05-20 12:12:06 -07003059 }
Jack Palevichac0e95e2009-05-29 13:53:44 -07003060 return result;
Jack Palevich21a15a22009-05-11 14:49:29 -07003061 }
3062
Jack Palevich86351982009-06-30 18:09:56 -07003063 void createPrimitiveTypes() {
3064 mkpInt = createType(TY_INT, NULL, NULL, mGlobalArena);
3065 mkpChar = createType(TY_CHAR, NULL, NULL, mGlobalArena);
3066 mkpVoid = createType(TY_VOID, NULL, NULL, mGlobalArena);
3067 }
3068
Jack Palevicha6baa232009-06-12 11:25:59 -07003069 void checkForUndefinedForwardReferences() {
Jack Palevich569f1352009-06-29 14:29:08 -07003070 mGlobals.forEach(static_ufrcFn, this);
Jack Palevicha6baa232009-06-12 11:25:59 -07003071 }
3072
Jack Palevich569f1352009-06-29 14:29:08 -07003073 static bool static_ufrcFn(VariableInfo* value, void* context) {
Jack Palevicha6baa232009-06-12 11:25:59 -07003074 Compiler* pCompiler = (Compiler*) context;
Jack Palevich569f1352009-06-29 14:29:08 -07003075 return pCompiler->undefinedForwardReferenceCheck(value);
Jack Palevicha6baa232009-06-12 11:25:59 -07003076 }
3077
Jack Palevich569f1352009-06-29 14:29:08 -07003078 bool undefinedForwardReferenceCheck(VariableInfo* value) {
Jack Palevicha6baa232009-06-12 11:25:59 -07003079 if (!value->pAddress && value->pForward) {
Jack Palevich569f1352009-06-29 14:29:08 -07003080 error("Undefined forward reference: %s",
3081 mTokenTable[value->tok].pText);
Jack Palevicha6baa232009-06-12 11:25:59 -07003082 }
3083 return true;
3084 }
3085
Jack Palevich21a15a22009-05-11 14:49:29 -07003086 int dump(FILE* out) {
3087 fwrite(codeBuf.getBase(), 1, codeBuf.getSize(), out);
3088 return 0;
3089 }
Jack Palevich77ae76e2009-05-10 19:59:24 -07003090
Jack Palevicha6535612009-05-13 16:24:17 -07003091 int disassemble(FILE* out) {
3092 return pGen->disassemble(out);
3093 }
3094
Jack Palevich1cdef202009-05-22 12:06:27 -07003095 /* Look through the symbol table to find a symbol.
3096 * If found, return its value.
3097 */
3098 void* lookup(const char* name) {
Jack Palevich569f1352009-06-29 14:29:08 -07003099 tokenid_t tok = mTokenTable.intern(name, strlen(name));
3100 VariableInfo* pVariableInfo = VI(tok);
Jack Palevich303d8ff2009-06-11 19:06:24 -07003101 if (pVariableInfo) {
3102 return pVariableInfo->pAddress;
Jack Palevich1cdef202009-05-22 12:06:27 -07003103 }
3104 return NULL;
3105 }
3106
Jack Palevicheedf9d22009-06-04 16:23:40 -07003107 void getPragmas(ACCsizei* actualStringCount,
3108 ACCsizei maxStringCount, ACCchar** strings) {
3109 int stringCount = mPragmaStringCount;
3110 if (actualStringCount) {
3111 *actualStringCount = stringCount;
3112 }
3113 if (stringCount > maxStringCount) {
3114 stringCount = maxStringCount;
3115 }
3116 if (strings) {
3117 char* pPragmas = mPragmas.getUnwrapped();
3118 while (stringCount-- > 0) {
3119 *strings++ = pPragmas;
3120 pPragmas += strlen(pPragmas) + 1;
3121 }
3122 }
3123 }
3124
Jack Palevichac0e95e2009-05-29 13:53:44 -07003125 char* getErrorMessage() {
Jack Palevicheedf9d22009-06-04 16:23:40 -07003126 return mErrorBuf.getUnwrapped();
Jack Palevichac0e95e2009-05-29 13:53:44 -07003127 }
3128
Jack Palevich77ae76e2009-05-10 19:59:24 -07003129};
3130
Jack Paleviche7b59062009-05-19 17:12:17 -07003131const char* Compiler::operatorChars =
Jack Palevichbf42c9c2009-05-12 12:48:35 -07003132 "++--*@/@%@+@-@<<>><=>=<@>@==!=&&||&@^@|@~@!@";
3133
Jack Paleviche7b59062009-05-19 17:12:17 -07003134const char Compiler::operatorLevel[] =
Jack Palevichbf42c9c2009-05-12 12:48:35 -07003135 {11, 11, 1, 1, 1, 2, 2, 3, 3, 4, 4, 4, 4,
3136 5, 5, /* ==, != */
3137 9, 10, /* &&, || */
3138 6, 7, 8, /* & ^ | */
3139 2, 2 /* ~ ! */
3140 };
3141
#ifdef PROVIDE_ARM_CODEGEN
// Out-of-class definition of the ARM generator's static disassembly stream.
FILE* Compiler::ARMCodeGenerator::disasmOut;
#endif
Jack Palevicha6535612009-05-13 16:24:17 -07003145
#ifdef PROVIDE_X86_CODEGEN
// Per-operator constants used by the x86 generator, one entry per operator
// in operatorChars order.
const int Compiler::X86CodeGenerator::operatorHelper[] = {
    0x1,         // ++
    0xff,        // --
    0xc1af0f,    // *
    0xf9f79991,  // /
    0xf9f79991,  // % (With manual assist to swap results)
    0xc801,      // +
    0xd8f7c829,  // -
    0xe0d391,    // <<
    0xf8d391,    // >>
    0xe,         // <=
    0xd,         // >=
    0xc,         // <
    0xf,         // >
    0x4,         // ==
    0x5,         // !=
    0x0,         // &&
    0x1,         // ||
    0xc821,      // &
    0xc831,      // ^
    0xc809,      // |
    0xd0f7,      // ~
    0x4          // !
};
#endif
Jack Palevichbf42c9c2009-05-12 12:48:35 -07003172
Jack Palevich1cdef202009-05-22 12:06:27 -07003173struct ACCscript {
3174 ACCscript() {
3175 text = 0;
3176 textLength = 0;
3177 accError = ACC_NO_ERROR;
3178 }
Jack Palevichbbf8ab52009-05-11 11:54:30 -07003179
Jack Palevich1cdef202009-05-22 12:06:27 -07003180 ~ACCscript() {
3181 delete text;
3182 }
Jack Palevich546b2242009-05-13 15:10:04 -07003183
Jack Palevich1cdef202009-05-22 12:06:27 -07003184 void setError(ACCenum error) {
3185 if (accError == ACC_NO_ERROR && error != ACC_NO_ERROR) {
3186 accError = error;
Jack Palevichbbf8ab52009-05-11 11:54:30 -07003187 }
3188 }
3189
Jack Palevich1cdef202009-05-22 12:06:27 -07003190 ACCenum getError() {
3191 ACCenum result = accError;
3192 accError = ACC_NO_ERROR;
Jack Palevich22305132009-05-13 10:58:45 -07003193 return result;
Jack Palevichbbf8ab52009-05-11 11:54:30 -07003194 }
3195
Jack Palevich1cdef202009-05-22 12:06:27 -07003196 Compiler compiler;
3197 char* text;
3198 int textLength;
3199 ACCenum accError;
3200};
3201
3202
3203extern "C"
3204ACCscript* accCreateScript() {
3205 return new ACCscript();
Jack Palevichbbf8ab52009-05-11 11:54:30 -07003206}
Jack Palevich1cdef202009-05-22 12:06:27 -07003207
3208extern "C"
3209ACCenum accGetError( ACCscript* script ) {
3210 return script->getError();
3211}
3212
3213extern "C"
3214void accDeleteScript(ACCscript* script) {
3215 delete script;
3216}
3217
3218extern "C"
3219void accScriptSource(ACCscript* script,
3220 ACCsizei count,
3221 const ACCchar ** string,
3222 const ACCint * length) {
3223 int totalLength = 0;
3224 for(int i = 0; i < count; i++) {
3225 int len = -1;
3226 const ACCchar* s = string[i];
3227 if (length) {
3228 len = length[i];
3229 }
3230 if (len < 0) {
3231 len = strlen(s);
3232 }
3233 totalLength += len;
3234 }
3235 delete script->text;
3236 char* text = new char[totalLength + 1];
3237 script->text = text;
3238 script->textLength = totalLength;
Jack Palevich09555c72009-05-27 12:25:55 -07003239 char* dest = text;
Jack Palevich1cdef202009-05-22 12:06:27 -07003240 for(int i = 0; i < count; i++) {
3241 int len = -1;
3242 const ACCchar* s = string[i];
3243 if (length) {
3244 len = length[i];
3245 }
3246 if (len < 0) {
3247 len = strlen(s);
3248 }
Jack Palevich09555c72009-05-27 12:25:55 -07003249 memcpy(dest, s, len);
3250 dest += len;
Jack Palevich1cdef202009-05-22 12:06:27 -07003251 }
3252 text[totalLength] = '\0';
3253}
3254
3255extern "C"
3256void accCompileScript(ACCscript* script) {
3257 int result = script->compiler.compile(script->text, script->textLength);
3258 if (result) {
3259 script->setError(ACC_INVALID_OPERATION);
3260 }
3261}
3262
3263extern "C"
3264void accGetScriptiv(ACCscript* script,
3265 ACCenum pname,
3266 ACCint * params) {
3267 switch (pname) {
3268 case ACC_INFO_LOG_LENGTH:
3269 *params = 0;
3270 break;
3271 }
3272}
3273
3274extern "C"
3275void accGetScriptInfoLog(ACCscript* script,
3276 ACCsizei maxLength,
3277 ACCsizei * length,
3278 ACCchar * infoLog) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07003279 char* message = script->compiler.getErrorMessage();
3280 int messageLength = strlen(message) + 1;
Jack Palevich1cdef202009-05-22 12:06:27 -07003281 if (length) {
Jack Palevichac0e95e2009-05-29 13:53:44 -07003282 *length = messageLength;
Jack Palevich1cdef202009-05-22 12:06:27 -07003283 }
Jack Palevichac0e95e2009-05-29 13:53:44 -07003284 if (infoLog && maxLength > 0) {
3285 int trimmedLength = maxLength < messageLength ?
3286 maxLength : messageLength;
3287 memcpy(infoLog, message, trimmedLength);
3288 infoLog[trimmedLength] = 0;
Jack Palevich1cdef202009-05-22 12:06:27 -07003289 }
3290}
3291
3292extern "C"
3293void accGetScriptLabel(ACCscript* script, const ACCchar * name,
3294 ACCvoid ** address) {
3295 void* value = script->compiler.lookup(name);
3296 if (value) {
3297 *address = value;
3298 } else {
3299 script->setError(ACC_INVALID_VALUE);
3300 }
3301}
3302
Jack Palevicheedf9d22009-06-04 16:23:40 -07003303extern "C"
3304void accGetPragmas(ACCscript* script, ACCsizei* actualStringCount,
3305 ACCsizei maxStringCount, ACCchar** strings){
3306 script->compiler.getPragmas(actualStringCount, maxStringCount, strings);
3307}
3308
-b master422972c2009-06-17 19:13:52 -07003309extern "C"
3310void accDisassemble(ACCscript* script) {
3311 script->compiler.disassemble(stderr);
3312}
3313
Jack Palevicheedf9d22009-06-04 16:23:40 -07003314
Jack Palevich1cdef202009-05-22 12:06:27 -07003315} // namespace acc
3316