12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715 |
- #include <setjmp.h>
- #include <stdarg.h>
- #include <stdio.h>
- #include "Compiler.h"
- #include "FunctionMap.h"
- #include "Operation.h"
- #include "StringIntMap.h"
- #include "Tokenizer.h"
- #define ERROR_LENGTH 256
- #define RETURN_BUFFER 16
- #define BREAK_BUFFER 32
- static jmp_buf errorJump;
- static char error[ERROR_LENGTH] = {'\0'};
- static ByteCode* code;
- static int16 line = 1;
- static int varIndex = 0;
- static StringIntMap vars[2];
- static FunctionMap functions;
- static int returns[RETURN_BUFFER];
- static int returnIndex = 0;
- static int returnState = 0;
- static int breaks[BREAK_BUFFER];
- static int breakIndex = 0;
- static int forWhileStack = 0;
- static void cError(const char* format, ...) {
- va_list args;
- va_start(args, format);
- vsnprintf(error, ERROR_LENGTH, format, args);
- va_end(args);
- longjmp(errorJump, 0);
- }
- static int cAddVar(const char* var) {
- int index = vars[varIndex].entries;
- simAdd(vars + varIndex, var, &index);
- return index;
- }
- static void cUnexpectedToken(Token t) {
- cError("unexpected token on line %d: %s", line, tGetTokenName(t));
- }
- static void cAddOperation(Operation token) {
- unsigned char c = token;
- bcAddBytes(code, &c, 1);
- }
- static int cReserveInt() {
- return bcReserveBytes(code, sizeof(int));
- }
- static void cSetInt(int p, int i) {
- bcSetBytes(code, p, &i, sizeof(int));
- }
- static void cAddInt(int i) {
- bcAddBytes(code, &i, sizeof(int));
- }
- static void cAddInt16(int16 i) {
- bcAddBytes(code, &i, sizeof(int16));
- }
- static void cAddFloat(float f) {
- bcAddBytes(code, &f, sizeof(float));
- }
- static int cAddPush(int offset) {
- cAddOperation(OP_PUSH_VARS);
- int p = cReserveInt();
- cAddInt(offset);
- return p;
- }
- static void cAddPop(int p, int vars) {
- cAddOperation(OP_POP_VARS);
- cAddInt(vars);
- cSetInt(p, vars);
- }
- static Token cReadTokenAndLine() {
- Token t = tReadToken();
- if(tReadInt16(&line)) {
- return t;
- }
- return T_END;
- }
- static void cConsumeToken(Token wanted) {
- Token t = cReadTokenAndLine();
- if(wanted != t) {
- cError("unexpected token on line %d: expected '%s' got '%s'", line, tGetTokenName(wanted), tGetTokenName(t));
- }
- }
- static bool cConsumeTokenIf(Token t) {
- if(tPeekToken() == t) {
- cReadTokenAndLine();
- return true;
- }
- return false;
- }
- static void cConstantInt() {
- int value;
- if(!tReadInt(&value)) {
- cError("int token without an int on line %d", line);
- }
- cAddOperation(OP_PUSH_INT);
- cAddInt(value);
- }
- static void cConstantFloat() {
- float value;
- if(!tReadFloat(&value)) {
- cError("float token without a float on line %d", line);
- }
- cAddOperation(OP_PUSH_FLOAT);
- cAddFloat(value);
- }
- static const char* cReadString() {
- const char* literal = tReadString();
- if(literal == NULL) {
- cError("literal without string on line %d", line);
- }
- return literal;
- }
- static void cGetVar(const char* var) {
- cAddOperation(OP_GET);
- cAddInt(cAddVar(var));
- }
- static void cExpression();
- static int cCallFunctionArguments() {
- int arguments = 0;
- while(!cConsumeTokenIf(T_CLOSE_BRACKET)) {
- arguments++;
- cExpression();
- if(cConsumeTokenIf(T_COMMA) && tPeekToken() == T_CLOSE_BRACKET) {
- cUnexpectedToken(tPeekToken());
- }
- }
- return arguments;
- }
- static void cCallFunction(const char* literal, bool noReturn) {
- cAddOperation(OP_PUSH_INT);
- cAddInt(0);
- int arguments = cCallFunctionArguments();
- Function* f = fmSearch(&functions, literal, arguments);
- cAddOperation(OP_GOSUB);
- if(f == NULL) {
- fmEnqueue(&functions, literal, arguments, line, cReserveInt(), noReturn);
- cAddInt(arguments);
- cAddOperation(OP_NOTHING);
- } else {
- if(!noReturn && !f->returns) {
- cError("function '%s' needs a return value on line %d", f->name, line);
- }
- cAddInt(f->address);
- cAddInt(arguments);
- if(f->returns && noReturn) {
- cAddOperation(OP_POP);
- }
- }
- }
- static void cPostIncrement(const char* literal) {
- cAddOperation(OP_POST_INCREMENT);
- cAddInt(cAddVar(literal));
- }
- static void cPostDecrement(const char* literal) {
- cAddOperation(OP_POST_DECREMENT);
- cAddInt(cAddVar(literal));
- }
- static void cLiteral() {
- const char* literal = cReadString();
- if(cConsumeTokenIf(T_OPEN_BRACKET)) {
- cCallFunction(literal, false);
- } else if(cConsumeTokenIf(T_INCREMENT)) {
- cPostIncrement(literal);
- } else if(cConsumeTokenIf(T_DECREMENT)) {
- cPostDecrement(literal);
- } else {
- cGetVar(literal);
- }
- }
- static void cPrimary() {
- Token t = cReadTokenAndLine();
- switch(t) {
- case T_INT: cConstantInt(); break;
- case T_FLOAT: cConstantFloat(); break;
- case T_NULL: cAddOperation(OP_PUSH_NULL); break;
- case T_TRUE: cAddOperation(OP_PUSH_TRUE); break;
- case T_FALSE: cAddOperation(OP_PUSH_FALSE); break;
- case T_OPEN_BRACKET:
- cExpression();
- cConsumeToken(T_CLOSE_BRACKET);
- break;
- case T_LITERAL: cLiteral(); break;
- default: cUnexpectedToken(t); break;
- }
- }
- static void cPreIncrement() {
- cConsumeToken(T_LITERAL);
- cAddOperation(OP_PRE_INCREMENT);
- cAddInt(cAddVar(cReadString()));
- }
- static void cPreDecrement() {
- cConsumeToken(T_LITERAL);
- cAddOperation(OP_PRE_DECREMENT);
- cAddInt(cAddVar(cReadString()));
- }
- static void cPreUnary() {
- if(cConsumeTokenIf(T_SUB)) {
- cPrimary();
- cAddOperation(OP_INVERT_SIGN);
- } else if(cConsumeTokenIf(T_INCREMENT)) {
- cPreIncrement();
- } else if(cConsumeTokenIf(T_DECREMENT)) {
- cPreDecrement();
- } else if(cConsumeTokenIf(T_NOT)) {
- int counter = 1;
- while(cConsumeTokenIf(T_NOT)) {
- counter++;
- }
- cPrimary();
- cAddOperation(OP_NOT);
- if((counter & 1) == 0) {
- cAddOperation(OP_NOT);
- }
- } else if(cConsumeTokenIf(T_BIT_NOT)) {
- cPrimary();
- cAddOperation(OP_BIT_NOT);
- } else {
- cPrimary();
- }
- }
- static void cMul() {
- cPreUnary();
- while(true) {
- if(cConsumeTokenIf(T_MUL)) {
- cPreUnary();
- cAddOperation(OP_MUL);
- } else if(cConsumeTokenIf(T_DIV)) {
- cPreUnary();
- cAddOperation(OP_DIV);
- } else if(cConsumeTokenIf(T_MOD)) {
- cPreUnary();
- cAddOperation(OP_MOD);
- } else {
- break;
- }
- }
- }
- static void cAdd() {
- cMul();
- while(true) {
- if(cConsumeTokenIf(T_ADD)) {
- cMul();
- cAddOperation(OP_ADD);
- } else if(cConsumeTokenIf(T_SUB)) {
- cMul();
- cAddOperation(OP_SUB);
- } else {
- break;
- }
- }
- }
- static void cShift() {
- cAdd();
- while(true) {
- if(cConsumeTokenIf(T_LEFT_SHIFT)) {
- cAdd();
- cAddOperation(OP_LEFT_SHIFT);
- } else if(cConsumeTokenIf(T_RIGHT_SHIFT)) {
- cAdd();
- cAddOperation(OP_RIGHT_SHIFT);
- } else {
- break;
- }
- }
- }
- static void cComparison() {
- cShift();
- while(true) {
- if(cConsumeTokenIf(T_LESS)) {
- cShift();
- cAddOperation(OP_LESS);
- } else if(cConsumeTokenIf(T_LESS_EQUAL)) {
- cShift();
- cAddOperation(OP_GREATER);
- cAddOperation(OP_NOT);
- } else if(cConsumeTokenIf(T_GREATER)) {
- cShift();
- cAddOperation(OP_GREATER);
- } else if(cConsumeTokenIf(T_GREATER_EQUAL)) {
- cShift();
- cAddOperation(OP_LESS);
- cAddOperation(OP_NOT);
- } else {
- break;
- }
- }
- }
- static void cEqual() {
- cComparison();
- while(true) {
- if(cConsumeTokenIf(T_EQUAL)) {
- cComparison();
- cAddOperation(OP_EQUAL);
- } else if(cConsumeTokenIf(T_NOT_EQUAL)) {
- cComparison();
- cAddOperation(OP_EQUAL);
- cAddOperation(OP_NOT);
- } else {
- break;
- }
- }
- }
- static void cBitAnd() {
- cEqual();
- while(cConsumeTokenIf(T_BIT_AND)) {
- cEqual();
- cAddOperation(OP_BIT_AND);
- }
- }
- static void cBitXor() {
- cBitAnd();
- while(cConsumeTokenIf(T_BIT_XOR)) {
- cBitAnd();
- cAddOperation(OP_BIT_XOR);
- }
- }
- static void cBitOr() {
- cBitXor();
- while(cConsumeTokenIf(T_BIT_OR)) {
- cBitXor();
- cAddOperation(OP_BIT_OR);
- }
- }
- static void cAnd() {
- cBitOr();
- while(cConsumeTokenIf(T_AND)) {
- cAddOperation(OP_DUPLICATE);
- cAddOperation(OP_IF_GOTO);
- int p = cReserveInt();
- cBitOr();
- cAddOperation(OP_AND);
- cSetInt(p, code->length);
- }
- }
- static void cOr() {
- cAnd();
- while(cConsumeTokenIf(T_OR)) {
- cAddOperation(OP_DUPLICATE);
- cAddOperation(OP_NOT);
- cAddOperation(OP_IF_GOTO);
- int p = cReserveInt();
- cAnd();
- cAddOperation(OP_OR);
- cSetInt(p, code->length);
- }
- }
// Compiles a full expression; logical or is the operator level that binds
// the weakest, so parsing starts there.
static void cExpression() {
    cOr();
}
- static void cSetVar(const char* literal) {
- cExpression();
- cAddOperation(OP_SET);
- cAddInt(cAddVar(literal));
- }
- static void cOperationSetVar(const char* literal, Operation op) {
- cGetVar(literal);
- cExpression();
- cAddOperation(op);
- cAddOperation(OP_SET);
- cAddInt(cAddVar(literal));
- }
- static void cLineLiteral() {
- const char* literal = cReadString();
- Token t = cReadTokenAndLine();
- switch(t) {
- case T_SET: cSetVar(literal); break;
- case T_ADD_SET: cOperationSetVar(literal, OP_ADD); break;
- case T_SUB_SET: cOperationSetVar(literal, OP_SUB); break;
- case T_MUL_SET: cOperationSetVar(literal, OP_MUL); break;
- case T_DIV_SET: cOperationSetVar(literal, OP_DIV); break;
- case T_MOD_SET: cOperationSetVar(literal, OP_MOD); break;
- case T_BIT_AND_SET: cOperationSetVar(literal, OP_BIT_AND); break;
- case T_BIT_OR_SET: cOperationSetVar(literal, OP_BIT_OR); break;
- case T_BIT_XOR_SET: cOperationSetVar(literal, OP_BIT_XOR); break;
- case T_LEFT_SHIFT_SET: cOperationSetVar(literal, OP_LEFT_SHIFT); break;
- case T_RIGHT_SHIFT_SET: cOperationSetVar(literal, OP_RIGHT_SHIFT); break;
- case T_OPEN_BRACKET: cCallFunction(literal, true); break;
- case T_INCREMENT:
- cPostIncrement(literal);
- cAddOperation(OP_POP);
- break;
- case T_DECREMENT:
- cPostDecrement(literal);
- cAddOperation(OP_POP);
- break;
- default: cUnexpectedToken(t);
- }
- }
- static int cFunctionArguments() {
- int arguments = 0;
- while(!cConsumeTokenIf(T_CLOSE_BRACKET)) {
- cConsumeToken(T_LITERAL);
- arguments++;
- cAddVar(cReadString());
- if(cConsumeTokenIf(T_COMMA) && tPeekToken() != T_LITERAL) {
- cUnexpectedToken(tPeekToken());
- }
- }
- return arguments;
- }
- static void cLine(Token t);
- static void cConsumeBody() {
- cConsumeToken(T_OPEN_CURVED_BRACKET);
- int oldLine = line;
- while(!cConsumeTokenIf(T_CLOSE_CURVED_BRACKET)) {
- Token t = cReadTokenAndLine();
- if(t == T_END) {
- cError("unexpected end of file: non closed curved bracket on line %d", oldLine);
- }
- cLine(t);
- }
- }
- static void cLinkReturns() {
- for(int i = 0; i < returnIndex; i++) {
- cSetInt(returns[i], vars[1].entries);
- }
- returnIndex = 0;
- }
- static void cFunctionBody(const char* name, int arguments) {
- int oldLine = line;
- cAddOperation(OP_GOTO);
- int gotoIndex = cReserveInt();
- int address = code->length;
- returnState = 0;
- int p = cAddPush(arguments);
- cConsumeBody(false);
- cAddPop(p, vars[1].entries);
- cLinkReturns();
- if(!fmAdd(&functions, name, arguments, address, returnState == 2)) {
- cError("function registered twice on line %d", oldLine);
- }
- cAddOperation(OP_RETURN);
- cSetInt(gotoIndex, code->length);
- }
- static void cFunction() {
- if(varIndex == 1) {
- cError("function inside function on line %d", line);
- }
- cConsumeToken(T_LITERAL);
- const char* name = cReadString();
- cConsumeToken(T_OPEN_BRACKET);
- varIndex = 1;
- vars[1].entries = 0;
- cFunctionBody(name, cFunctionArguments());
- varIndex = 0;
- }
- static void cAddReturn() {
- cAddOperation(OP_POP_VARS);
- returns[returnIndex++] = cReserveInt(vars);
- cAddOperation(OP_RETURN);
- }
- static void cReturn() {
- if(varIndex == 0) {
- cError("return without a function on line %d", line);
- } else if(returnIndex >= RETURN_BUFFER) {
- cError("too much returns in function around line %d", line);
- }
- if(cConsumeTokenIf(T_SEMICOLON)) {
- if(returnState == 2) {
- cError("mixed return type on line %d", line);
- }
- returnState = 1;
- cAddReturn();
- } else {
- if(returnState == 1) {
- cError("mixed return type on line %d", line);
- }
- returnState = 2;
- cExpression();
- cAddOperation(OP_SET_RETURN);
- cAddReturn();
- cConsumeToken(T_SEMICOLON);
- }
- }
- static void cPrint() {
- cExpression();
- cConsumeToken(T_SEMICOLON);
- cAddOperation(OP_PRINT);
- }
- static void cIf() {
- cConsumeToken(T_OPEN_BRACKET);
- cExpression();
- cConsumeToken(T_CLOSE_BRACKET);
- cAddOperation(OP_IF_GOTO);
- int ifP = cReserveInt();
- cConsumeBody(false);
- cSetInt(ifP, code->length);
- if(cConsumeTokenIf(T_ELSE)) {
- cAddOperation(OP_GOTO);
- int elseP = cReserveInt();
- cSetInt(ifP, code->length);
- if(cConsumeTokenIf(T_IF)) {
- cIf();
- } else {
- cConsumeBody(false);
- }
- cSetInt(elseP, code->length);
- }
- }
- static void cConsumeBreaks(int start, int address) {
- for(int i = start; i < breakIndex; i++) {
- cSetInt(breaks[i], address);
- }
- breakIndex = start;
- }
- static void cWhile() {
- int start = code->length;
- cConsumeToken(T_OPEN_BRACKET);
- cExpression();
- cConsumeToken(T_CLOSE_BRACKET);
- cAddOperation(OP_IF_GOTO);
- int ifP = cReserveInt();
- int breakStart = breakIndex;
- forWhileStack++;
- cConsumeBody(true);
- forWhileStack--;
- cAddOperation(OP_GOTO);
- cAddInt(start);
- cSetInt(ifP, code->length);
- cConsumeBreaks(breakStart, code->length);
- }
- static void cLineExpression(Token t) {
- switch(t) {
- case T_LITERAL: cLineLiteral(); break;
- case T_INCREMENT:
- cPreIncrement();
- cAddOperation(OP_POP);
- break;
- case T_DECREMENT:
- cPreDecrement();
- cAddOperation(OP_POP);
- break;
- default: cUnexpectedToken(t);
- }
- }
- static void cFor() {
- cConsumeToken(T_OPEN_BRACKET);
- cLineExpression(cReadTokenAndLine());
- cConsumeToken(T_SEMICOLON);
- int startCheck = code->length;
- cExpression();
- cConsumeToken(T_SEMICOLON);
- cAddOperation(OP_IF_GOTO);
- int end = cReserveInt();
- cAddOperation(OP_GOTO);
- int beginBody = cReserveInt();
- int startPerLoop = code->length;
- cLineExpression(cReadTokenAndLine());
- cAddOperation(OP_GOTO);
- cAddInt(startCheck);
- cConsumeToken(T_CLOSE_BRACKET);
- cSetInt(beginBody, code->length);
- int breakStart = breakIndex;
- forWhileStack++;
- cConsumeBody(true);
- forWhileStack--;
- cAddOperation(OP_GOTO);
- cAddInt(startPerLoop);
- cSetInt(end, code->length);
- cConsumeBreaks(breakStart, code->length);
- }
- static void cBreak() {
- if(forWhileStack == 0) {
- cError("break without for or while on line %d", line);
- } else if(breakIndex >= BREAK_BUFFER) {
- cError("too much breaks around line %d", line);
- }
- cAddOperation(OP_GOTO);
- breaks[breakIndex++] = cReserveInt();
- cConsumeToken(T_SEMICOLON);
- }
- static void cLine(Token t) {
- cAddOperation(OP_LINE);
- cAddInt16(line);
- switch(t) {
- case T_PRINT: cPrint(); break;
- case T_FUNCTION: cFunction(); break;
- case T_RETURN: cReturn(); break;
- case T_IF: cIf(); break;
- case T_WHILE: cWhile(); break;
- case T_FOR: cFor(); break;
- case T_BREAK: cBreak(); break;
- default: cLineExpression(t); cConsumeToken(T_SEMICOLON);
- }
- }
- static void cForEachLine() {
- Token t = cReadTokenAndLine();
- while(t != T_END) {
- cLine(t);
- t = cReadTokenAndLine();
- }
- }
- static void cLinkQueuedFunctions() {
- for(int i = 0; i < functions.queueEntries; i++) {
- Function* f = fmSearch(&functions, functions.queue[i].name, functions.queue[i].arguments);
- if(f == NULL) {
- cError("unknown function on line %d", functions.queue[i].line);
- } else if(!functions.queue[i].noReturn && !f->returns) {
- cError("function '%s' needs a return value on line %d", f->name, functions.queue[i].line);
- }
- cSetInt(functions.queue[i].reserved, f->address);
- if(functions.queue[i].noReturn && f->returns) {
- code->code[functions.queue[i].reserved + sizeof(int) * 2] = OP_POP;
- }
- }
- }
- static void cAllocAndCompile() {
- varIndex = 0;
- returnIndex = 0;
- returnState = 0;
- forWhileStack = 0;
- breakIndex = 0;
- simInit(vars);
- simInit(vars + 1);
- fmInit(&functions);
- if(!setjmp(errorJump)) {
- int p = cAddPush(0);
- cForEachLine();
- cAddPop(p, vars[varIndex].entries);
- cLinkQueuedFunctions();
- }
- fmDelete(&functions);
- simDelete(vars + 1);
- simDelete(vars);
- }
- ByteCode* cCompile() {
- error[0] = '\0';
- code = bcInit();
- cAllocAndCompile();
- if(error[0] != '\0') {
- bcDelete(code);
- return NULL;
- }
- return code;
- }
- const char* cGetError() {
- return error;
- }
|