Parser.java 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627
  1. package me.hammerle.snuviscript.token;
  import java.util.ArrayDeque;
  import java.util.HashMap;
  import java.util.LinkedList;
  import java.util.Stack;
  import java.util.function.Supplier;
  import me.hammerle.snuviscript.array.DynamicArray;
  import me.hammerle.snuviscript.code.Function;
  import me.hammerle.snuviscript.code.FunctionLoader;
  import me.hammerle.snuviscript.code.InputProvider;
  import me.hammerle.snuviscript.code.Instruction;
  import me.hammerle.snuviscript.code.JumpData;
  import me.hammerle.snuviscript.code.SignInverter;
  import me.hammerle.snuviscript.constants.ConstantBoolean;
  import me.hammerle.snuviscript.constants.ConstantDouble;
  import me.hammerle.snuviscript.constants.ConstantNull;
  import me.hammerle.snuviscript.constants.ConstantString;
  import me.hammerle.snuviscript.exceptions.PreScriptException;
  import static me.hammerle.snuviscript.token.TokenType.*;
  import me.hammerle.snuviscript.variable.ArrayVariable;
  import me.hammerle.snuviscript.variable.Variable;
  20. public class Parser
  21. {
  22. private final HashMap<String, Variable> vars = new HashMap<>();
  23. private final HashMap<String, Integer> labels = new HashMap<>();
  24. private boolean tryState = false;
  25. private boolean cancel = false;
  26. private class JumpWrapper
  27. {
  28. private final JumpData data;
  29. private final String function;
  30. public JumpWrapper(JumpData data, String function)
  31. {
  32. this.data = data;
  33. this.function = function;
  34. }
  35. }
  36. private final Stack<JumpWrapper> jumps = new Stack<>();
  37. private final Stack<JumpWrapper> loopJumps = new Stack<>();
  38. private final LinkedList<JumpData> breakContinueJumps = new LinkedList<>();
  39. private final Token[] tokens;
  40. private int current = 0;
  41. private int layer = 0;
  42. private final LinkedList<Instruction> inst = new LinkedList<>();
  43. public Parser(LinkedList<Token> tokens)
  44. {
  45. this.tokens = tokens.toArray(new Token[tokens.size()]);
  46. //tokens.forEach(t -> System.out.println(t));
  47. }
  48. // -------------------------------------------------------------------------
  49. // utility
  50. // -------------------------------------------------------------------------
  51. private boolean match(TokenType... types)
  52. {
  53. for(TokenType type : types)
  54. {
  55. if(check(type))
  56. {
  57. advance();
  58. return true;
  59. }
  60. }
  61. return false;
  62. }
  63. private boolean check(TokenType tokenType)
  64. {
  65. if(current >= tokens.length)
  66. {
  67. return false;
  68. }
  69. return tokens[current].getToken() == tokenType;
  70. }
  71. private Token advance()
  72. {
  73. if(current < tokens.length)
  74. {
  75. current++;
  76. }
  77. return previous();
  78. }
  79. private Token previous()
  80. {
  81. return tokens[current - 1];
  82. }
  83. private void consume(TokenType type, String s)
  84. {
  85. if(tokens[current].getToken() != type)
  86. {
  87. throw new PreScriptException(s, tokens[current].getLine());
  88. }
  89. current++;
  90. }
  91. private void peek(TokenType type, String s)
  92. {
  93. if(tokens[current].getToken() != type)
  94. {
  95. throw new PreScriptException(s, tokens[current].getLine());
  96. }
  97. }
  98. // -------------------------------------------------------------------------
  99. // parsing precedence layers
  100. // http://en.cppreference.com/w/c/language/operator_precedence
  101. // -------------------------------------------------------------------------
  102. private void addInstruction(int line, String function, InputProvider... in)
  103. {
  104. inst.add(new Instruction(line, (byte) layer, new Function(FunctionLoader.getFunction(function), in)));
  105. }
  106. public Instruction[] parseTokens()
  107. {
  108. while(current < tokens.length && tokens[current].getToken() != END_OF_FILE)
  109. {
  110. if(match(LABEL))
  111. {
  112. if(labels.put(previous().getData().toString(), inst.size()) != null)
  113. {
  114. throw new PreScriptException("label duplicate", previous().getLine());
  115. }
  116. match(SEMICOLON);
  117. }
  118. int line = tokens[current].getLine();
  119. inst.add(new Instruction(line, (byte) layer, parseExpression()));
  120. tryState = false;
  121. if(cancel)
  122. {
  123. cancel = false;
  124. continue;
  125. }
  126. if(match(OPEN_CURVED_BRACKET))
  127. {
  128. layer++;
  129. }
  130. else
  131. {
  132. consume(SEMICOLON, "unexpected token after expression: " + tokens[current]);
  133. }
  134. while(match(CLOSE_CURVED_BRACKET))
  135. {
  136. layer--;
  137. if(jumps.isEmpty())
  138. {
  139. throw new PreScriptException("} without a corresponding function and / or {", previous().getLine());
  140. }
  141. JumpWrapper data = jumps.pop();
  142. switch(data.function)
  143. {
  144. case "try":
  145. {
  146. peek(CATCH, "try without catch");
  147. data.data.setRelativeJump(inst.size());
  148. tryState = true;
  149. break;
  150. }
  151. case "catch":
  152. {
  153. data.data.setRelativeJump(inst.size());
  154. break;
  155. }
  156. case "else":
  157. case "elseif":
  158. case "if":
  159. {
  160. data.data.setRelativeJump(inst.size() + 1);
  161. addInstruction(previous().getLine(), "endif");
  162. break;
  163. }
  164. case "for":
  165. {
  166. loopJumps.pop();
  167. createBreakContinue(inst.size());
  168. JumpData jump = data.data;
  169. jump.setRelativeJump(inst.size());
  170. addInstruction(previous().getLine(), "next", new JumpData(-jump.getInt(null) - 1));
  171. break;
  172. }
  173. case "while":
  174. {
  175. loopJumps.pop();
  176. createBreakContinue(inst.size());
  177. JumpData jump = data.data;
  178. jump.setRelativeJump(inst.size() + 1);
  179. addInstruction(previous().getLine(), "wend", new JumpData(-jump.getInt(null) - 1));
  180. break;
  181. }
  182. }
  183. }
  184. }
  185. return inst.toArray(new Instruction[inst.size()]);
  186. }
  187. private void createBreakContinue(int current)
  188. {
  189. breakContinueJumps.forEach(jump -> jump.setRelativeJump(current));
  190. breakContinueJumps.clear();
  191. }
  192. private InputProvider binaryFunction(InputProvider left, Object t, InputProvider right)
  193. {
  194. return new Function(FunctionLoader.getFunction(t.toString()), new InputProvider[] {left, right});
  195. }
  196. private InputProvider unaryFunction(InputProvider in, Object t)
  197. {
  198. return new Function(FunctionLoader.getFunction(t.toString()), new InputProvider[] {in});
  199. }
  200. private InputProvider parseExpression()
  201. {
  202. return parseAssignment();
  203. }
  204. // level 14
  205. private InputProvider parseAssignment()
  206. {
  207. InputProvider expr = parseLogicalOr();
  208. while(match(SET, ADD_SET, SUB_SET, MUL_SET, DIV_SET, MOD_SET, LEFT_SHIFT_SET, RIGHT_SHIFT_SET, BIT_AND_SET, BIT_XOR_SET, BIT_OR_SET))
  209. {
  210. Token operator = previous();
  211. InputProvider right = parseAssignment();
  212. expr = binaryFunction(expr, operator, right);
  213. }
  214. return expr;
  215. }
  216. // level 12
  217. private InputProvider parseLogicalOr()
  218. {
  219. InputProvider expr = parseLogicalAnd();
  220. while(match(OR))
  221. {
  222. Token operator = previous();
  223. InputProvider right = parseLogicalAnd();
  224. expr = binaryFunction(expr, operator, right);
  225. }
  226. return expr;
  227. }
  228. // level 11
  229. private InputProvider parseLogicalAnd()
  230. {
  231. InputProvider expr = parseBitOr();
  232. while(match(AND))
  233. {
  234. Token operator = previous();
  235. InputProvider right = parseBitOr();
  236. expr = binaryFunction(expr, operator, right);
  237. }
  238. return expr;
  239. }
  240. // level 10
  241. private InputProvider parseBitOr()
  242. {
  243. InputProvider expr = parseBitXor();
  244. while(match(BIT_OR))
  245. {
  246. Token operator = previous();
  247. InputProvider right = parseBitXor();
  248. expr = binaryFunction(expr, operator, right);
  249. }
  250. return expr;
  251. }
  252. // level 9
  253. private InputProvider parseBitXor()
  254. {
  255. InputProvider expr = parseBitAnd();
  256. while(match(BIT_XOR))
  257. {
  258. Token operator = previous();
  259. InputProvider right = parseBitAnd();
  260. expr = binaryFunction(expr, operator, right);
  261. }
  262. return expr;
  263. }
  264. // level 8
  265. private InputProvider parseBitAnd()
  266. {
  267. InputProvider expr = parseEquality();
  268. while(match(BIT_AND))
  269. {
  270. Token operator = previous();
  271. InputProvider right = parseEquality();
  272. expr = binaryFunction(expr, operator, right);
  273. }
  274. return expr;
  275. }
  276. // level 7
  277. private InputProvider parseEquality()
  278. {
  279. InputProvider expr = parseComparison();
  280. while(match(EQUAL, NOT_EQUAL))
  281. {
  282. Token operator = previous();
  283. InputProvider right = parseComparison();
  284. expr = binaryFunction(expr, operator, right);
  285. }
  286. return expr;
  287. }
  288. // level 6
  289. private InputProvider parseComparison()
  290. {
  291. InputProvider expr = parseShifting();
  292. while(match(GREATER, GREATER_EQUAL, LESS, LESS_EQUAL))
  293. {
  294. Token operator = previous();
  295. InputProvider right = parseShifting();
  296. expr = binaryFunction(expr, operator, right);
  297. }
  298. return expr;
  299. }
  300. // level 5
  301. private InputProvider parseShifting()
  302. {
  303. InputProvider expr = parseAddition();
  304. while(match(LEFT_SHIFT, RIGHT_SHIFT))
  305. {
  306. Token operator = previous();
  307. InputProvider right = parseAddition();
  308. expr = binaryFunction(expr, operator, right);
  309. }
  310. return expr;
  311. }
  312. // level 4
  313. private InputProvider parseAddition()
  314. {
  315. InputProvider expr = parseMultiplication();
  316. while(match(SUB, ADD))
  317. {
  318. Token operator = previous();
  319. InputProvider right = parseMultiplication();
  320. expr = binaryFunction(expr, operator, right);
  321. }
  322. return expr;
  323. }
  324. // level 3
  325. private InputProvider parseMultiplication()
  326. {
  327. InputProvider expr = parseUnary();
  328. while(match(DIV, MUL, MOD))
  329. {
  330. Token operator = previous();
  331. InputProvider right = parseUnary();
  332. expr = binaryFunction(expr, operator, right);
  333. }
  334. return expr;
  335. }
  336. // level 2
  337. private InputProvider parseUnary()
  338. {
  339. if(match(INVERT, SUB, BIT_INVERT, INC, DEC))
  340. {
  341. if(previous().getToken() == SUB)
  342. {
  343. return new SignInverter(parseUnary());
  344. }
  345. Token operator = previous();
  346. InputProvider right = parseUnary();
  347. return unaryFunction(right, operator);
  348. }
  349. return parsePost();
  350. }
  351. // level 1
  352. private InputProvider parsePost()
  353. {
  354. InputProvider expr = primary();
  355. while(true)
  356. {
  357. if(match(INC, DEC))
  358. {
  359. Token operator = previous();
  360. expr = unaryFunction(expr, "p" + operator);
  361. }
  362. else if(match(OPEN_BRACKET))
  363. {
  364. expr = new Function(FunctionLoader.getFunction(expr.toString()), parseArguments(CLOSE_BRACKET));
  365. }
  366. else if(match(OPEN_SQUARE_BRACKET))
  367. {
  368. String name = expr.toString();
  369. Variable oldVar = vars.get(name);
  370. if(oldVar == null)
  371. {
  372. oldVar = new ArrayVariable(name);
  373. vars.put(name, oldVar);
  374. }
  375. return new DynamicArray(oldVar, parseArguments(CLOSE_SQUARE_BRACKET));
  376. }
  377. else
  378. {
  379. break;
  380. }
  381. }
  382. return expr;
  383. }
  384. private InputProvider[] parseArguments(TokenType close)
  385. {
  386. if(match(close))
  387. {
  388. return new InputProvider[0];
  389. }
  390. LinkedList<InputProvider> list = new LinkedList<>();
  391. while(true)
  392. {
  393. list.add(parseExpression());
  394. if(match(close))
  395. {
  396. return list.toArray(new InputProvider[list.size()]);
  397. }
  398. consume(COMMA, "missing ',' in function");
  399. }
  400. }
  401. private InputProvider primary()
  402. {
  403. if(match(FALSE))
  404. {
  405. return ConstantBoolean.FALSE;
  406. }
  407. else if(match(TRUE))
  408. {
  409. return ConstantBoolean.TRUE;
  410. }
  411. else if(match(NULL))
  412. {
  413. return ConstantNull.NULL;
  414. }
  415. else if(match(DOUBLE))
  416. {
  417. return new ConstantDouble((double) previous().getData());
  418. }
  419. else if(match(TEXT))
  420. {
  421. return new ConstantString((String) previous().getData());
  422. }
  423. else if(match(VAR))
  424. {
  425. String name = (String) previous().getData();
  426. Variable v = vars.get(name);
  427. if(v == null)
  428. {
  429. v = new Variable(name);
  430. vars.put(name, v);
  431. }
  432. return v;
  433. }
  434. else if(match(IF, ELSE_IF))
  435. {
  436. String name = previous().getToken() == IF ? "if" : "elseif";
  437. consume(OPEN_BRACKET, "if without (");
  438. InputProvider[] input = parseArguments(CLOSE_BRACKET);
  439. InputProvider[] realInput = new InputProvider[input.length + 1];
  440. System.arraycopy(input, 0, realInput, 0, input.length);
  441. JumpData jump = new JumpData(inst.size());
  442. realInput[input.length] = jump;
  443. jumps.push(new JumpWrapper(jump, name));
  444. return new Function(FunctionLoader.getFunction(name), realInput);
  445. }
  446. else if(match(ELSE))
  447. {
  448. peek(OPEN_CURVED_BRACKET, "unexpected token after 'else': " + tokens[current]);
  449. JumpData jump = new JumpData(inst.size());
  450. jumps.push(new JumpWrapper(jump, "else"));
  451. return unaryFunction(jump, "else");
  452. }
  453. else if(match(FOR))
  454. {
  455. consume(OPEN_BRACKET, "for without (");
  456. // expected syntax
  457. // for(var, start, end, step)
  458. // for(var, start, end)
  459. InputProvider[] input = parseArguments(CLOSE_BRACKET);
  460. if(input.length != 3 && input.length != 4)
  461. {
  462. throw new PreScriptException("invalid 'for' syntax", previous().getLine());
  463. }
  464. InputProvider[] realInput = new InputProvider[5];
  465. System.arraycopy(input, 0, realInput, 0, input.length);
  466. if(input.length == 3)
  467. {
  468. realInput[3] = new ConstantDouble(1.0);
  469. }
  470. JumpData jump = new JumpData(inst.size());
  471. realInput[4] = jump;
  472. JumpWrapper wrapper = new JumpWrapper(jump, "for");
  473. jumps.push(wrapper);
  474. loopJumps.push(wrapper);
  475. return new Function(FunctionLoader.getFunction("for"), realInput);
  476. }
  477. else if(match(WHILE))
  478. {
  479. consume(OPEN_BRACKET, "for without (");
  480. // expected syntax
  481. // while(condition)
  482. InputProvider[] input = parseArguments(CLOSE_BRACKET);
  483. if(input.length != 1)
  484. {
  485. throw new PreScriptException("invalid conditions at 'while'", previous().getLine());
  486. }
  487. InputProvider[] realInput = new InputProvider[2];
  488. realInput[0] = input[0];
  489. JumpData jump = new JumpData(inst.size());
  490. realInput[1] = jump;
  491. JumpWrapper wrapper = new JumpWrapper(jump, "while");
  492. jumps.push(wrapper);
  493. loopJumps.push(wrapper);
  494. return new Function(FunctionLoader.getFunction("while"), realInput);
  495. }
  496. else if(match(FUNCTION))
  497. {
  498. cancel = true;
  499. int counter = 0;
  500. while(current < tokens.length && tokens[current].getToken() != OPEN_CURVED_BRACKET)
  501. {
  502. current++;
  503. }
  504. counter++;
  505. current++;
  506. while(current < tokens.length && counter != 0)
  507. {
  508. if(tokens[current].getToken() == OPEN_CURVED_BRACKET)
  509. {
  510. counter++;
  511. }
  512. else if(tokens[current].getToken() == CLOSE_CURVED_BRACKET)
  513. {
  514. counter--;
  515. }
  516. current++;
  517. }
  518. return new Function(FunctionLoader.getFunction("nothing"), new InputProvider[0]);
  519. }
  520. else if(match(BREAK))
  521. {
  522. if(loopJumps.isEmpty())
  523. {
  524. throw new PreScriptException("break without a loop", previous().getLine());
  525. }
  526. JumpData jump = new JumpData(inst.size() - 1);
  527. breakContinueJumps.add(jump);
  528. return unaryFunction(jump, "break");
  529. }
  530. else if(match(CONTINUE))
  531. {
  532. if(loopJumps.isEmpty())
  533. {
  534. throw new PreScriptException("continue without a loop", previous().getLine());
  535. }
  536. JumpData jump = new JumpData(inst.size());
  537. breakContinueJumps.add(jump);
  538. return unaryFunction(jump, "continue");
  539. }
  540. else if(match(RETURN))
  541. {
  542. if(match(SEMICOLON))
  543. {
  544. current--;
  545. return new Function(FunctionLoader.getFunction("return"), new InputProvider[0]);
  546. }
  547. return unaryFunction(parseExpression(), "return");
  548. }
  549. else if(match(TRY))
  550. {
  551. peek(OPEN_CURVED_BRACKET, "unexpected token after 'try': " + tokens[current]);
  552. JumpData jump = new JumpData(inst.size());
  553. jumps.push(new JumpWrapper(jump, "try"));
  554. return unaryFunction(jump, "try");
  555. }
  556. else if(match(CATCH))
  557. {
  558. if(!tryState)
  559. {
  560. throw new PreScriptException("catch without try", previous().getLine());
  561. }
  562. peek(OPEN_CURVED_BRACKET, "unexpected token after 'catch': " + tokens[current]);
  563. JumpData jump = new JumpData(inst.size());
  564. jumps.push(new JumpWrapper(jump, "catch"));
  565. return unaryFunction(jump, "catch");
  566. }
  567. else if(match(OPEN_BRACKET))
  568. {
  569. InputProvider expr = parseExpression();
  570. consume(CLOSE_BRACKET, "'(' without ')'");
  571. return expr;
  572. }
  573. throw new PreScriptException("unexpected token: " + tokens[current], tokens[current].getLine());
  574. }
  575. }